/* * Copyright (c) 2005, 2009, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it * under the terms of the GNU General Public License version 2 only, as * published by the Free Software Foundation. Oracle designates this * particular file as subject to the "Classpath" exception as provided * by Oracle in the LICENSE file that accompanied this code. * * This code is distributed in the hope that it will be useful, but WITHOUT * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License * version 2 for more details (a copy is included in the LICENSE file that * accompanied this code). * * You should have received a copy of the GNU General Public License version * 2 along with this work; if not, write to the Free Software Foundation, * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. * * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA * or visit www.oracle.com if you need additional information or have any * questions. */ /* ******************************************************************************* * (C) Copyright IBM Corp. and others, 1996-2009 - All Rights Reserved * * * * The original version of this source code and documentation is copyrighted * * and owned by IBM, These materials are provided under terms of a License * * Agreement between IBM and Sun. This technology is protected by multiple * * US and International patents. This notice and attribution to IBM may not * * to removed. * ******************************************************************************* */ package sun.text.normalizer; import java.io.DataInputStream; import java.io.InputStream; import java.io.IOException; /** * <p>Internal reader class for ICU data file uprops.icu containing * Unicode codepoint data.</p> * <p>This class simply reads uprops.icu, authenticates that it is a valid * ICU data file and split its contents up into blocks of data for use in * <a href=UCharacterProperty.html>com.ibm.icu.impl.UCharacterProperty</a>. * </p> * <p>uprops.icu which is in big-endian format is jared together with this * package.</p> * * Unicode character properties file format see * (ICU4C)/source/tools/genprops/store.c * * @author Syn Wee Quek * @since release 2.1, February 1st 2002 */ final class UCharacterPropertyReader implements ICUBinary.Authenticate { // public methods ---------------------------------------------------- public boolean isDataVersionAcceptable(byte version[]) { return version[0] == DATA_FORMAT_VERSION_[0] && version[2] == DATA_FORMAT_VERSION_[2] && version[3] == DATA_FORMAT_VERSION_[3]; } // protected constructor --------------------------------------------- /** * <p>Protected constructor.</p> * @param inputStream ICU uprop.dat file input stream * @exception IOException throw if data file fails authentication */ protected UCharacterPropertyReader(InputStream inputStream) throws IOException { m_unicodeVersion_ = ICUBinary.readHeader(inputStream, DATA_FORMAT_ID_, this); m_dataInputStream_ = new DataInputStream(inputStream); } // protected methods ------------------------------------------------- /** * <p>Reads uprops.icu, parse it into blocks of data to be stored in * UCharacterProperty.</P * @param ucharppty UCharacterProperty instance * @exception IOException thrown when data reading fails */ protected void read(UCharacterProperty ucharppty) throws IOException { // read the indexes int count = INDEX_SIZE_; m_propertyOffset_ = m_dataInputStream_.readInt(); count --; m_exceptionOffset_ = m_dataInputStream_.readInt(); count --; m_caseOffset_ = m_dataInputStream_.readInt(); count --; m_additionalOffset_ = m_dataInputStream_.readInt(); count --; m_additionalVectorsOffset_ = m_dataInputStream_.readInt(); count --; m_additionalColumnsCount_ = m_dataInputStream_.readInt(); count --; m_reservedOffset_ = m_dataInputStream_.readInt(); count --; m_dataInputStream_.skipBytes(3 << 2); count -= 3; ucharppty.m_maxBlockScriptValue_ = m_dataInputStream_.readInt(); count --; // 10 ucharppty.m_maxJTGValue_ = m_dataInputStream_.readInt(); count --; // 11 m_dataInputStream_.skipBytes(count << 2); // read the trie index block // m_props_index_ in terms of ints ucharppty.m_trie_ = new CharTrie(m_dataInputStream_, null); // skip the 32 bit properties block int size = m_exceptionOffset_ - m_propertyOffset_; m_dataInputStream_.skipBytes(size * 4); // reads the 32 bit exceptions block size = m_caseOffset_ - m_exceptionOffset_; m_dataInputStream_.skipBytes(size * 4); // reads the 32 bit case block size = (m_additionalOffset_ - m_caseOffset_) << 1; m_dataInputStream_.skipBytes(size * 2); if(m_additionalColumnsCount_ > 0) { // reads the additional property block ucharppty.m_additionalTrie_ = new CharTrie(m_dataInputStream_, null); // additional properties size = m_reservedOffset_ - m_additionalVectorsOffset_; ucharppty.m_additionalVectors_ = new int[size]; for (int i = 0; i < size; i ++) { ucharppty.m_additionalVectors_[i] = m_dataInputStream_.readInt(); } } m_dataInputStream_.close(); ucharppty.m_additionalColumnsCount_ = m_additionalColumnsCount_; ucharppty.m_unicodeVersion_ = VersionInfo.getInstance( (int)m_unicodeVersion_[0], (int)m_unicodeVersion_[1], (int)m_unicodeVersion_[2], (int)m_unicodeVersion_[3]); } // private variables ------------------------------------------------- /** * Index size */ private static final int INDEX_SIZE_ = 16; /** * ICU data file input stream */ private DataInputStream m_dataInputStream_; /** * Offset information in the indexes. */ private int m_propertyOffset_; private int m_exceptionOffset_; private int m_caseOffset_; private int m_additionalOffset_; private int m_additionalVectorsOffset_; private int m_additionalColumnsCount_; private int m_reservedOffset_; private byte m_unicodeVersion_[]; /** * Data format "UPro". */ private static final byte DATA_FORMAT_ID_[] = {(byte)0x55, (byte)0x50, (byte)0x72, (byte)0x6F}; /** * Format version; this code works with all versions with the same major * version number and the same Trie bit distribution. */ private static final byte DATA_FORMAT_VERSION_[] = {(byte)0x5, (byte)0, (byte)Trie.INDEX_STAGE_1_SHIFT_, (byte)Trie.INDEX_STAGE_2_SHIFT_}; }