/** ******************************************************************************* * Copyright (C) 1996-2010, International Business Machines Corporation and * * others. All Rights Reserved. * ******************************************************************************* */ package com.ibm.icu.impl; import java.io.DataInputStream; import java.io.IOException; import java.io.InputStream; import java.util.Arrays; /** *

Internal reader class for ICU data file uname.dat containing * Unicode codepoint name data.

This class simply reads unames.icu, authenticates that it is a valid * ICU data file and split its contents up into blocks of data for use in * com.ibm.icu.impl.UCharacterName. *

unames.icu which is in big-endian format is jared together with this * package.

* @author Syn Wee Quek * @since release 2.1, February 1st 2002 */ final class UCharacterNameReader implements ICUBinary.Authenticate { // public methods ---------------------------------------------------- public boolean isDataVersionAcceptable(byte version[]) { return version[0] == DATA_FORMAT_VERSION_[0]; } // protected constructor --------------------------------------------- /** *

Protected constructor.

* @param inputStream ICU uprop.dat file input stream * @exception IOException throw if data file fails authentication */ protected UCharacterNameReader(InputStream inputStream) throws IOException { ICUBinary.readHeader(inputStream, DATA_FORMAT_ID_, this); m_dataInputStream_ = new DataInputStream(inputStream); } // protected methods ------------------------------------------------- /** * Read and break up the stream of data passed in as arguments * and fills up UCharacterName. * If unsuccessful false will be returned. * @param data instance of datablock * @exception IOException thrown when there's a data error. */ protected void read(UCharacterName data) throws IOException { // reading index m_tokenstringindex_ = m_dataInputStream_.readInt(); m_groupindex_ = m_dataInputStream_.readInt(); m_groupstringindex_ = m_dataInputStream_.readInt(); m_algnamesindex_ = m_dataInputStream_.readInt(); // reading tokens int count = m_dataInputStream_.readChar(); char token[] = new char[count]; for (char i = 0; i < count; i ++) { token[i] = m_dataInputStream_.readChar(); } int size = m_groupindex_ - m_tokenstringindex_; byte tokenstr[] = new byte[size]; m_dataInputStream_.readFully(tokenstr); data.setToken(token, tokenstr); // reading the group information records count = m_dataInputStream_.readChar(); data.setGroupCountSize(count, GROUP_INFO_SIZE_); count *= GROUP_INFO_SIZE_; char group[] = new char[count]; for (int i = 0; i < count; i ++) { group[i] = m_dataInputStream_.readChar(); } size = m_algnamesindex_ - m_groupstringindex_; byte groupstring[] = new byte[size]; m_dataInputStream_.readFully(groupstring); data.setGroup(group, groupstring); count = m_dataInputStream_.readInt(); UCharacterName.AlgorithmName alg[] = new UCharacterName.AlgorithmName[count]; for (int i = 0; i < count; i ++) { UCharacterName.AlgorithmName an = readAlg(); if (an == null) { throw new IOException("unames.icu read error: Algorithmic names creation error"); } alg[i] = an; } data.setAlgorithm(alg); } /** *

Checking the file for the correct format.

* @param dataformatid * @param dataformatversion * @return true if the file format version is correct */ ///CLOVER:OFF protected boolean authenticate(byte dataformatid[], byte dataformatversion[]) { return Arrays.equals(DATA_FORMAT_ID_, dataformatid) && Arrays.equals(DATA_FORMAT_VERSION_, dataformatversion); } ///CLOVER:ON // private variables ------------------------------------------------- /** * Data input stream for names */ private DataInputStream m_dataInputStream_; /** * Size of the group information block in number of char */ private static final int GROUP_INFO_SIZE_ = 3; /** * Index of the offset information */ private int m_tokenstringindex_; private int m_groupindex_; private int m_groupstringindex_; private int m_algnamesindex_; /** * Size of an algorithmic name information group * start code point size + end code point size + type size + variant size + * size of data size */ private static final int ALG_INFO_SIZE_ = 12; /** * File format version and id that this class understands. * No guarantees are made if a older version is used */ private static final byte DATA_FORMAT_VERSION_[] = {(byte)0x1, (byte)0x0, (byte)0x0, (byte)0x0}; private static final byte DATA_FORMAT_ID_[] = {(byte)0x75, (byte)0x6E, (byte)0x61, (byte)0x6D}; // private methods --------------------------------------------------- /** * Reads an individual record of AlgorithmNames * @return an instance of AlgorithNames if read is successful otherwise null * @exception IOException thrown when file read error occurs or data is corrupted */ private UCharacterName.AlgorithmName readAlg() throws IOException { UCharacterName.AlgorithmName result = new UCharacterName.AlgorithmName(); int rangestart = m_dataInputStream_.readInt(); int rangeend = m_dataInputStream_.readInt(); byte type = m_dataInputStream_.readByte(); byte variant = m_dataInputStream_.readByte(); if (!result.setInfo(rangestart, rangeend, type, variant)) { return null; } int size = m_dataInputStream_.readChar(); if (type == UCharacterName.AlgorithmName.TYPE_1_) { char factor[] = new char[variant]; for (int j = 0; j < variant; j ++) { factor[j] = m_dataInputStream_.readChar(); } result.setFactor(factor); size -= (variant << 1); } StringBuilder prefix = new StringBuilder(); char c = (char)(m_dataInputStream_.readByte() & 0x00FF); while (c != 0) { prefix.append(c); c = (char)(m_dataInputStream_.readByte() & 0x00FF); } result.setPrefix(prefix.toString()); size -= (ALG_INFO_SIZE_ + prefix.length() + 1); if (size > 0) { byte string[] = new byte[size]; m_dataInputStream_.readFully(string); result.setFactorString(string); } return result; } }