main/classes/core/src/com/ibm/icu/impl/UCharacterNameReader.java - external/github.com/unicode-org/icu - Git at Google

 /**
 *******************************************************************************
 * Copyright (C) 1996-2010, International Business Machines Corporation and    *
 * others. All Rights Reserved.                                                *
 *******************************************************************************
 */
 package com.ibm.icu.impl;

 import java.io.DataInputStream;
 import java.io.IOException;
 import java.io.InputStream;
 import java.util.Arrays;

 /**
 * <p>Internal reader class for ICU data file uname.dat containing
 * Unicode codepoint name data.</p>
 * <p>This class simply reads unames.icu, authenticates that it is a valid
 * ICU data file and split its contents up into blocks of data for use in
 * <a href=UCharacterName.html>com.ibm.icu.impl.UCharacterName</a>.
 * </p>
 * <p>unames.icu which is in big-endian format is jared together with this
 * package.</p>
 * @author Syn Wee Quek
 * @since release 2.1, February 1st 2002
 */

 final class UCharacterNameReader implements ICUBinary.Authenticate
 {
     // public methods ----------------------------------------------------

     public boolean isDataVersionAcceptable(byte version[])
     {
         return version[0] == DATA_FORMAT_VERSION_[0];
     }

     // protected constructor ---------------------------------------------

     /**
     * <p>Protected constructor.</p>
     * @param inputStream ICU uprop.dat file input stream
     * @exception IOException throw if data file fails authentication
     */
     protected UCharacterNameReader(InputStream inputStream)
                                                         throws IOException
     {
         ICUBinary.readHeader(inputStream, DATA_FORMAT_ID_, this);
         m_dataInputStream_ = new DataInputStream(inputStream);
     }

     // protected methods -------------------------------------------------

     /**
     * Read and break up the stream of data passed in as arguments
     * and fills up UCharacterName.
     * If unsuccessful false will be returned.
     * @param data instance of datablock
     * @exception IOException thrown when there's a data error.
     */
     protected void read(UCharacterName data) throws IOException
     {
         // reading index
         m_tokenstringindex_ = m_dataInputStream_.readInt();
         m_groupindex_       = m_dataInputStream_.readInt();
         m_groupstringindex_ = m_dataInputStream_.readInt();
         m_algnamesindex_    = m_dataInputStream_.readInt();

         // reading tokens
         int count = m_dataInputStream_.readChar();
         char token[] = new char[count];
         for (char i = 0; i < count; i ++) {
             token[i] = m_dataInputStream_.readChar();
         }
         int size = m_groupindex_ - m_tokenstringindex_;
         byte tokenstr[] = new byte[size];
         m_dataInputStream_.readFully(tokenstr);
         data.setToken(token, tokenstr);

         // reading the group information records
         count = m_dataInputStream_.readChar();
         data.setGroupCountSize(count, GROUP_INFO_SIZE_);
         count *= GROUP_INFO_SIZE_;
         char group[] = new char[count];
         for (int i = 0; i < count; i ++) {
             group[i] = m_dataInputStream_.readChar();
         }

         size = m_algnamesindex_ - m_groupstringindex_;
         byte groupstring[] = new byte[size];
         m_dataInputStream_.readFully(groupstring);

         data.setGroup(group, groupstring);

         count = m_dataInputStream_.readInt();
         UCharacterName.AlgorithmName alg[] =
                                  new UCharacterName.AlgorithmName[count];

         for (int i = 0; i < count; i ++)
         {
             UCharacterName.AlgorithmName an = readAlg();
             if (an == null) {
                 throw new IOException("unames.icu read error: Algorithmic names creation error");
             }
             alg[i] = an;
         }
         data.setAlgorithm(alg);
     }

     /**
     * <p>Checking the file for the correct format.</p>
     * @param dataformatid
     * @param dataformatversion
     * @return true if the file format version is correct
     */
     ///CLOVER:OFF
     protected boolean authenticate(byte dataformatid[],
                                    byte dataformatversion[])
     {
         return Arrays.equals(DATA_FORMAT_ID_, dataformatid) &&
                Arrays.equals(DATA_FORMAT_VERSION_, dataformatversion);
     }
     ///CLOVER:ON

     // private variables -------------------------------------------------

     /**
     * Data input stream for names
     */
     private DataInputStream m_dataInputStream_;
     /**
     * Size of the group information block in number of char
     */
     private static final int GROUP_INFO_SIZE_ = 3;

     /**
     * Index of the offset information
     */
     private int m_tokenstringindex_;
     private int m_groupindex_;
     private int m_groupstringindex_;
     private int m_algnamesindex_;

     /**
     * Size of an algorithmic name information group
     * start code point size + end code point size + type size + variant size +
     * size of data size
     */
     private static final int ALG_INFO_SIZE_ = 12;

     /**
     * File format version and id that this class understands.
     * No guarantees are made if a older version is used
     */
     private static final byte DATA_FORMAT_VERSION_[] =
                                     {(byte)0x1, (byte)0x0, (byte)0x0, (byte)0x0};
     private static final byte DATA_FORMAT_ID_[] = {(byte)0x75, (byte)0x6E,
                                                     (byte)0x61, (byte)0x6D};

     // private methods ---------------------------------------------------

     /**
     * Reads an individual record of AlgorithmNames
     * @return an instance of AlgorithNames if read is successful otherwise null
     * @exception IOException thrown when file read error occurs or data is corrupted
     */
     private UCharacterName.AlgorithmName readAlg() throws IOException
     {
         UCharacterName.AlgorithmName result =
                                        new UCharacterName.AlgorithmName();
         int rangestart = m_dataInputStream_.readInt();
         int rangeend   = m_dataInputStream_.readInt();
         byte type      = m_dataInputStream_.readByte();
         byte variant   = m_dataInputStream_.readByte();
         if (!result.setInfo(rangestart, rangeend, type, variant)) {
             return null;
         }

         int size = m_dataInputStream_.readChar();
         if (type == UCharacterName.AlgorithmName.TYPE_1_)
         {
             char factor[] = new char[variant];
             for (int j = 0; j < variant; j ++) {
                 factor[j] = m_dataInputStream_.readChar();
             }

             result.setFactor(factor);
             size -= (variant << 1);
         }

         StringBuilder prefix = new StringBuilder();
         char c = (char)(m_dataInputStream_.readByte() & 0x00FF);
         while (c != 0)
         {
             prefix.append(c);
             c = (char)(m_dataInputStream_.readByte() & 0x00FF);
         }

         result.setPrefix(prefix.toString());

         size -= (ALG_INFO_SIZE_ + prefix.length() + 1);

         if (size > 0)
         {
             byte string[] = new byte[size];
             m_dataInputStream_.readFully(string);
             result.setFactorString(string);
         }
         return result;
     }
 }
	/**
	*******************************************************************************
	* Copyright (C) 1996-2010, International Business Machines Corporation and *
	* others. All Rights Reserved. *
	*******************************************************************************
	*/
	package com.ibm.icu.impl;

	import java.io.DataInputStream;
	import java.io.IOException;
	import java.io.InputStream;
	import java.util.Arrays;

	/**
	* <p>Internal reader class for ICU data file uname.dat containing
	* Unicode codepoint name data.</p>
	* <p>This class simply reads unames.icu, authenticates that it is a valid
	* ICU data file and split its contents up into blocks of data for use in
	* <a href=UCharacterName.html>com.ibm.icu.impl.UCharacterName</a>.
	* </p>
	* <p>unames.icu which is in big-endian format is jared together with this
	* package.</p>
	* @author Syn Wee Quek
	* @since release 2.1, February 1st 2002
	*/

	final class UCharacterNameReader implements ICUBinary.Authenticate
	{
	// public methods ----------------------------------------------------

	public boolean isDataVersionAcceptable(byte version[])
	{
	return version[0] == DATA_FORMAT_VERSION_[0];
	}

	// protected constructor ---------------------------------------------

	/**
	* <p>Protected constructor.</p>
	* @param inputStream ICU uprop.dat file input stream
	* @exception IOException throw if data file fails authentication
	*/
	protected UCharacterNameReader(InputStream inputStream)
	throws IOException
	{
	ICUBinary.readHeader(inputStream, DATA_FORMAT_ID_, this);
	m_dataInputStream_ = new DataInputStream(inputStream);
	}

	// protected methods -------------------------------------------------

	/**
	* Read and break up the stream of data passed in as arguments
	* and fills up UCharacterName.
	* If unsuccessful false will be returned.
	* @param data instance of datablock
	* @exception IOException thrown when there's a data error.
	*/
	protected void read(UCharacterName data) throws IOException
	{
	// reading index
	m_tokenstringindex_ = m_dataInputStream_.readInt();
	m_groupindex_ = m_dataInputStream_.readInt();
	m_groupstringindex_ = m_dataInputStream_.readInt();
	m_algnamesindex_ = m_dataInputStream_.readInt();

	// reading tokens
	int count = m_dataInputStream_.readChar();
	char token[] = new char[count];
	for (char i = 0; i < count; i ++) {
	token[i] = m_dataInputStream_.readChar();
	}
	int size = m_groupindex_ - m_tokenstringindex_;
	byte tokenstr[] = new byte[size];
	m_dataInputStream_.readFully(tokenstr);
	data.setToken(token, tokenstr);

	// reading the group information records
	count = m_dataInputStream_.readChar();
	data.setGroupCountSize(count, GROUP_INFO_SIZE_);
	count *= GROUP_INFO_SIZE_;
	char group[] = new char[count];
	for (int i = 0; i < count; i ++) {
	group[i] = m_dataInputStream_.readChar();
	}

	size = m_algnamesindex_ - m_groupstringindex_;
	byte groupstring[] = new byte[size];
	m_dataInputStream_.readFully(groupstring);

	data.setGroup(group, groupstring);

	count = m_dataInputStream_.readInt();
	UCharacterName.AlgorithmName alg[] =
	new UCharacterName.AlgorithmName[count];

	for (int i = 0; i < count; i ++)
	{
	UCharacterName.AlgorithmName an = readAlg();
	if (an == null) {
	throw new IOException("unames.icu read error: Algorithmic names creation error");
	}
	alg[i] = an;
	}
	data.setAlgorithm(alg);
	}

	/**
	* <p>Checking the file for the correct format.</p>
	* @param dataformatid
	* @param dataformatversion
	* @return true if the file format version is correct
	*/
	///CLOVER:OFF
	protected boolean authenticate(byte dataformatid[],
	byte dataformatversion[])
	{
	return Arrays.equals(DATA_FORMAT_ID_, dataformatid) &&
	Arrays.equals(DATA_FORMAT_VERSION_, dataformatversion);
	}
	///CLOVER:ON

	// private variables -------------------------------------------------

	/**
	* Data input stream for names
	*/
	private DataInputStream m_dataInputStream_;
	/**
	* Size of the group information block in number of char
	*/
	private static final int GROUP_INFO_SIZE_ = 3;

	/**
	* Index of the offset information
	*/
	private int m_tokenstringindex_;
	private int m_groupindex_;
	private int m_groupstringindex_;
	private int m_algnamesindex_;

	/**
	* Size of an algorithmic name information group
	* start code point size + end code point size + type size + variant size +
	* size of data size
	*/
	private static final int ALG_INFO_SIZE_ = 12;

	/**
	* File format version and id that this class understands.
	* No guarantees are made if a older version is used
	*/
	private static final byte DATA_FORMAT_VERSION_[] =
	{(byte)0x1, (byte)0x0, (byte)0x0, (byte)0x0};
	private static final byte DATA_FORMAT_ID_[] = {(byte)0x75, (byte)0x6E,
	(byte)0x61, (byte)0x6D};

	// private methods ---------------------------------------------------

	/**
	* Reads an individual record of AlgorithmNames
	* @return an instance of AlgorithNames if read is successful otherwise null
	* @exception IOException thrown when file read error occurs or data is corrupted
	*/
	private UCharacterName.AlgorithmName readAlg() throws IOException
	{
	UCharacterName.AlgorithmName result =
	new UCharacterName.AlgorithmName();
	int rangestart = m_dataInputStream_.readInt();
	int rangeend = m_dataInputStream_.readInt();
	byte type = m_dataInputStream_.readByte();
	byte variant = m_dataInputStream_.readByte();
	if (!result.setInfo(rangestart, rangeend, type, variant)) {
	return null;
	}

	int size = m_dataInputStream_.readChar();
	if (type == UCharacterName.AlgorithmName.TYPE_1_)
	{
	char factor[] = new char[variant];
	for (int j = 0; j < variant; j ++) {
	factor[j] = m_dataInputStream_.readChar();
	}

	result.setFactor(factor);
	size -= (variant << 1);
	}

	StringBuilder prefix = new StringBuilder();
	char c = (char)(m_dataInputStream_.readByte() & 0x00FF);
	while (c != 0)
	{
	prefix.append(c);
	c = (char)(m_dataInputStream_.readByte() & 0x00FF);
	}

	result.setPrefix(prefix.toString());

	size -= (ALG_INFO_SIZE_ + prefix.length() + 1);

	if (size > 0)
	{
	byte string[] = new byte[size];
	m_dataInputStream_.readFully(string);
	result.setFactorString(string);
	}
	return result;
	}
	}