/* | 
|
 * Copyright (c) 2003, 2005, Oracle and/or its affiliates. All rights reserved. | 
|
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. | 
|
 * | 
|
 * This code is free software; you can redistribute it and/or modify it | 
|
 * under the terms of the GNU General Public License version 2 only, as | 
|
 * published by the Free Software Foundation.  Oracle designates this | 
|
 * particular file as subject to the "Classpath" exception as provided | 
|
 * by Oracle in the LICENSE file that accompanied this code. | 
|
 * | 
|
 * This code is distributed in the hope that it will be useful, but WITHOUT | 
|
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or | 
|
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License | 
|
 * version 2 for more details (a copy is included in the LICENSE file that | 
|
 * accompanied this code). | 
|
 * | 
|
 * You should have received a copy of the GNU General Public License version | 
|
 * 2 along with this work; if not, write to the Free Software Foundation, | 
|
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. | 
|
 * | 
|
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA | 
|
 * or visit www.oracle.com if you need additional information or have any | 
|
 * questions. | 
|
*/  | 
|
/*  | 
|
*******************************************************************************  | 
|
* (C) Copyright IBM Corp. 1996-2005 - All Rights Reserved *  | 
|
* *  | 
|
* The original version of this source code and documentation is copyrighted *  | 
|
* and owned by IBM, These materials are provided under terms of a License *  | 
|
* Agreement between IBM and Sun. This technology is protected by multiple *  | 
|
* US and International patents. This notice and attribution to IBM may not *  | 
|
* to removed. *  | 
|
*******************************************************************************  | 
|
*/  | 
|
package sun.text.normalizer;  | 
|
import java.io.InputStream;  | 
|
import java.io.DataInputStream;  | 
|
import java.io.IOException;  | 
|
import java.util.Arrays;  | 
|
/**
 * Trie implementation which stores data in int, 32 bits.
 * @author synwee
 * @see com.ibm.icu.impl.Trie
 * @since release 2.1, Jan 01 2002
 */
public class IntTrie extends Trie  | 
|
{ | 
|
// public constructors ---------------------------------------------  | 
|
    /** | 
|
    * <p>Creates a new Trie with the settings for the trie data.</p> | 
|
    * <p>Unserialize the 32-bit-aligned input stream and use the data for the | 
|
    * trie.</p> | 
|
    * @param inputStream file input stream to a ICU data file, containing | 
|
    *                    the trie | 
|
    * @param dataManipulate object which provides methods to parse the char | 
|
    *                        data | 
|
    * @throws IOException thrown when data reading fails | 
|
    * @draft 2.1 | 
|
*/  | 
|
public IntTrie(InputStream inputStream, DataManipulate datamanipulate)  | 
|
throws IOException  | 
|
    { | 
|
super(inputStream, datamanipulate);  | 
|
if (!isIntTrie()) {  | 
|
throw new IllegalArgumentException(  | 
|
                               "Data given does not belong to a int trie."); | 
|
}  | 
|
}  | 
|
// public methods --------------------------------------------------  | 
|
    /** | 
|
    * Gets the value associated with the codepoint. | 
|
    * If no value is associated with the codepoint, a default value will be | 
|
    * returned. | 
|
    * @param ch codepoint | 
|
    * @return offset to data | 
|
    * @draft 2.1 | 
|
*/  | 
|
public final int getCodePointValue(int ch)  | 
|
    { | 
|
int offset = getCodePointOffset(ch);  | 
|
return (offset >= 0) ? m_data_[offset] : m_initialValue_;  | 
|
}  | 
|
    /** | 
|
    * Gets the value to the data which this lead surrogate character points | 
|
    * to. | 
|
    * Returned data may contain folding offset information for the next | 
|
    * trailing surrogate character. | 
|
    * This method does not guarantee correct results for trail surrogates. | 
|
    * @param ch lead surrogate character | 
|
    * @return data value | 
|
    * @draft 2.1 | 
|
*/  | 
|
public final int getLeadValue(char ch)  | 
|
    { | 
|
return m_data_[getLeadOffset(ch)];  | 
|
}  | 
|
    /** | 
|
    * Get a value from a folding offset (from the value of a lead surrogate) | 
|
    * and a trail surrogate. | 
|
    * @param leadvalue the value of a lead surrogate that contains the | 
|
    *        folding offset | 
|
    * @param trail surrogate | 
|
    * @return trie data value associated with the trail character | 
|
    * @draft 2.1 | 
|
*/  | 
|
public final int getTrailValue(int leadvalue, char trail)  | 
|
    { | 
|
        if (m_dataManipulate_ == null) { | 
|
throw new NullPointerException(  | 
|
                             "The field DataManipulate in this Trie is null"); | 
|
}  | 
|
int offset = m_dataManipulate_.getFoldingOffset(leadvalue);  | 
|
if (offset > 0) {  | 
|
return m_data_[getRawOffset(offset,  | 
|
(char)(trail & SURROGATE_MASK_))];  | 
|
}  | 
|
return m_initialValue_;  | 
|
}  | 
|
// protected methods -----------------------------------------------  | 
|
    /** | 
|
    * <p>Parses the input stream and stores its trie content into a index and | 
|
    * data array</p> | 
|
    * @param inputStream data input stream containing trie data | 
|
    * @exception IOException thrown when data reading fails | 
|
*/  | 
|
protected final void unserialize(InputStream inputStream)  | 
|
throws IOException  | 
|
    { | 
|
super.unserialize(inputStream);  | 
|
        // one used for initial value | 
|
m_data_ = new int[m_dataLength_];  | 
|
DataInputStream input = new DataInputStream(inputStream);  | 
|
for (int i = 0; i < m_dataLength_; i ++) {  | 
|
m_data_[i] = input.readInt();  | 
|
}  | 
|
m_initialValue_ = m_data_[0];  | 
|
}  | 
|
    /** | 
|
    * Gets the offset to the data which the surrogate pair points to. | 
|
    * @param lead lead surrogate | 
|
    * @param trail trailing surrogate | 
|
    * @return offset to data | 
|
    * @draft 2.1 | 
|
*/  | 
|
protected final int getSurrogateOffset(char lead, char trail)  | 
|
    { | 
|
        if (m_dataManipulate_ == null) { | 
|
throw new NullPointerException(  | 
|
                             "The field DataManipulate in this Trie is null"); | 
|
}  | 
|
        // get fold position for the next trail surrogate | 
|
int offset = m_dataManipulate_.getFoldingOffset(getLeadValue(lead));  | 
|
        // get the real data from the folded lead/trail units | 
|
if (offset > 0) {  | 
|
return getRawOffset(offset, (char)(trail & SURROGATE_MASK_));  | 
|
}  | 
|
// return -1 if there is an error, in this case we return the default  | 
|
        // value: m_initialValue_ | 
|
return -1;  | 
|
}  | 
|
    /** | 
|
    * Gets the value at the argument index. | 
|
    * For use internally in TrieIterator | 
|
    * @param index value at index will be retrieved | 
|
    * @return 32 bit value | 
|
    * @see com.ibm.icu.impl.TrieIterator | 
|
    * @draft 2.1 | 
|
*/  | 
|
protected final int getValue(int index)  | 
|
    { | 
|
return m_data_[index];  | 
|
}  | 
|
    /** | 
|
    * Gets the default initial value | 
|
    * @return 32 bit value | 
|
    * @draft 2.1 | 
|
*/  | 
|
protected final int getInitialValue()  | 
|
    { | 
|
return m_initialValue_;  | 
|
}  | 
|
// package private methods -----------------------------------------  | 
|
    /** | 
|
     * Internal constructor for builder use | 
|
     * @param index the index array to be slotted into this trie | 
|
     * @param data the data array to be slotted into this trie | 
|
     * @param initialvalue the initial value for this trie | 
|
     * @param options trie options to use | 
|
     * @param datamanipulate folding implementation | 
|
*/  | 
|
IntTrie(char index[], int data[], int initialvalue, int options,  | 
|
DataManipulate datamanipulate)  | 
|
    { | 
|
super(index, options, datamanipulate);  | 
|
m_data_ = data;  | 
|
m_dataLength_ = m_data_.length;  | 
|
m_initialValue_ = initialvalue;  | 
|
}  | 
|
// private data members --------------------------------------------  | 
|
    /** | 
|
    * Default value | 
|
*/  | 
|
private int m_initialValue_;  | 
|
    /** | 
|
    * Array of char data | 
|
*/  | 
|
private int m_data_[];  | 
|
}  |