/* * Copyright (c) 1999, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it * under the terms of the GNU General Public License version 2 only, as * published by the Free Software Foundation. Oracle designates this * particular file as subject to the "Classpath" exception as provided * by Oracle in the LICENSE file that accompanied this code. * * This code is distributed in the hope that it will be useful, but WITHOUT * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License * version 2 for more details (a copy is included in the LICENSE file that * accompanied this code). * * You should have received a copy of the GNU General Public License version * 2 along with this work; if not, write to the Free Software Foundation, * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. * * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA * or visit www.oracle.com if you need additional information or have any * questions. */ package sun.io; import sun.nio.cs.ext.ISCII91; /* * Copyright (c) 1998 International Business Machines. * All Rights Reserved. * * Author : Sunanda Bera, C. Thirumalesh * Last Modified : 23,November,1998 * * Purpose : Defines class ByteToCharISCII91. * * * Revision History * ======== ======= * * Date By Description * ---- -- ----------- * * */ /** * Converter class. Converts between Unicode encoding and ISCII91 encoding. * ISCII91 is the character encoding as defined in Indian Standard document * IS 13194:1991 ( Indian Script Code for Information Interchange ). * * @see sun.io.ByteToCharConverter */ public class ByteToCharISCII91 extends ByteToCharConverter { private static final char[] directMapTable = ISCII91.getDirectMapTable(); private static final char NUKTA_CHAR = '\u093c'; private static final char HALANT_CHAR = '\u094d'; private static final char ZWNJ_CHAR = '\u200c'; private static final char ZWJ_CHAR = '\u200d'; private static final char INVALID_CHAR = '\uffff'; private char contextChar = INVALID_CHAR; private boolean needFlushing = false; /** * Converts ISCII91 characters to Unicode. * @see sun.io.ByteToCharConverter#convert */ public int convert(byte input[], int inStart, int inEnd, char output[], int outStart, int outEnd) throws ConversionBufferFullException, UnknownCharacterException { /*Rules: * 1)ATR,EXT,following character to be replaced with '\ufffd' * 2)Halant + Halant => '\u094d' (Virama) + '\u200c'(ZWNJ) * 3)Halant + Nukta => '\u094d' (Virama) + '\u200d'(ZWJ) */ charOff = outStart; byteOff = inStart; while (byteOff < inEnd) { if (charOff >= outEnd) { throw new ConversionBufferFullException(); } int index = input[byteOff++]; index = ( index < 0 )? ( index + 255 ):index; char currentChar = directMapTable[index]; // if the contextChar is either ATR || EXT set the output to '\ufffd' if(contextChar == '\ufffd') { output[charOff++] = '\ufffd'; contextChar = INVALID_CHAR; needFlushing = false; continue; } switch(currentChar) { case '\u0901': case '\u0907': case '\u0908': case '\u090b': case '\u093f': case '\u0940': case '\u0943': case '\u0964': if(needFlushing) { output[charOff++] = contextChar; contextChar = currentChar; continue; } contextChar = currentChar; needFlushing = true; continue; case NUKTA_CHAR: switch(contextChar) { case '\u0901': output[charOff] = '\u0950'; break; case '\u0907': output[charOff] = '\u090c'; break; case '\u0908': output[charOff] = '\u0961'; break; case '\u090b': output[charOff] = '\u0960'; break; case '\u093f': output[charOff] = '\u0962'; break; case '\u0940': output[charOff] = '\u0963'; break; case '\u0943': output[charOff] = '\u0944'; break; case '\u0964': output[charOff] = '\u093d'; break; case HALANT_CHAR: if(needFlushing) { output[charOff++] = contextChar; contextChar = currentChar; continue; } output[charOff] = ZWJ_CHAR; break; default: if(needFlushing) { output[charOff++] = contextChar; contextChar = currentChar; continue; } output[charOff] = NUKTA_CHAR; } break; case HALANT_CHAR: if(needFlushing) { output[charOff++] = contextChar; contextChar = currentChar; continue; } if(contextChar == HALANT_CHAR) { output[charOff] = ZWNJ_CHAR; break; } output[charOff] = HALANT_CHAR; break; case INVALID_CHAR: if(needFlushing) { output[charOff++] = contextChar; contextChar = currentChar; continue; } if(subMode) { output[charOff] = subChars[0]; break; } else { contextChar = INVALID_CHAR; throw new UnknownCharacterException(); } default: if(needFlushing) { output[charOff++] = contextChar; contextChar = currentChar; continue; } output[charOff] = currentChar; break; }//end switch contextChar = currentChar; needFlushing = false; charOff++; }//end while return charOff - outStart; } //convert() /** * @see sun.io.ByteToCharConverter#flush */ public int flush( char[] output, int outStart, int outEnd ) throws MalformedInputException, ConversionBufferFullException { int charsWritten = 0; //if the last char was not flushed, flush it! if(needFlushing) { output[outStart] = contextChar; charsWritten = 1; } contextChar = INVALID_CHAR; needFlushing = false; byteOff = charOff = 0; return charsWritten; }//flush() /** * Returns the character set id for the conversion. */ public String getCharacterEncoding() { return "ISCII91"; }//getCharacterEncoding() /** * @see sun.io.ByteToCharConverter#reset */ public void reset() { byteOff = charOff = 0; }//reset() }//end of class definition