/*
* Copyright (c) 1999, Oracle and/or its affiliates. All rights reserved.
* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
*
* This code is free software; you can redistribute it and/or modify it
* under the terms of the GNU General Public License version 2 only, as
* published by the Free Software Foundation. Oracle designates this
* particular file as subject to the "Classpath" exception as provided
* by Oracle in the LICENSE file that accompanied this code.
*
* This code is distributed in the hope that it will be useful, but WITHOUT
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
* version 2 for more details (a copy is included in the LICENSE file that
* accompanied this code).
*
* You should have received a copy of the GNU General Public License version
* 2 along with this work; if not, write to the Free Software Foundation,
* Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
*
* Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
* or visit www.oracle.com if you need additional information or have any
* questions.
*/
package sun.io;
import sun.nio.cs.ext.ISCII91;
/*
* Copyright (c) 1998 International Business Machines.
* All Rights Reserved.
*
* Author : Sunanda Bera, C. Thirumalesh
* Last Modified : 23,November,1998
*
* Purpose : Defines class ByteToCharISCII91.
*
*
* Revision History
* ======== =======
*
* Date By Description
* ---- -- -----------
*
*
*/
Converter class. Converts between Unicode encoding and ISCII91 encoding.
ISCII91 is the character encoding as defined in Indian Standard document
IS 13194:1991 ( Indian Script Code for Information Interchange ).
See Also: - ByteToCharConverter
/**
* Converter class. Converts between Unicode encoding and ISCII91 encoding.
* ISCII91 is the character encoding as defined in Indian Standard document
* IS 13194:1991 ( Indian Script Code for Information Interchange ).
*
* @see sun.io.ByteToCharConverter
*/
public class ByteToCharISCII91 extends ByteToCharConverter {
private static final char[] directMapTable = ISCII91.getDirectMapTable();
private static final char NUKTA_CHAR = '\u093c';
private static final char HALANT_CHAR = '\u094d';
private static final char ZWNJ_CHAR = '\u200c';
private static final char ZWJ_CHAR = '\u200d';
private static final char INVALID_CHAR = '\uffff';
private char contextChar = INVALID_CHAR;
private boolean needFlushing = false;
Converts ISCII91 characters to Unicode.
See Also: - convert.convert
/**
* Converts ISCII91 characters to Unicode.
* @see sun.io.ByteToCharConverter#convert
*/
public int convert(byte input[], int inStart, int inEnd,
char output[], int outStart, int outEnd)
throws ConversionBufferFullException, UnknownCharacterException {
/*Rules:
* 1)ATR,EXT,following character to be replaced with '\ufffd'
* 2)Halant + Halant => '\u094d' (Virama) + '\u200c'(ZWNJ)
* 3)Halant + Nukta => '\u094d' (Virama) + '\u200d'(ZWJ)
*/
charOff = outStart;
byteOff = inStart;
while (byteOff < inEnd) {
if (charOff >= outEnd) {
throw new ConversionBufferFullException();
}
int index = input[byteOff++];
index = ( index < 0 )? ( index + 255 ):index;
char currentChar = directMapTable[index];
// if the contextChar is either ATR || EXT set the output to '\ufffd'
if(contextChar == '\ufffd') {
output[charOff++] = '\ufffd';
contextChar = INVALID_CHAR;
needFlushing = false;
continue;
}
switch(currentChar) {
case '\u0901':
case '\u0907':
case '\u0908':
case '\u090b':
case '\u093f':
case '\u0940':
case '\u0943':
case '\u0964':
if(needFlushing) {
output[charOff++] = contextChar;
contextChar = currentChar;
continue;
}
contextChar = currentChar;
needFlushing = true;
continue;
case NUKTA_CHAR:
switch(contextChar) {
case '\u0901':
output[charOff] = '\u0950';
break;
case '\u0907':
output[charOff] = '\u090c';
break;
case '\u0908':
output[charOff] = '\u0961';
break;
case '\u090b':
output[charOff] = '\u0960';
break;
case '\u093f':
output[charOff] = '\u0962';
break;
case '\u0940':
output[charOff] = '\u0963';
break;
case '\u0943':
output[charOff] = '\u0944';
break;
case '\u0964':
output[charOff] = '\u093d';
break;
case HALANT_CHAR:
if(needFlushing) {
output[charOff++] = contextChar;
contextChar = currentChar;
continue;
}
output[charOff] = ZWJ_CHAR;
break;
default:
if(needFlushing) {
output[charOff++] = contextChar;
contextChar = currentChar;
continue;
}
output[charOff] = NUKTA_CHAR;
}
break;
case HALANT_CHAR:
if(needFlushing) {
output[charOff++] = contextChar;
contextChar = currentChar;
continue;
}
if(contextChar == HALANT_CHAR) {
output[charOff] = ZWNJ_CHAR;
break;
}
output[charOff] = HALANT_CHAR;
break;
case INVALID_CHAR:
if(needFlushing) {
output[charOff++] = contextChar;
contextChar = currentChar;
continue;
}
if(subMode) {
output[charOff] = subChars[0];
break;
} else {
contextChar = INVALID_CHAR;
throw new UnknownCharacterException();
}
default:
if(needFlushing) {
output[charOff++] = contextChar;
contextChar = currentChar;
continue;
}
output[charOff] = currentChar;
break;
}//end switch
contextChar = currentChar;
needFlushing = false;
charOff++;
}//end while
return charOff - outStart;
} //convert()
See Also: - flush.flush
/**
* @see sun.io.ByteToCharConverter#flush
*/
public int flush( char[] output, int outStart, int outEnd )
throws MalformedInputException, ConversionBufferFullException
{
int charsWritten = 0;
//if the last char was not flushed, flush it!
if(needFlushing) {
output[outStart] = contextChar;
charsWritten = 1;
}
contextChar = INVALID_CHAR;
needFlushing = false;
byteOff = charOff = 0;
return charsWritten;
}//flush()
Returns the character set id for the conversion.
/**
* Returns the character set id for the conversion.
*/
public String getCharacterEncoding()
{
return "ISCII91";
}//getCharacterEncoding()
See Also: - reset.reset
/**
* @see sun.io.ByteToCharConverter#reset
*/
public void reset()
{
byteOff = charOff = 0;
}//reset()
}//end of class definition