/*
 * Copyright (c) 1996, 2004, Oracle and/or its affiliates. All rights reserved.
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
 *
 * This code is free software; you can redistribute it and/or modify it
 * under the terms of the GNU General Public License version 2 only, as
 * published by the Free Software Foundation.  Oracle designates this
 * particular file as subject to the "Classpath" exception as provided
 * by Oracle in the LICENSE file that accompanied this code.
 *
 * This code is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
 * version 2 for more details (a copy is included in the LICENSE file that
 * accompanied this code).
 *
 * You should have received a copy of the GNU General Public License version
 * 2 along with this work; if not, write to the Free Software Foundation,
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
 *
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
 * or visit www.oracle.com if you need additional information or have any
 * questions.
 */

package sun.io;

import sun.nio.cs.ext.EUC_TW;

/*
 * @author Limin Shi
 */
public class ByteToCharEUC_TW extends ByteToCharConverter
{
    private final byte G0 = 0;
    private final byte G1 = 1;
    private final byte G2 = 2;
    private final byte G3 = 3;
    private final byte G4 = 4;
    private final byte MSB = (byte) 0x80;
    private final byte SS2 = (byte) 0x8E;
    private final byte P2 = (byte) 0xA2;
    private final byte P3 = (byte) 0xA3;

    protected final char REPLACE_CHAR = '\uFFFD';

    private byte firstByte = 0, state = G0;
    public static String unicodeCNS2, unicodeCNS3;
    private static String unicodeCNS4, unicodeCNS5, unicodeCNS6;
    private static String unicodeCNS7, unicodeCNS15;

    private int cnsPlane = 0;
    private final static EUC_TW nioCoder = new EUC_TW();

    public static String unicodeCNS1 = nioCoder.getUnicodeCNS1();

        static String[] cnsChars = {
            unicodeCNS2 = nioCoder.getUnicodeCNS2(),
            unicodeCNS3 = nioCoder.getUnicodeCNS3(),
            unicodeCNS4 = nioCoder.getUnicodeCNS4(),
            unicodeCNS5 = nioCoder.getUnicodeCNS5(),
            unicodeCNS6 = nioCoder.getUnicodeCNS6(),
            unicodeCNS7 = nioCoder.getUnicodeCNS7(),
            unicodeCNS15 = nioCoder.getUnicodeCNS15()
            };

    public ByteToCharEUC_TW() {
    }

    public int flush(char[] output, int outStart, int outEnd)
        throws MalformedInputException
    {
        if (state != G0) {
            state = G0;
            firstByte = 0;
            badInputLength = 0;
            throw new MalformedInputException();
        }
        reset();
        return 0;
    }

    public void reset() {
        state = G0;
        firstByte = 0;
        byteOff = charOff = 0;
    }

    
Character conversion
/** * Character conversion */
public int convert(byte[] input, int inOff, int inEnd, char[] output, int outOff, int outEnd) throws UnknownCharacterException, MalformedInputException, ConversionBufferFullException { int inputSize = 0; char outputChar = (char) 0; byteOff = inOff; charOff = outOff; cnsPlane = 3; while (byteOff < inEnd) { if (charOff >= outEnd) throw new ConversionBufferFullException(); switch (state) { case G0: if ( (input[byteOff] & MSB) == 0) { // ASCII outputChar = (char) input[byteOff]; } else if (input[byteOff] == SS2) { // Codeset 2 state = G2; } else { // Codeset 1 firstByte = input[byteOff]; state = G1; } break; case G1: inputSize = 2; if ( (input[byteOff] & MSB) != 0) { // 2nd byte cnsPlane = 1; outputChar = convToUnicode(firstByte, input[byteOff], unicodeCNS1); } else { // Error badInputLength = 1; throw new MalformedInputException(); } firstByte = 0; state = G0; break; case G2: cnsPlane = (input[byteOff] & (byte)0x0f); // Adjust String array index for plan 15 cnsPlane = (cnsPlane == 15)? 8 : cnsPlane; if (cnsPlane < 15) { state = G3; } else { badInputLength = 2; throw new MalformedInputException(); } break; case G3: if ( (input[byteOff] & MSB) != 0) { // 1st byte firstByte = input[byteOff]; state = G4; } else { // Error state = G0; badInputLength = 2; throw new MalformedInputException(); } break; case G4: if ( (input[byteOff] & MSB) != 0) { // 2nd byte outputChar = convToUnicode(firstByte, input[byteOff], cnsChars[cnsPlane - 2]); } else { // Error badInputLength = 3; throw new MalformedInputException(); } firstByte = 0; state = G0; break; } byteOff++; if (outputChar != (char) 0) { if (outputChar == REPLACE_CHAR) { if (subMode) // substitution enabled outputChar = subChars[0]; else { badInputLength = inputSize; throw new UnknownCharacterException(); } } output[charOff++] = outputChar; outputChar = 0; } } return charOff - outOff; }
Return the character set ID
/** * Return the character set ID */
public String getCharacterEncoding() { return "EUC_TW"; } protected char convToUnicode(byte byte1, byte byte2, String table) { int index; if ((byte1 & 0xff) < 0xa1 || (byte2 & 0xff) < 0xa1 || (byte1 & 0xff) > 0xfe || (byte2 & 0xff) > 0xfe) return REPLACE_CHAR; index = (((byte1 & 0xff) - 0xa1) * 94) + (byte2 & 0xff) - 0xa1; if (index < 0 || index >= table.length()) return REPLACE_CHAR; // Planes 3 and above containing zero value lead byte // to accommodate surrogates for mappings which decode to a surrogate // pair if (this.cnsPlane >= 3) index = (index * 2) + 1; return table.charAt(index); } }