jdk/src/share/classes/sun/io/ByteToCharEUC_JP.java
changeset 10372 2f6d68f22eae
parent 10321 64f7ee2f31dd
parent 10371 7da2112e4236
child 10373 d4c5e59b82f8
equal deleted inserted replaced
10321:64f7ee2f31dd 10372:2f6d68f22eae
     1 /*
       
     2  * Copyright (c) 1996, 2003, Oracle and/or its affiliates. All rights reserved.
       
     3  * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
       
     4  *
       
     5  * This code is free software; you can redistribute it and/or modify it
       
     6  * under the terms of the GNU General Public License version 2 only, as
       
     7  * published by the Free Software Foundation.  Oracle designates this
       
     8  * particular file as subject to the "Classpath" exception as provided
       
     9  * by Oracle in the LICENSE file that accompanied this code.
       
    10  *
       
    11  * This code is distributed in the hope that it will be useful, but WITHOUT
       
    12  * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
       
    13  * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
       
    14  * version 2 for more details (a copy is included in the LICENSE file that
       
    15  * accompanied this code).
       
    16  *
       
    17  * You should have received a copy of the GNU General Public License version
       
    18  * 2 along with this work; if not, write to the Free Software Foundation,
       
    19  * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
       
    20  *
       
    21  * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
       
    22  * or visit www.oracle.com if you need additional information or have any
       
    23  * questions.
       
    24  */
       
    25 
       
    26 package sun.io;
       
    27 
       
    28 /**
       
    29  * @author Limin Shi
       
    30  */
       
    31 
       
    32 public class ByteToCharEUC_JP extends ByteToCharJIS0208 {
       
    33     private byte savedSecond = 0;
       
    34 
       
    35     ByteToCharJIS0201 bcJIS0201 = new ByteToCharJIS0201();
       
    36     ByteToCharJIS0212 bcJIS0212 = new ByteToCharJIS0212();
       
    37 
       
    38     public ByteToCharEUC_JP() {
       
    39         super();
       
    40         start = 0xA1;
       
    41         end = 0xFE;
       
    42         savedSecond = 0;
       
    43     }
       
    44 
       
    45     public int flush(char[] output, int outStart, int outEnd)
       
    46         throws MalformedInputException
       
    47     {
       
    48         if (savedSecond != 0) {
       
    49             reset();
       
    50             throw new MalformedInputException();
       
    51         }
       
    52         reset();
       
    53         return 0;
       
    54     }
       
    55 
       
    56     /**
       
    57      * Resets the converter.
       
    58      * Call this method to reset the converter to its initial state
       
    59      */
       
    60     public void reset() {
       
    61         super.reset();
       
    62         savedSecond = 0;
       
    63     }
       
    64 
       
    65     public String getCharacterEncoding() {
       
    66         return "EUC_JP";
       
    67     }
       
    68 
       
    69     protected char convSingleByte(int b) {
       
    70         if (b < 0 || b > 0x7F)
       
    71             return REPLACE_CHAR;
       
    72         return bcJIS0201.getUnicode(b);
       
    73     }
       
    74 
       
    75     protected char getUnicode(int byte1, int byte2) {
       
    76         if (byte1 == 0x8E) {
       
    77             return bcJIS0201.getUnicode(byte2 - 256);
       
    78         }
       
    79         // Fix for bug 4121358 - similar fix for bug 4117820 put
       
    80         // into ByteToCharDoubleByte.getUnicode()
       
    81         if (((byte1 < 0) || (byte1 > index1.length))
       
    82             || ((byte2 < start) || (byte2 > end)))
       
    83             return REPLACE_CHAR;
       
    84 
       
    85         int n = (index1[byte1 - 0x80] & 0xf) * (end - start + 1)
       
    86                 + (byte2 - start);
       
    87         return index2[index1[byte1 - 0x80] >> 4].charAt(n);
       
    88     }
       
    89 
       
    90     protected char decode0212(int byte1, int byte2) {
       
    91         return bcJIS0212.getUnicode(byte1, byte2);
       
    92     }
       
    93 
       
    94     /**
       
    95      * Converts sequences of bytes to characters.
       
    96      * Conversions that result in Exceptions can be restarted by calling
       
    97      * convert again, with appropriately modified parameters.
       
    98      * @return the characters written to output.
       
    99      * @param input byte array containing text in Double/single Byte
       
   100      * @param inStart offset in input array
       
   101      * @param inEnd offset of last byte to be converted
       
   102      * @param output character array to receive conversion result
       
   103      * @param outStart starting offset
       
   104      * @param outEnd offset of last byte to be written to
       
   105      * @throw UnsupportedCharacterException for any bytes
       
   106      * that cannot be converted to the external character set.
       
   107      */
       
   108     public int convert(byte[] input, int inOff, int inEnd,
       
   109                        char[] output, int outOff, int outEnd)
       
   110         throws UnknownCharacterException,
       
   111                ConversionBufferFullException
       
   112     {
       
   113         char    outputChar = REPLACE_CHAR;
       
   114         int     inputSize = 0;          // Size of input
       
   115 
       
   116         // Record beginning offsets
       
   117         charOff = outOff;
       
   118         byteOff = inOff;
       
   119 
       
   120         // Loop until we hit the end of the input
       
   121         while (byteOff < inEnd) {
       
   122             int byte1, byte2;
       
   123 
       
   124             if (savedByte == 0) {
       
   125                 byte1 = input[byteOff];
       
   126                 inputSize = 1;
       
   127             } else {
       
   128                 byte1 = savedByte;
       
   129                 savedByte = 0;
       
   130                 inputSize = 0;
       
   131             }
       
   132 
       
   133             outputChar = convSingleByte(byte1);
       
   134 
       
   135             if (outputChar == REPLACE_CHAR) {   // Multibyte char
       
   136                 if ((byte1 & 0xff) == 0x8F) {   // JIS0212
       
   137                     if (byteOff + inputSize + 1 >= inEnd) {
       
   138                         // split in the middle of a character
       
   139                         // save the first 2 bytes for next time around
       
   140                         savedByte = (byte) byte1;
       
   141                         byteOff += inputSize;
       
   142                         if (byteOff < inEnd) {
       
   143                             savedSecond = input[byteOff];
       
   144                             byteOff++;
       
   145                         }
       
   146                         break;
       
   147                     }
       
   148                     if (savedSecond != 0) {
       
   149                         byte1 = savedSecond & 0xff;
       
   150                         savedSecond = 0;
       
   151                     } else {
       
   152                         byte1 = input[byteOff + inputSize] & 0xff;
       
   153                         inputSize++;
       
   154                     }
       
   155                     byte2 = input[byteOff + inputSize] & 0xff;
       
   156                     inputSize++;
       
   157                     outputChar = decode0212(byte1-0x80, byte2-0x80);
       
   158                 } else { // JIS0208
       
   159                     if (byteOff + inputSize >= inEnd) {
       
   160                         // split in the middle of a character
       
   161                         // save the first byte for next time around
       
   162                         savedByte = (byte) byte1;
       
   163                         byteOff += inputSize;
       
   164                         break;
       
   165                     }
       
   166                     byte1 &= 0xff;
       
   167                     byte2 = input[byteOff + inputSize] & 0xff;
       
   168                     inputSize++;
       
   169                     outputChar = getUnicode(byte1, byte2);
       
   170                 }
       
   171             }
       
   172 
       
   173             if (outputChar == REPLACE_CHAR) {
       
   174                 if (subMode)
       
   175                     outputChar = subChars[0];
       
   176                 else {
       
   177                     badInputLength = inputSize;
       
   178                     throw new UnknownCharacterException();
       
   179                 }
       
   180             }
       
   181 
       
   182             if (charOff >= outEnd)
       
   183                 throw new ConversionBufferFullException();
       
   184 
       
   185             output[charOff++] = outputChar;
       
   186             byteOff += inputSize;
       
   187         }
       
   188 
       
   189         return charOff - outOff;
       
   190     }
       
   191 
       
   192 }