jdk/src/share/classes/sun/nio/cs/ext/SJIS.java
changeset 13383 34e17f628599
parent 13382 d63c06178ebc
parent 13381 9d3762ef6332
child 13385 15512350dedf
equal deleted inserted replaced
13382:d63c06178ebc 13383:34e17f628599
     1 /*
       
     2  * Copyright (c) 2002, 2010, Oracle and/or its affiliates. All rights reserved.
       
     3  * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
       
     4  *
       
     5  * This code is free software; you can redistribute it and/or modify it
       
     6  * under the terms of the GNU General Public License version 2 only, as
       
     7  * published by the Free Software Foundation.  Oracle designates this
       
     8  * particular file as subject to the "Classpath" exception as provided
       
     9  * by Oracle in the LICENSE file that accompanied this code.
       
    10  *
       
    11  * This code is distributed in the hope that it will be useful, but WITHOUT
       
    12  * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
       
    13  * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
       
    14  * version 2 for more details (a copy is included in the LICENSE file that
       
    15  * accompanied this code).
       
    16  *
       
    17  * You should have received a copy of the GNU General Public License version
       
    18  * 2 along with this work; if not, write to the Free Software Foundation,
       
    19  * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
       
    20  *
       
    21  * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
       
    22  * or visit www.oracle.com if you need additional information or have any
       
    23  * questions.
       
    24  */
       
    25 
       
    26 /*
       
    27  */
       
    28 
       
    29 package sun.nio.cs.ext;
       
    30 
       
    31 import java.nio.ByteBuffer;
       
    32 import java.nio.CharBuffer;
       
    33 import java.nio.charset.Charset;
       
    34 import java.nio.charset.CharsetDecoder;
       
    35 import java.nio.charset.CharsetEncoder;
       
    36 import java.nio.charset.CoderResult;
       
    37 import sun.nio.cs.HistoricallyNamedCharset;
       
    38 
       
    39 public class SJIS
       
    40     extends Charset
       
    41     implements HistoricallyNamedCharset
       
    42 {
       
    43 
       
    44     public SJIS() {
       
    45         super("Shift_JIS", ExtendedCharsets.aliasesFor("Shift_JIS"));
       
    46     }
       
    47 
       
    48     public String historicalName() {
       
    49         return "SJIS";
       
    50     }
       
    51 
       
    52     public boolean contains(Charset cs) {
       
    53         return ((cs.name().equals("US-ASCII"))
       
    54                 || (cs instanceof JIS_X_0201)
       
    55                 || (cs instanceof SJIS)
       
    56                 || (cs instanceof JIS_X_0208));
       
    57     }
       
    58 
       
    59     public CharsetDecoder newDecoder() {
       
    60         return new Decoder(this);
       
    61     }
       
    62 
       
    63     public CharsetEncoder newEncoder() {
       
    64 
       
    65         // Need to force the replacement byte to 0x3f
       
    66         // because JIS_X_0208_Encoder defines its own
       
    67         // alternative 2 byte substitution to permit it
       
    68         // to exist as a self-standing Encoder
       
    69 
       
    70         byte[] replacementBytes = { (byte)0x3f };
       
    71         return new Encoder(this).replaceWith(replacementBytes);
       
    72     }
       
    73 
       
    74     static class Decoder extends JIS_X_0208_Decoder
       
    75         implements DelegatableDecoder {
       
    76 
       
    77         JIS_X_0201.Decoder jis0201;
       
    78 
       
    79         protected Decoder(Charset cs) {
       
    80             super(cs);
       
    81             jis0201 = new JIS_X_0201.Decoder(cs);
       
    82         }
       
    83 
       
    84         protected char decodeSingle(int b) {
       
    85             // If the high bits are all off, it's ASCII == Unicode
       
    86             if ((b & 0xFF80) == 0) {
       
    87                 return (char)b;
       
    88             }
       
    89             return jis0201.decode(b);
       
    90         }
       
    91 
       
    92         protected char decodeDouble(int c1, int c2) {
       
    93             int adjust = c2 < 0x9F ? 1 : 0;
       
    94             int rowOffset = c1 < 0xA0 ? 0x70 : 0xB0;
       
    95             int cellOffset = (adjust == 1) ? (c2 > 0x7F ? 0x20 : 0x1F) : 0x7E;
       
    96             int b1 = ((c1 - rowOffset) << 1) - adjust;
       
    97             int b2 = c2 - cellOffset;
       
    98             return super.decodeDouble(b1, b2);
       
    99         }
       
   100 
       
   101         // Make some protected methods public for use by JISAutoDetect
       
   102         public CoderResult decodeLoop(ByteBuffer src, CharBuffer dst) {
       
   103             return super.decodeLoop(src, dst);
       
   104         }
       
   105         public void implReset() {
       
   106             super.implReset();
       
   107         }
       
   108         public CoderResult implFlush(CharBuffer out) {
       
   109             return super.implFlush(out);
       
   110         }
       
   111     }
       
   112 
       
   113     static class Encoder extends JIS_X_0208_Encoder {
       
   114 
       
   115         private JIS_X_0201.Encoder jis0201;
       
   116 
       
   117         private static final short[] j0208Index1 =
       
   118             JIS_X_0208_Encoder.getIndex1();
       
   119         private static final String[] j0208Index2 =
       
   120             JIS_X_0208_Encoder.getIndex2();
       
   121 
       
   122         protected Encoder(Charset cs) {
       
   123             super(cs);
       
   124             jis0201 = new JIS_X_0201.Encoder(cs);
       
   125         }
       
   126 
       
   127         protected int encodeSingle(char inputChar) {
       
   128             byte b;
       
   129 
       
   130             // \u0000 - \u007F map straight through
       
   131             if ((inputChar & 0xFF80) == 0)
       
   132                 return (byte)inputChar;
       
   133 
       
   134             if ((b = jis0201.encode(inputChar)) == 0)
       
   135                 return -1;
       
   136             else
       
   137                 return b;
       
   138         }
       
   139 
       
   140         protected int encodeDouble(char ch) {
       
   141             int offset = j0208Index1[ch >> 8] << 8;
       
   142             int pos = j0208Index2[offset >> 12].charAt((offset & 0xfff) + (ch & 0xff));
       
   143             if (pos == 0) {
       
   144                 /* Zero value indicates this Unicode has no mapping to
       
   145                  * JIS0208.
       
   146                  * We bail here because the JIS -> SJIS algorithm produces
       
   147                  * bogus SJIS values for invalid JIS input.  Zero should be
       
   148                  * the only invalid JIS value in our table.
       
   149                  */
       
   150                 return 0;
       
   151             }
       
   152             /*
       
   153              * This algorithm for converting from JIS to SJIS comes from
       
   154              * Ken Lunde's "Understanding Japanese Information Processing",
       
   155              * pg 163.
       
   156              */
       
   157             int c1 = (pos >> 8) & 0xff;
       
   158             int c2 = pos & 0xff;
       
   159             int rowOffset = c1 < 0x5F ? 0x70 : 0xB0;
       
   160             int cellOffset = (c1 % 2 == 1) ? (c2 > 0x5F ? 0x20 : 0x1F) : 0x7E;
       
   161             return ((((c1 + 1 ) >> 1) + rowOffset) << 8) | (c2 + cellOffset);
       
   162         }
       
   163     }
       
   164 }