jdk/test/java/lang/String/Encodings.java
changeset 2 90ce3da70b43
child 5506 202f599c92aa
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/jdk/test/java/lang/String/Encodings.java	Sat Dec 01 00:00:00 2007 +0000
@@ -0,0 +1,179 @@
+/*
+ * Copyright 1999-2006 Sun Microsystems, Inc.  All Rights Reserved.
+ * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
+ *
+ * This code is free software; you can redistribute it and/or modify it
+ * under the terms of the GNU General Public License version 2 only, as
+ * published by the Free Software Foundation.
+ *
+ * This code is distributed in the hope that it will be useful, but WITHOUT
+ * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
+ * version 2 for more details (a copy is included in the LICENSE file that
+ * accompanied this code).
+ *
+ * You should have received a copy of the GNU General Public License version
+ * 2 along with this work; if not, write to the Free Software Foundation,
+ * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
+ *
+ * Please contact Sun Microsystems, Inc., 4150 Network Circle, Santa Clara,
+ * CA 95054 USA or visit www.sun.com if you need additional information or
+ * have any questions.
+ */
+
+/* @test
+ * @bug 4085160 4139951 5005831
+ * @summary Test that required character encodings are supported
+ */
+
+import java.io.InputStreamReader;
+import java.io.OutputStreamWriter;
+import java.io.ByteArrayInputStream;
+import java.io.ByteArrayOutputStream;
+import java.nio.charset.Charset;
+import java.nio.charset.UnsupportedCharsetException;
+
+
+public class Encodings {
+
+
+    static boolean equals(byte[] a, byte[] b) {
+        if (a.length != b.length) return false;
+        for (int i = 0; i < a.length; i++)
+            if (a[i] != b[i]) return false;
+        return true;
+    }
+
+
+    static void go(String enc, String str, final byte[] bytes, boolean bidir)
+        throws Exception
+    {
+        final Charset charset = Charset.forName(enc);
+
+        /* String(byte[] bs, String enc) */
+        if (!(new String(bytes, enc).equals(str)))
+            throw new Exception(enc + ": String constructor failed");
+
+        /* String(byte[] bs, Charset charset) */
+        if (!(new String(bytes, charset).equals(str)))
+            throw new Exception(charset + ": String constructor failed");
+
+        /* String(byte[] bs, int off, int len, Charset charset) */
+        String start = str.substring(0, 2);
+        String end = str.substring(2);
+        if (enc.equals("UTF-16BE") || enc.equals("UTF-16LE")) {
+            if (!(new String(bytes, 0, 4, charset).equals(start)))
+                throw new Exception(charset + ": String constructor failed");
+            if (!(new String(bytes, 4, bytes.length - 4, charset).equals(end)))
+                throw new Exception(charset + ": String constructor failed");
+        } else if (enc.equals("UTF-16")) {
+            if (!(new String(bytes, 0, 6, charset).equals(start)))
+                throw new Exception(charset + ": String constructor failed");
+        } else {
+            if (!(new String(bytes, 0, 2, charset).equals(start)))
+                throw new Exception(charset + ": String constructor failed");
+            if (!(new String(bytes, 2, bytes.length - 2, charset).equals(end)))
+                throw new Exception(charset + ": String constructor failed");
+        }
+
+        /* InputStreamReader */
+        ByteArrayInputStream bi = new ByteArrayInputStream(bytes);
+        InputStreamReader r = new InputStreamReader(bi, enc);
+        String inEnc = r.getEncoding();
+        int n = str.length();
+        char[] cs = new char[n];
+        for (int i = 0; i < n;) {
+            int m;
+            if ((m = r.read(cs, i, n - i)) < 0)
+                throw new Exception(enc + ": EOF on InputStreamReader");
+            i += m;
+        }
+        if (!(new String(cs).equals(str)))
+            throw new Exception(enc + ": InputStreamReader failed");
+
+        if (!bidir) {
+            System.err.println(enc + " --> " + inEnc);
+            return;
+        }
+
+        /* String.getBytes(String enc) */
+        byte[] bs = str.getBytes(enc);
+        if (!equals(bs, bytes))
+            throw new Exception(enc + ": String.getBytes failed");
+
+        /* String.getBytes(Charset charset) */
+        bs = str.getBytes(charset);
+        if (!equals(bs, bytes))
+            throw new Exception(charset + ": String.getBytes failed");
+
+        // Calls to String.getBytes(Charset) shouldn't automatically
+        // use the cached thread-local encoder.
+        if (charset.name().equals("UTF-16BE")) {
+            String s = new String(bytes, charset);
+            // Replace the thread-local encoder with this one.
+            byte[] bb = s.getBytes(Charset.forName("UTF-16LE"));
+            if (bytes.length != bb.length) {
+                // Incidental test.
+                throw new RuntimeException("unequal length: "
+                                           + bytes.length + " != "
+                                           + bb.length);
+            } else {
+                boolean diff = false;
+                // Expect different byte[] between UTF-16LE and UTF-16BE
+                // even though encoder was previously cached by last call
+                // to getBytes().
+                for (int i = 0; i < bytes.length; i++) {
+                    if (bytes[i] != bb[i])
+                        diff = true;
+                }
+                if (!diff)
+                    throw new RuntimeException("byte arrays equal");
+            }
+        }
+
+        /* OutputStreamWriter */
+        ByteArrayOutputStream bo = new ByteArrayOutputStream();
+        OutputStreamWriter w = new OutputStreamWriter(bo, enc);
+        String outEnc = w.getEncoding();
+        w.write(str);
+        w.close();
+        bs = bo.toByteArray();
+        if (!equals(bs, bytes))
+            throw new Exception(enc + ": OutputStreamWriter failed");
+
+        System.err.println(enc + " --> " + inEnc + " / " + outEnc);
+    }
+
+
+    static void go(String enc, String str, byte[] bytes) throws Exception {
+        go(enc, str, bytes, true);
+    }
+
+
+    public static void main(String[] args) throws Exception {
+
+        go("US-ASCII", "abc", new byte[] { 'a', 'b', 'c' });
+        go("us-ascii", "abc", new byte[] { 'a', 'b', 'c' });
+        go("ISO646-US", "abc", new byte[] { 'a', 'b', 'c' });
+        go("ISO-8859-1", "ab\u00c7", new byte[] { 'a', 'b', (byte)'\u00c7' });
+        go("UTF-8", "ab\u1e09",
+           new byte[] { 'a', 'b',
+                        (byte)(0xe0 | (0x0f & (0x1e09 >> 12))),
+                        (byte)(0x80 | (0x3f & (0x1e09 >> 6))),
+                        (byte)(0x80 | (0x3f & 0x1e09)) });
+        go("UTF-16BE", "ab\u1e09",
+           new byte[] { 0, 'a', 0, 'b', 0x1e, 0x09 });
+        go("UTF-16LE", "ab\u1e09",
+           new byte[] { 'a', 0, 'b', 0, 0x09, 0x1e });
+
+        /* UTF-16 accepts both byte orders on input but always uses big-endian
+         * on output, so test all three cases
+         */
+        go("UTF-16", "ab\u1e09",
+           new byte[] { (byte)0xfe, (byte)0xff, 0, 'a', 0, 'b', 0x1e, 0x09 });
+        go("UTF-16", "ab\u1e09",
+           new byte[] { (byte)0xff, (byte)0xfe, 'a', 0, 'b', 0, 0x09, 0x1e },
+           false);
+    }
+
+}