jdk/test/sun/nio/cs/TestUTF8BOM.java
author ohair
Tue, 25 May 2010 15:58:33 -0700
changeset 5506 202f599c92aa
parent 796 2c3db720c065
permissions -rw-r--r--
6943119: Rebrand source copyright notices Reviewed-by: darcy, weijun
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
796
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
     1
/*
5506
202f599c92aa 6943119: Rebrand source copyright notices
ohair
parents: 796
diff changeset
     2
 * Copyright (c) 2008, Oracle and/or its affiliates. All rights reserved.
796
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
     3
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
     4
 *
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
     5
 * This code is free software; you can redistribute it and/or modify it
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
     6
 * under the terms of the GNU General Public License version 2 only, as
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
     7
 * published by the Free Software Foundation.
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
     8
 *
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
     9
 * This code is distributed in the hope that it will be useful, but WITHOUT
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    10
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    11
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    12
 * version 2 for more details (a copy is included in the LICENSE file that
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    13
 * accompanied this code).
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    14
 *
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    15
 * You should have received a copy of the GNU General Public License version
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    16
 * 2 along with this work; if not, write to the Free Software Foundation,
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    17
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    18
 *
5506
202f599c92aa 6943119: Rebrand source copyright notices
ohair
parents: 796
diff changeset
    19
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
202f599c92aa 6943119: Rebrand source copyright notices
ohair
parents: 796
diff changeset
    20
 * or visit www.oracle.com if you need additional information or have any
202f599c92aa 6943119: Rebrand source copyright notices
ohair
parents: 796
diff changeset
    21
 * questions.
796
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    22
 */
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    23
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    24
/* @test
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    25
   @bug 4508058 6378911
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    26
   @summary Check if UTF8 decoder handles BOM correctly
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    27
 */
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    28
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    29
import java.io.IOException;
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    30
import java.nio.BufferOverflowException;
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    31
import java.nio.*;
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    32
import java.nio.charset.*;
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    33
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    34
/* The fix for 6378911 is to backout the change we made for 4508058,
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    35
   so this regtest is modified accordingly to leave the beginning
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    36
   BOM untouched during decoding.
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    37
 */
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    38
public class TestUTF8BOM {
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    39
    private static ByteBuffer bf = ByteBuffer.allocateDirect(1000);
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    40
    private static void testDecode(String expected, byte[] input)
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    41
        throws Exception
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    42
    {
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    43
        String out = new String(input, "utf8");
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    44
        if (!out.equals(expected)) {
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    45
            failureReport (out, expected);
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    46
            throw new Exception("UTF_8 Decoding test failed");
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    47
        }
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    48
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    49
        //try directBuffer.
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    50
        bf.clear();
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    51
        bf.put(input).flip();
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    52
        out = Charset.forName("UTF-8")
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    53
                     .decode(bf)
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    54
                     .toString();
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    55
        if (!out.equals(expected)) {
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    56
            failureReport (out, expected);
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    57
            throw new Exception("UTF_8 Decoding test failed(directbuffer)");
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    58
        }
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    59
    }
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    60
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    61
    private static void failureReport(String testStr,
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    62
                                      String expected) {
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    63
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    64
        System.err.println ("Expected Characters:");
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    65
        for (int i = 0; i < expected.length() ; i++) {
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    66
            System.out.println("expected char[" + i + "] : " +
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    67
                              Integer.toHexString((int)expected.charAt(i)) +
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    68
                              "  obtained char[" + i + "] : " +
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    69
                              Integer.toHexString((int)testStr.charAt(i)));
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    70
        }
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    71
    }
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    72
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    73
    public static void main (String[] args) throws Exception {
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    74
            // Test 1: with BOM at beginning
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    75
            testDecode("\ufeff\u0092\u0093",
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    76
                        new byte[] { (byte) 0xef, (byte) 0xbb, (byte) 0xbf,
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    77
                                     (byte) 0xc2, (byte) 0x92,
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    78
                                     (byte) 0xc2, (byte) 0x93 });
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    79
            // Test 2: with BOM at middle
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    80
            testDecode("\u9200\ufeff\u9300",
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    81
                        new byte[] { (byte) 0xe9, (byte) 0x88, (byte) 0x80,
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    82
                                     (byte) 0xef, (byte) 0xbb, (byte) 0xbf,
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    83
                                     (byte) 0xe9, (byte) 0x8c, (byte) 0x80 });
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    84
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    85
            // Test 3: with BOM at end
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    86
            testDecode("\u9200\u9300\ufeff",
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    87
                        new byte[] { (byte) 0xe9, (byte) 0x88, (byte) 0x80,
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    88
                                     (byte) 0xe9, (byte) 0x8c, (byte) 0x80,
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    89
                                     (byte) 0xef, (byte) 0xbb, (byte) 0xbf });
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    90
            System.err.println ("\nPASSED UTF-8 decode BOM test");
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    91
   }
2c3db720c065 6675856: Open charset tests
sherman
parents:
diff changeset
    92
}