jdk/test/sun/nio/cs/TestUTF8BOM.java
author never
Mon, 12 Jul 2010 22:27:18 -0700
changeset 5926 a36f90d986b6
parent 5506 202f599c92aa
permissions -rw-r--r--
6968385: malformed xml in sweeper logging Reviewed-by: kvn

/*
 * Copyright (c) 2008, Oracle and/or its affiliates. All rights reserved.
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
 *
 * This code is free software; you can redistribute it and/or modify it
 * under the terms of the GNU General Public License version 2 only, as
 * published by the Free Software Foundation.
 *
 * This code is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
 * version 2 for more details (a copy is included in the LICENSE file that
 * accompanied this code).
 *
 * You should have received a copy of the GNU General Public License version
 * 2 along with this work; if not, write to the Free Software Foundation,
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
 *
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
 * or visit www.oracle.com if you need additional information or have any
 * questions.
 */

/* @test
   @bug 4508058 6378911
   @summary Check if UTF8 decoder handles BOM correctly
 */

import java.io.IOException;
import java.nio.BufferOverflowException;
import java.nio.*;
import java.nio.charset.*;

/* The fix for 6378911 is to backout the change we made for 4508058,
   so this regtest is modified accordingly to leave the beginning
   BOM untouched during decoding.
 */
public class TestUTF8BOM {
    private static ByteBuffer bf = ByteBuffer.allocateDirect(1000);
    private static void testDecode(String expected, byte[] input)
        throws Exception
    {
        String out = new String(input, "utf8");
        if (!out.equals(expected)) {
            failureReport (out, expected);
            throw new Exception("UTF_8 Decoding test failed");
        }

        //try directBuffer.
        bf.clear();
        bf.put(input).flip();
        out = Charset.forName("UTF-8")
                     .decode(bf)
                     .toString();
        if (!out.equals(expected)) {
            failureReport (out, expected);
            throw new Exception("UTF_8 Decoding test failed(directbuffer)");
        }
    }

    private static void failureReport(String testStr,
                                      String expected) {

        System.err.println ("Expected Characters:");
        for (int i = 0; i < expected.length() ; i++) {
            System.out.println("expected char[" + i + "] : " +
                              Integer.toHexString((int)expected.charAt(i)) +
                              "  obtained char[" + i + "] : " +
                              Integer.toHexString((int)testStr.charAt(i)));
        }
    }

    public static void main (String[] args) throws Exception {
            // Test 1: with BOM at beginning
            testDecode("\ufeff\u0092\u0093",
                        new byte[] { (byte) 0xef, (byte) 0xbb, (byte) 0xbf,
                                     (byte) 0xc2, (byte) 0x92,
                                     (byte) 0xc2, (byte) 0x93 });
            // Test 2: with BOM at middle
            testDecode("\u9200\ufeff\u9300",
                        new byte[] { (byte) 0xe9, (byte) 0x88, (byte) 0x80,
                                     (byte) 0xef, (byte) 0xbb, (byte) 0xbf,
                                     (byte) 0xe9, (byte) 0x8c, (byte) 0x80 });

            // Test 3: with BOM at end
            testDecode("\u9200\u9300\ufeff",
                        new byte[] { (byte) 0xe9, (byte) 0x88, (byte) 0x80,
                                     (byte) 0xe9, (byte) 0x8c, (byte) 0x80,
                                     (byte) 0xef, (byte) 0xbb, (byte) 0xbf });
            System.err.println ("\nPASSED UTF-8 decode BOM test");
   }
}