jdk/src/share/classes/sun/reflect/UTF8.java
author sherman
Tue, 30 Aug 2011 11:53:11 -0700
changeset 10419 12c063b39232
parent 5506 202f599c92aa
child 14342 8435a30053c1
permissions -rw-r--r--
7084245: Update usages of InternalError to use exception chaining Summary: to use new InternalError constructor with cause chaining Reviewed-by: alanb, ksrini, xuelei, neugens Contributed-by: sebastian.sickelmann@gmx.de
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
2
90ce3da70b43 Initial load
duke
parents:
diff changeset
     1
/*
5506
202f599c92aa 6943119: Rebrand source copyright notices
ohair
parents: 2
diff changeset
     2
 * Copyright (c) 2001, Oracle and/or its affiliates. All rights reserved.
2
90ce3da70b43 Initial load
duke
parents:
diff changeset
     3
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
90ce3da70b43 Initial load
duke
parents:
diff changeset
     4
 *
90ce3da70b43 Initial load
duke
parents:
diff changeset
     5
 * This code is free software; you can redistribute it and/or modify it
90ce3da70b43 Initial load
duke
parents:
diff changeset
     6
 * under the terms of the GNU General Public License version 2 only, as
5506
202f599c92aa 6943119: Rebrand source copyright notices
ohair
parents: 2
diff changeset
     7
 * published by the Free Software Foundation.  Oracle designates this
2
90ce3da70b43 Initial load
duke
parents:
diff changeset
     8
 * particular file as subject to the "Classpath" exception as provided
5506
202f599c92aa 6943119: Rebrand source copyright notices
ohair
parents: 2
diff changeset
     9
 * by Oracle in the LICENSE file that accompanied this code.
2
90ce3da70b43 Initial load
duke
parents:
diff changeset
    10
 *
90ce3da70b43 Initial load
duke
parents:
diff changeset
    11
 * This code is distributed in the hope that it will be useful, but WITHOUT
90ce3da70b43 Initial load
duke
parents:
diff changeset
    12
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
90ce3da70b43 Initial load
duke
parents:
diff changeset
    13
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
90ce3da70b43 Initial load
duke
parents:
diff changeset
    14
 * version 2 for more details (a copy is included in the LICENSE file that
90ce3da70b43 Initial load
duke
parents:
diff changeset
    15
 * accompanied this code).
90ce3da70b43 Initial load
duke
parents:
diff changeset
    16
 *
90ce3da70b43 Initial load
duke
parents:
diff changeset
    17
 * You should have received a copy of the GNU General Public License version
90ce3da70b43 Initial load
duke
parents:
diff changeset
    18
 * 2 along with this work; if not, write to the Free Software Foundation,
90ce3da70b43 Initial load
duke
parents:
diff changeset
    19
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
90ce3da70b43 Initial load
duke
parents:
diff changeset
    20
 *
5506
202f599c92aa 6943119: Rebrand source copyright notices
ohair
parents: 2
diff changeset
    21
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
202f599c92aa 6943119: Rebrand source copyright notices
ohair
parents: 2
diff changeset
    22
 * or visit www.oracle.com if you need additional information or have any
202f599c92aa 6943119: Rebrand source copyright notices
ohair
parents: 2
diff changeset
    23
 * questions.
2
90ce3da70b43 Initial load
duke
parents:
diff changeset
    24
 */
90ce3da70b43 Initial load
duke
parents:
diff changeset
    25
90ce3da70b43 Initial load
duke
parents:
diff changeset
    26
package sun.reflect;
90ce3da70b43 Initial load
duke
parents:
diff changeset
    27
90ce3da70b43 Initial load
duke
parents:
diff changeset
    28
/** It is necessary to use a "bootstrap" UTF-8 encoder for encoding
    constant pool entries because the character set converters rely on
    Class.newInstance().

    <p>Every UTF-16 code unit of the input is encoded on its own:
    <ul>
    <li>U+0001..U+007F take one byte;</li>
    <li>U+0000 and U+0080..U+07FF take two bytes, so U+0000 becomes
        0xC0 0x80 and the output never contains a zero byte;</li>
    <li>every other code unit, including each half of a surrogate pair,
        takes three bytes.</li>
    </ul>
    Surrogate pairs are therefore never merged into a single four-byte
    sequence as standard UTF-8 would do.  This per-code-unit layout is the
    "modified UTF-8" form that the JVM specification describes for
    CONSTANT_Utf8_info constant pool entries. */

class UTF8 {
    // Largest code unit that is written as a single byte.
    private static final int MAX_ONE_BYTE = 0x007F;
    // Largest code unit that is written as two bytes.
    private static final int MAX_TWO_BYTE = 0x07FF;

    /** Encodes the given string, one UTF-16 code unit at a time, using the
        layout described in the class comment.

        @param str the string to encode; must not be null
        @return a newly allocated array holding exactly the encoded bytes
        @throws InternalError if the precomputed length turns out to be too
                small for the encoded output, which would indicate a bug in
                this class */
    static byte[] encode(String str) {
        int len = str.length();
        byte[] res = new byte[utf8Length(str)];
        int utf8Idx = 0;
        try {
            for (int i = 0; i < len; i++) {
                int c = str.charAt(i);
                int size = encodedSize(c);
                if (size == 1) {
                    res[utf8Idx++] = (byte) c;
                } else if (size == 2) {
                    // 110xxxxx 10xxxxxx
                    res[utf8Idx++] = (byte) (0xC0 + (c >> 6));
                    res[utf8Idx++] = (byte) (0x80 + (c & 0x3F));
                } else {
                    // 1110xxxx 10xxxxxx 10xxxxxx
                    res[utf8Idx++] = (byte) (0xE0 + (c >> 12));
                    res[utf8Idx++] = (byte) (0x80 + ((c >> 6) & 0x3F));
                    res[utf8Idx++] = (byte) (0x80 + (c & 0x3F));
                }
            }
        } catch (ArrayIndexOutOfBoundsException e) {
            // Only reachable if utf8Length() and the loop above disagree.
            throw new InternalError
                ("Bug in sun.reflect bootstrap UTF-8 encoder", e);
        }
        return res;
    }

    /** Returns the number of bytes encode() produces for the given string. */
    private static int utf8Length(String str) {
        int len = str.length();
        int utf8Len = 0;
        for (int i = 0; i < len; i++) {
            utf8Len += encodedSize(str.charAt(i));
        }
        return utf8Len;
    }

    /** Returns how many bytes (1, 2 or 3) a single UTF-16 code unit occupies
        in the encoded output.  Shared by encode() and utf8Length() so that
        the two can never disagree about the size of a code unit. */
    private static int encodedSize(int c) {
        if (c >= 0x0001 && c <= MAX_ONE_BYTE) {
            return 1;
        }
        // U+0000 deliberately falls in the two-byte group.
        if (c <= MAX_TWO_BYTE) {
            return 2;
        }
        return 3;
    }
}