jdk/src/java.base/share/classes/java/lang/StringUTF16.java
author chegar
Tue, 08 Mar 2016 12:11:07 +0000
changeset 36411 f0cd8358b5ea
parent 34711 65544417508e
child 38790 b74a24c96491
permissions -rw-r--r--
8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator Reviewed-by: shade, sherman
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
33663
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
     1
/*
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
     2
 * Copyright (c) 2015, Oracle and/or its affiliates. All rights reserved.
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
     3
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
     4
 *
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
     5
 * This code is free software; you can redistribute it and/or modify it
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
     6
 * under the terms of the GNU General Public License version 2 only, as
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
     7
 * published by the Free Software Foundation.  Oracle designates this
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
     8
 * particular file as subject to the "Classpath" exception as provided
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
     9
 * by Oracle in the LICENSE file that accompanied this code.
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    10
 *
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    11
 * This code is distributed in the hope that it will be useful, but WITHOUT
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    12
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    13
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    14
 * version 2 for more details (a copy is included in the LICENSE file that
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    15
 * accompanied this code).
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    16
 *
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    17
 * You should have received a copy of the GNU General Public License version
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    18
 * 2 along with this work; if not, write to the Free Software Foundation,
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    19
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    20
 *
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    21
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    22
 * or visit www.oracle.com if you need additional information or have any
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    23
 * questions.
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    24
 */
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    25
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    26
package java.lang;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    27
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    28
import java.util.Arrays;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    29
import java.util.Locale;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    30
import java.util.Spliterator;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    31
import java.util.function.IntConsumer;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    32
import jdk.internal.HotSpotIntrinsicCandidate;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    33
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    34
import static java.lang.String.UTF16;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    35
import static java.lang.String.LATIN1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    36
import static java.lang.String.checkIndex;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    37
import static java.lang.String.checkOffset;
34517
c6e795a80c80 8142303: C2 compilation fails with "bad AD file"
thartmann
parents: 33663
diff changeset
    38
import static java.lang.String.checkBoundsOffCount;
33663
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    39
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    40
final class StringUTF16 {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    41
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    42
    public static byte[] newBytesFor(int len) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    43
        if (len < 0) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    44
            throw new NegativeArraySizeException();
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    45
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    46
        if (len > MAX_LENGTH) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    47
            throw new OutOfMemoryError("UTF16 String size is " + len +
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    48
                                       ", should be less than " + MAX_LENGTH);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    49
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    50
        return new byte[len << 1];
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    51
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    52
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    53
    @HotSpotIntrinsicCandidate
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    54
    public static void putChar(byte[] val, int index, int c) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    55
        index <<= 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    56
        val[index++] = (byte)(c >> HI_BYTE_SHIFT);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    57
        val[index]   = (byte)(c >> LO_BYTE_SHIFT);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    58
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    59
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    60
    @HotSpotIntrinsicCandidate
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    61
    public static char getChar(byte[] val, int index) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    62
        index <<= 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    63
        return (char)(((val[index++] & 0xff) << HI_BYTE_SHIFT) |
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    64
                      ((val[index]   & 0xff) << LO_BYTE_SHIFT));
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    65
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    66
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    67
    public static char charAt(byte[] value, int index) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    68
        if (index < 0 || index >= value.length >> 1) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    69
            throw new StringIndexOutOfBoundsException(index);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    70
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    71
        return getChar(value, index);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    72
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    73
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    74
    public static int length(byte[] value) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    75
        return value.length >> 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    76
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    77
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    78
    public static int codePointAt(byte[] value, int index, int end) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    79
        char c1 = getChar(value, index);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    80
        if (Character.isHighSurrogate(c1) && ++index < end) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    81
            char c2 = getChar(value, index);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    82
            if (Character.isLowSurrogate(c2)) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    83
               return Character.toCodePoint(c1, c2);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    84
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    85
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    86
        return c1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    87
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    88
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    89
    public static int codePointBefore(byte[] value, int index) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    90
        char c2 = getChar(value, --index);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    91
        if (Character.isLowSurrogate(c2) && index > 0) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    92
            char c1 = getChar(value, --index);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    93
            if (Character.isHighSurrogate(c1)) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    94
               return Character.toCodePoint(c1, c2);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    95
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    96
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    97
        return c2;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    98
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    99
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   100
    public static int codePointCount(byte[] value, int beginIndex, int endIndex) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   101
        int count = endIndex - beginIndex;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   102
        for (int i = beginIndex; i < endIndex; ) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   103
            if (Character.isHighSurrogate(getChar(value, i++)) &&
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   104
                i < endIndex &&
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   105
                Character.isLowSurrogate(getChar(value, i))) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   106
                count--;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   107
                i++;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   108
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   109
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   110
        return count;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   111
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   112
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   113
    public static char[] toChars(byte[] value) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   114
        char[] dst = new char[value.length >> 1];
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   115
        getChars(value, 0, dst.length, dst, 0);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   116
        return dst;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   117
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   118
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   119
    @HotSpotIntrinsicCandidate
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   120
    public static byte[] toBytes(char[] value, int off, int len) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   121
        byte[] val = newBytesFor(len);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   122
        for (int i = 0; i < len; i++) {
34711
65544417508e 8145428: Optimize StringUTF16 compress/copy methods for C1
shade
parents: 34517
diff changeset
   123
            putChar(val, i, value[off]);
65544417508e 8145428: Optimize StringUTF16 compress/copy methods for C1
shade
parents: 34517
diff changeset
   124
            off++;
33663
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   125
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   126
        return val;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   127
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   128
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   129
    public static byte[] compress(char[] val, int off, int len) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   130
        byte[] ret = new byte[len];
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   131
        if (compress(val, off, ret, 0, len) == len) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   132
            return ret;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   133
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   134
        return null;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   135
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   136
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   137
    public static byte[] compress(byte[] val, int off, int len) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   138
        byte[] ret = new byte[len];
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   139
        if (compress(val, off, ret, 0, len) == len) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   140
            return ret;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   141
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   142
        return null;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   143
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   144
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   145
    // compressedCopy char[] -> byte[]
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   146
    @HotSpotIntrinsicCandidate
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   147
    private static int compress(char[] src, int srcOff, byte[] dst, int dstOff, int len) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   148
        for (int i = 0; i < len; i++) {
34711
65544417508e 8145428: Optimize StringUTF16 compress/copy methods for C1
shade
parents: 34517
diff changeset
   149
            char c = src[srcOff];
65544417508e 8145428: Optimize StringUTF16 compress/copy methods for C1
shade
parents: 34517
diff changeset
   150
            if (c > 0xFF) {
65544417508e 8145428: Optimize StringUTF16 compress/copy methods for C1
shade
parents: 34517
diff changeset
   151
                len = 0;
65544417508e 8145428: Optimize StringUTF16 compress/copy methods for C1
shade
parents: 34517
diff changeset
   152
                break;
33663
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   153
            }
34711
65544417508e 8145428: Optimize StringUTF16 compress/copy methods for C1
shade
parents: 34517
diff changeset
   154
            dst[dstOff] = (byte)c;
65544417508e 8145428: Optimize StringUTF16 compress/copy methods for C1
shade
parents: 34517
diff changeset
   155
            srcOff++;
65544417508e 8145428: Optimize StringUTF16 compress/copy methods for C1
shade
parents: 34517
diff changeset
   156
            dstOff++;
33663
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   157
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   158
        return len;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   159
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   160
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   161
    // compressedCopy byte[] -> byte[]
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   162
    @HotSpotIntrinsicCandidate
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   163
    public static int compress(byte[] src, int srcOff, byte[] dst, int dstOff, int len) {
34517
c6e795a80c80 8142303: C2 compilation fails with "bad AD file"
thartmann
parents: 33663
diff changeset
   164
        // We need a range check here because 'getChar' has no checks
c6e795a80c80 8142303: C2 compilation fails with "bad AD file"
thartmann
parents: 33663
diff changeset
   165
        checkBoundsOffCount(srcOff, len, src.length);
33663
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   166
        for (int i = 0; i < len; i++) {
34711
65544417508e 8145428: Optimize StringUTF16 compress/copy methods for C1
shade
parents: 34517
diff changeset
   167
            char c = getChar(src, srcOff);
65544417508e 8145428: Optimize StringUTF16 compress/copy methods for C1
shade
parents: 34517
diff changeset
   168
            if (c > 0xFF) {
65544417508e 8145428: Optimize StringUTF16 compress/copy methods for C1
shade
parents: 34517
diff changeset
   169
                len = 0;
65544417508e 8145428: Optimize StringUTF16 compress/copy methods for C1
shade
parents: 34517
diff changeset
   170
                break;
33663
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   171
            }
34711
65544417508e 8145428: Optimize StringUTF16 compress/copy methods for C1
shade
parents: 34517
diff changeset
   172
            dst[dstOff] = (byte)c;
65544417508e 8145428: Optimize StringUTF16 compress/copy methods for C1
shade
parents: 34517
diff changeset
   173
            srcOff++;
65544417508e 8145428: Optimize StringUTF16 compress/copy methods for C1
shade
parents: 34517
diff changeset
   174
            dstOff++;
33663
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   175
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   176
        return len;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   177
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   178
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   179
    public static byte[] toBytes(int[] val, int index, int len) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   180
        final int end = index + len;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   181
        // Pass 1: Compute precise size of char[]
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   182
        int n = len;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   183
        for (int i = index; i < end; i++) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   184
            int cp = val[i];
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   185
            if (Character.isBmpCodePoint(cp))
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   186
                continue;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   187
            else if (Character.isValidCodePoint(cp))
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   188
                n++;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   189
            else throw new IllegalArgumentException(Integer.toString(cp));
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   190
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   191
        // Pass 2: Allocate and fill in <high, low> pair
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   192
        byte[] buf = newBytesFor(n);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   193
        for (int i = index, j = 0; i < end; i++, j++) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   194
            int cp = val[i];
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   195
            if (Character.isBmpCodePoint(cp)) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   196
                putChar(buf, j, cp);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   197
            } else {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   198
                putChar(buf, j++, Character.highSurrogate(cp));
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   199
                putChar(buf, j, Character.lowSurrogate(cp));
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   200
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   201
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   202
        return buf;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   203
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   204
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   205
    public static byte[] toBytes(char c) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   206
        byte[] result = new byte[2];
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   207
        putChar(result, 0, c);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   208
        return result;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   209
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   210
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   211
    @HotSpotIntrinsicCandidate
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   212
    public static void getChars(byte[] value, int srcBegin, int srcEnd, char dst[], int dstBegin) {
34517
c6e795a80c80 8142303: C2 compilation fails with "bad AD file"
thartmann
parents: 33663
diff changeset
   213
        // We need a range check here because 'getChar' has no checks
c6e795a80c80 8142303: C2 compilation fails with "bad AD file"
thartmann
parents: 33663
diff changeset
   214
        checkBoundsOffCount(srcBegin, srcEnd - srcBegin, value.length);
33663
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   215
        for (int i = srcBegin; i < srcEnd; i++) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   216
            dst[dstBegin++] = getChar(value, i);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   217
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   218
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   219
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   220
    /* @see java.lang.String.getBytes(int, int, byte[], int) */
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   221
    public static void getBytes(byte[] value, int srcBegin, int srcEnd, byte dst[], int dstBegin) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   222
        srcBegin <<= 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   223
        srcEnd <<= 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   224
        for (int i = srcBegin + (1 >> LO_BYTE_SHIFT); i < srcEnd; i += 2) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   225
            dst[dstBegin++] = value[i];
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   226
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   227
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   228
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   229
    @HotSpotIntrinsicCandidate
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   230
    public static boolean equals(byte[] value, byte[] other) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   231
        if (value.length == other.length) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   232
            int len = value.length >> 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   233
            for (int i = 0; i < len; i++) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   234
                if (getChar(value, i) != getChar(other, i)) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   235
                    return false;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   236
                }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   237
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   238
            return true;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   239
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   240
        return false;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   241
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   242
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   243
    @HotSpotIntrinsicCandidate
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   244
    public static int compareTo(byte[] value, byte[] other) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   245
        int len1 = length(value);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   246
        int len2 = length(other);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   247
        int lim = Math.min(len1, len2);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   248
        for (int k = 0; k < lim; k++) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   249
            char c1 = getChar(value, k);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   250
            char c2 = getChar(other, k);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   251
            if (c1 != c2) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   252
                return c1 - c2;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   253
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   254
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   255
        return len1 - len2;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   256
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   257
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   258
    @HotSpotIntrinsicCandidate
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   259
    public static int compareToLatin1(byte[] value, byte[] other) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   260
        int len1 = length(value);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   261
        int len2 = StringLatin1.length(other);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   262
        int lim = Math.min(len1, len2);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   263
        for (int k = 0; k < lim; k++) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   264
            char c1 = getChar(value, k);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   265
            char c2 = StringLatin1.getChar(other, k);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   266
            if (c1 != c2) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   267
                return c1 - c2;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   268
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   269
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   270
        return len1 - len2;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   271
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   272
36411
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   273
    public static int compareToCI(byte[] value, byte[] other) {
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   274
        int len1 = length(value);
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   275
        int len2 = length(other);
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   276
        int lim = Math.min(len1, len2);
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   277
        for (int k = 0; k < lim; k++) {
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   278
            char c1 = getChar(value, k);
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   279
            char c2 = getChar(other, k);
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   280
            if (c1 != c2) {
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   281
                c1 = Character.toUpperCase(c1);
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   282
                c2 = Character.toUpperCase(c2);
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   283
                if (c1 != c2) {
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   284
                    c1 = Character.toLowerCase(c1);
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   285
                    c2 = Character.toLowerCase(c2);
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   286
                    if (c1 != c2) {
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   287
                        return c1 - c2;
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   288
                    }
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   289
                }
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   290
            }
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   291
        }
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   292
        return len1 - len2;
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   293
    }
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   294
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   295
    public static int compareToCI_Latin1(byte[] value, byte[] other) {
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   296
        int len1 = length(value);
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   297
        int len2 = StringLatin1.length(other);
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   298
        int lim = Math.min(len1, len2);
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   299
        for (int k = 0; k < lim; k++) {
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   300
            char c1 = getChar(value, k);
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   301
            char c2 = StringLatin1.getChar(other, k);
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   302
            if (c1 != c2) {
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   303
                c1 = Character.toUpperCase(c1);
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   304
                c2 = Character.toUpperCase(c2);
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   305
                if (c1 != c2) {
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   306
                    c1 = Character.toLowerCase(c1);
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   307
                    c2 = Character.toLowerCase(c2);
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   308
                    if (c1 != c2) {
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   309
                        return c1 - c2;
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   310
                    }
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   311
                }
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   312
            }
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   313
        }
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   314
        return len1 - len2;
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   315
    }
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   316
33663
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   317
    public static int hashCode(byte[] value) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   318
        int h = 0;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   319
        int length = value.length >> 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   320
        for (int i = 0; i < length; i++) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   321
            h = 31 * h + getChar(value, i);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   322
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   323
        return h;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   324
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   325
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   326
    public static int indexOf(byte[] value, int ch, int fromIndex) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   327
        int max = value.length >> 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   328
        if (fromIndex < 0) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   329
            fromIndex = 0;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   330
        } else if (fromIndex >= max) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   331
            // Note: fromIndex might be near -1>>>1.
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   332
            return -1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   333
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   334
        if (ch < Character.MIN_SUPPLEMENTARY_CODE_POINT) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   335
            // handle most cases here (ch is a BMP code point or a
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   336
            // negative value (invalid code point))
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   337
            return indexOfChar(value, ch, fromIndex, max);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   338
        } else {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   339
            return indexOfSupplementary(value, ch, fromIndex, max);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   340
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   341
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   342
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   343
    @HotSpotIntrinsicCandidate
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   344
    public static int indexOf(byte[] value, byte[] str) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   345
        if (str.length == 0) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   346
            return 0;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   347
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   348
        if (value.length == 0) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   349
            return -1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   350
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   351
        return indexOf(value, length(value), str, length(str), 0);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   352
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   353
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   354
    @HotSpotIntrinsicCandidate
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   355
    public static int indexOf(byte[] value, int valueCount, byte[] str, int strCount, int fromIndex) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   356
        char first = getChar(str, 0);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   357
        int max = (valueCount - strCount);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   358
        for (int i = fromIndex; i <= max; i++) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   359
            // Look for first character.
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   360
            if (getChar(value, i) != first) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   361
                while (++i <= max && getChar(value, i) != first);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   362
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   363
            // Found first character, now look at the rest of value
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   364
            if (i <= max) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   365
                int j = i + 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   366
                int end = j + strCount - 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   367
                for (int k = 1; j < end && getChar(value, j) == getChar(str, k); j++, k++);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   368
                if (j == end) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   369
                    // Found whole string.
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   370
                    return i;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   371
                }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   372
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   373
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   374
        return -1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   375
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   376
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   377
    /**
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   378
     * Handles indexOf Latin1 substring in UTF16 string.
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   379
     */
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   380
    @HotSpotIntrinsicCandidate
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   381
    public static int indexOfLatin1(byte[] value, byte[] str) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   382
        if (str.length == 0) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   383
            return 0;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   384
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   385
        if (value.length == 0) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   386
            return -1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   387
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   388
        return indexOfLatin1(value, length(value), str, str.length, 0);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   389
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   390
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   391
    @HotSpotIntrinsicCandidate
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   392
    public static int indexOfLatin1(byte[] src, int srcCount, byte[] tgt, int tgtCount, int fromIndex) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   393
        char first = (char)(tgt[0] & 0xff);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   394
        int max = (srcCount - tgtCount);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   395
        for (int i = fromIndex; i <= max; i++) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   396
            // Look for first character.
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   397
            if (getChar(src, i) != first) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   398
                while (++i <= max && getChar(src, i) != first);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   399
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   400
            // Found first character, now look at the rest of v2
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   401
            if (i <= max) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   402
                int j = i + 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   403
                int end = j + tgtCount - 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   404
                for (int k = 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   405
                     j < end && getChar(src, j) == (tgt[k] & 0xff);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   406
                     j++, k++);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   407
                if (j == end) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   408
                    // Found whole string.
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   409
                    return i;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   410
                }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   411
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   412
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   413
        return -1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   414
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   415
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   416
    @HotSpotIntrinsicCandidate
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   417
    private static int indexOfChar(byte[] value, int ch, int fromIndex, int max) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   418
        for (int i = fromIndex; i < max; i++) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   419
            if (getChar(value, i) == ch) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   420
                return i;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   421
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   422
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   423
        return -1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   424
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   425
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   426
    /**
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   427
     * Handles (rare) calls of indexOf with a supplementary character.
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   428
     */
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   429
    private static int indexOfSupplementary(byte[] value, int ch, int fromIndex, int max) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   430
        if (Character.isValidCodePoint(ch)) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   431
            final char hi = Character.highSurrogate(ch);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   432
            final char lo = Character.lowSurrogate(ch);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   433
            for (int i = fromIndex; i < max - 1; i++) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   434
                if (getChar(value, i) == hi && getChar(value, i + 1 ) == lo) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   435
                    return i;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   436
                }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   437
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   438
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   439
        return -1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   440
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   441
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   442
    public static int lastIndexOf(byte[] src, int srcCount,
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   443
                                  byte[] tgt, int tgtCount, int fromIndex) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   444
        int min = tgtCount - 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   445
        int i = min + fromIndex;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   446
        int strLastIndex = tgtCount - 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   447
        char strLastChar = getChar(tgt, strLastIndex);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   448
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   449
    startSearchForLastChar:
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   450
        while (true) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   451
            while (i >= min && getChar(src, i) != strLastChar) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   452
                i--;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   453
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   454
            if (i < min) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   455
                return -1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   456
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   457
            int j = i - 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   458
            int start = j - strLastIndex;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   459
            int k = strLastIndex - 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   460
            while (j > start) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   461
                if (getChar(src, j--) != getChar(tgt, k--)) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   462
                    i--;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   463
                    continue startSearchForLastChar;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   464
                }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   465
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   466
            return start + 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   467
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   468
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   469
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   470
    public static int lastIndexOf(byte[] value, int ch, int fromIndex) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   471
        if (ch < Character.MIN_SUPPLEMENTARY_CODE_POINT) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   472
            // handle most cases here (ch is a BMP code point or a
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   473
            // negative value (invalid code point))
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   474
            int i = Math.min(fromIndex, (value.length >> 1) - 1);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   475
            for (; i >= 0; i--) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   476
                if (getChar(value, i) == ch) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   477
                    return i;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   478
                }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   479
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   480
            return -1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   481
        } else {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   482
            return lastIndexOfSupplementary(value, ch, fromIndex);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   483
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   484
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   485
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   486
    /**
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   487
     * Handles (rare) calls of lastIndexOf with a supplementary character.
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   488
     */
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   489
    private static int lastIndexOfSupplementary(final byte[] value, int ch, int fromIndex) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   490
        if (Character.isValidCodePoint(ch)) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   491
            char hi = Character.highSurrogate(ch);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   492
            char lo = Character.lowSurrogate(ch);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   493
            int i = Math.min(fromIndex, (value.length >> 1) - 2);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   494
            for (; i >= 0; i--) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   495
                if (getChar(value, i) == hi && getChar(value, i + 1) == lo) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   496
                    return i;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   497
                }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   498
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   499
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   500
        return -1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   501
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   502
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   503
    public static String replace(byte[] value, char oldChar, char newChar) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   504
        int len = value.length >> 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   505
        int i = -1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   506
        while (++i < len) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   507
            if (getChar(value, i) == oldChar) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   508
                break;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   509
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   510
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   511
        if (i < len) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   512
            byte buf[] = new byte[value.length];
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   513
            for (int j = 0; j < i; j++) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   514
                putChar(buf, j, getChar(value, j)); // TBD:arraycopy?
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   515
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   516
            while (i < len) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   517
                char c = getChar(value, i);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   518
                putChar(buf, i, c == oldChar ? newChar : c);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   519
                i++;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   520
           }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   521
           // Check if we should try to compress to latin1
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   522
           if (String.COMPACT_STRINGS &&
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   523
               !StringLatin1.canEncode(oldChar) &&
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   524
               StringLatin1.canEncode(newChar)) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   525
               byte[] val = compress(buf, 0, len);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   526
               if (val != null) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   527
                   return new String(val, LATIN1);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   528
               }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   529
           }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   530
           return new String(buf, UTF16);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   531
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   532
        return null;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   533
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   534
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   535
    public static boolean regionMatchesCI(byte[] value, int toffset,
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   536
                                          byte[] other, int ooffset, int len) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   537
        int last = toffset + len;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   538
        while (toffset < last) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   539
            char c1 = getChar(value, toffset++);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   540
            char c2 = getChar(other, ooffset++);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   541
            if (c1 == c2) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   542
                continue;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   543
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   544
            // try converting both characters to uppercase.
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   545
            // If the results match, then the comparison scan should
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   546
            // continue.
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   547
            char u1 = Character.toUpperCase(c1);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   548
            char u2 = Character.toUpperCase(c2);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   549
            if (u1 == u2) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   550
                continue;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   551
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   552
            // Unfortunately, conversion to uppercase does not work properly
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   553
            // for the Georgian alphabet, which has strange rules about case
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   554
            // conversion.  So we need to make one last check before
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   555
            // exiting.
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   556
            if (Character.toLowerCase(u1) == Character.toLowerCase(u2)) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   557
                continue;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   558
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   559
            return false;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   560
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   561
        return true;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   562
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   563
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   564
    public static boolean regionMatchesCI_Latin1(byte[] value, int toffset,
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   565
                                                 byte[] other, int ooffset,
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   566
                                                 int len) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   567
        int last = toffset + len;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   568
        while (toffset < last) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   569
            char c1 = getChar(value, toffset++);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   570
            char c2 = (char)(other[ooffset++] & 0xff);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   571
            if (c1 == c2) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   572
                continue;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   573
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   574
            char u1 = Character.toUpperCase(c1);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   575
            char u2 = Character.toUpperCase(c2);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   576
            if (u1 == u2) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   577
                continue;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   578
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   579
            if (Character.toLowerCase(u1) == Character.toLowerCase(u2)) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   580
                continue;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   581
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   582
            return false;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   583
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   584
        return true;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   585
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   586
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   587
    public static String toLowerCase(String str, byte[] value, Locale locale) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   588
        if (locale == null) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   589
            throw new NullPointerException();
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   590
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   591
        int first;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   592
        boolean hasSurr = false;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   593
        final int len = value.length >> 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   594
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   595
        // Now check if there are any characters that need to be changed, or are surrogate
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   596
        for (first = 0 ; first < len; first++) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   597
            int cp = (int)getChar(value, first);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   598
            if (Character.isSurrogate((char)cp)) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   599
                hasSurr = true;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   600
                break;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   601
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   602
            if (cp != Character.toLowerCase(cp)) {  // no need to check Character.ERROR
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   603
                break;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   604
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   605
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   606
        if (first == len)
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   607
            return str;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   608
        byte[] result = new byte[value.length];
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   609
        System.arraycopy(value, 0, result, 0, first << 1);  // Just copy the first few
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   610
                                                            // lowerCase characters.
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   611
        String lang = locale.getLanguage();
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   612
        if (lang == "tr" || lang == "az" || lang == "lt") {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   613
            return toLowerCaseEx(str, value, result, first, locale, true);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   614
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   615
        if (hasSurr) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   616
            return toLowerCaseEx(str, value, result, first, locale, false);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   617
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   618
        int bits = 0;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   619
        for (int i = first; i < len; i++) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   620
            int cp = (int)getChar(value, i);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   621
            if (cp == '\u03A3' ||                       // GREEK CAPITAL LETTER SIGMA
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   622
                Character.isSurrogate((char)cp)) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   623
                return toLowerCaseEx(str, value, result, i, locale, false);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   624
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   625
            if (cp == '\u0130') {                       // LATIN CAPITAL LETTER I WITH DOT ABOVE
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   626
                return toLowerCaseEx(str, value, result, i, locale, true);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   627
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   628
            cp = Character.toLowerCase(cp);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   629
            if (!Character.isBmpCodePoint(cp)) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   630
                return toLowerCaseEx(str, value, result, i, locale, false);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   631
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   632
            bits |= cp;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   633
            putChar(result, i, cp);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   634
        }
34711
65544417508e 8145428: Optimize StringUTF16 compress/copy methods for C1
shade
parents: 34517
diff changeset
   635
        if (bits > 0xFF) {
33663
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   636
            return new String(result, UTF16);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   637
        } else {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   638
            return newString(result, 0, len);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   639
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   640
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   641
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   642
    private static String toLowerCaseEx(String str, byte[] value,
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   643
                                        byte[] result, int first, Locale locale,
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   644
                                        boolean localeDependent) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   645
        int resultOffset = first;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   646
        int length = value.length >> 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   647
        int srcCount;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   648
        for (int i = first; i < length; i += srcCount) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   649
            int srcChar = getChar(value, i);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   650
            int lowerChar;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   651
            char[] lowerCharArray;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   652
            srcCount = 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   653
            if (Character.isSurrogate((char)srcChar)) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   654
                srcChar = codePointAt(value, i, length);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   655
                srcCount = Character.charCount(srcChar);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   656
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   657
            if (localeDependent ||
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   658
                srcChar == '\u03A3' ||  // GREEK CAPITAL LETTER SIGMA
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   659
                srcChar == '\u0130') {  // LATIN CAPITAL LETTER I WITH DOT ABOVE
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   660
                lowerChar = ConditionalSpecialCasing.toLowerCaseEx(str, i, locale);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   661
            } else {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   662
                lowerChar = Character.toLowerCase(srcChar);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   663
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   664
            if (Character.isBmpCodePoint(lowerChar)) {    // Character.ERROR is not a bmp
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   665
                putChar(result, resultOffset++, lowerChar);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   666
            } else {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   667
                if (lowerChar == Character.ERROR) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   668
                    lowerCharArray = ConditionalSpecialCasing.toLowerCaseCharArray(str, i, locale);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   669
                } else {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   670
                    lowerCharArray = Character.toChars(lowerChar);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   671
                }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   672
                /* Grow result if needed */
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   673
                int mapLen = lowerCharArray.length;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   674
                if (mapLen > srcCount) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   675
                    byte[] result2 = newBytesFor((result.length >> 1) + mapLen - srcCount);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   676
                    System.arraycopy(result, 0, result2, 0, resultOffset << 1);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   677
                    result = result2;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   678
                }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   679
                for (int x = 0; x < mapLen; ++x) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   680
                    putChar(result, resultOffset++, lowerCharArray[x]);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   681
                }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   682
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   683
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   684
        return newString(result, 0, resultOffset);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   685
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   686
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   687
    public static String toUpperCase(String str, byte[] value, Locale locale) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   688
        if (locale == null) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   689
            throw new NullPointerException();
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   690
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   691
        int first;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   692
        boolean hasSurr = false;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   693
        final int len = value.length >> 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   694
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   695
        // Now check if there are any characters that need to be changed, or are surrogate
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   696
        for (first = 0 ; first < len; first++) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   697
            int cp = (int)getChar(value, first);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   698
            if (Character.isSurrogate((char)cp)) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   699
                hasSurr = true;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   700
                break;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   701
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   702
            if (cp != Character.toUpperCaseEx(cp)) {   // no need to check Character.ERROR
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   703
                break;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   704
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   705
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   706
        if (first == len) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   707
            return str;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   708
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   709
        byte[] result = new byte[value.length];
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   710
        System.arraycopy(value, 0, result, 0, first << 1); // Just copy the first few
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   711
                                                           // upperCase characters.
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   712
        String lang = locale.getLanguage();
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   713
        if (lang == "tr" || lang == "az" || lang == "lt") {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   714
            return toUpperCaseEx(str, value, result, first, locale, true);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   715
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   716
        if (hasSurr) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   717
            return toUpperCaseEx(str, value, result, first, locale, false);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   718
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   719
        int bits = 0;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   720
        for (int i = first; i < len; i++) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   721
            int cp = (int)getChar(value, i);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   722
            if (Character.isSurrogate((char)cp)) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   723
                return toUpperCaseEx(str, value, result, i, locale, false);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   724
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   725
            cp = Character.toUpperCaseEx(cp);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   726
            if (!Character.isBmpCodePoint(cp)) {    // Character.ERROR is not bmp
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   727
                return toUpperCaseEx(str, value, result, i, locale, false);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   728
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   729
            bits |= cp;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   730
            putChar(result, i, cp);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   731
        }
34711
65544417508e 8145428: Optimize StringUTF16 compress/copy methods for C1
shade
parents: 34517
diff changeset
   732
        if (bits > 0xFF) {
33663
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   733
            return new String(result, UTF16);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   734
        } else {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   735
            return newString(result, 0, len);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   736
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   737
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   738
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   739
    private static String toUpperCaseEx(String str, byte[] value,
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   740
                                        byte[] result, int first,
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   741
                                        Locale locale, boolean localeDependent)
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   742
    {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   743
        int resultOffset = first;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   744
        int length = value.length >> 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   745
        int srcCount;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   746
        for (int i = first; i < length; i += srcCount) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   747
            int srcChar = getChar(value, i);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   748
            int upperChar;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   749
            char[] upperCharArray;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   750
            srcCount = 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   751
            if (Character.isSurrogate((char)srcChar)) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   752
                srcChar = codePointAt(value, i, length);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   753
                srcCount = Character.charCount(srcChar);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   754
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   755
            if (localeDependent) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   756
                upperChar = ConditionalSpecialCasing.toUpperCaseEx(str, i, locale);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   757
            } else {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   758
                upperChar = Character.toUpperCaseEx(srcChar);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   759
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   760
            if (Character.isBmpCodePoint(upperChar)) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   761
                putChar(result, resultOffset++, upperChar);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   762
            } else {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   763
                if (upperChar == Character.ERROR) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   764
                    if (localeDependent) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   765
                        upperCharArray =
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   766
                            ConditionalSpecialCasing.toUpperCaseCharArray(str, i, locale);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   767
                    } else {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   768
                        upperCharArray = Character.toUpperCaseCharArray(srcChar);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   769
                    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   770
                } else {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   771
                    upperCharArray = Character.toChars(upperChar);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   772
                }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   773
                /* Grow result if needed */
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   774
                int mapLen = upperCharArray.length;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   775
                if (mapLen > srcCount) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   776
                    byte[] result2 = newBytesFor((result.length >> 1) + mapLen - srcCount);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   777
                    System.arraycopy(result, 0, result2, 0, resultOffset << 1);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   778
                    result = result2;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   779
                 }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   780
                 for (int x = 0; x < mapLen; ++x) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   781
                    putChar(result, resultOffset++, upperCharArray[x]);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   782
                 }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   783
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   784
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   785
        return newString(result, 0, resultOffset);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   786
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   787
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   788
    public static String trim(byte[] value) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   789
        int length = value.length >> 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   790
        int len = length;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   791
        int st = 0;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   792
        while (st < len && getChar(value, st) <= ' ') {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   793
            st++;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   794
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   795
        while (st < len && getChar(value, len - 1) <= ' ') {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   796
            len--;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   797
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   798
        return ((st > 0) || (len < length )) ?
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   799
            new String(Arrays.copyOfRange(value, st << 1, len << 1), UTF16) :
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   800
            null;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   801
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   802
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   803
    public static void putChars(byte[] val, int index, char[] str, int off, int end) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   804
        while (off < end) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   805
            putChar(val, index++, str[off++]);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   806
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   807
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   808
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   809
    public static String newString(byte[] val, int index, int len) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   810
        if (String.COMPACT_STRINGS) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   811
            byte[] buf = compress(val, index, len);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   812
            if (buf != null) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   813
                return new String(buf, LATIN1);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   814
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   815
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   816
        int last = index + len;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   817
        return new String(Arrays.copyOfRange(val, index << 1, last << 1), UTF16);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   818
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   819
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   820
    public static void fillNull(byte[] val, int index, int end) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   821
        Arrays.fill(val, index << 1, end << 1, (byte)0);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   822
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   823
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   824
    static class CharsSpliterator implements Spliterator.OfInt {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   825
        private final byte[] array;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   826
        private int index;        // current index, modified on advance/split
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   827
        private final int fence;  // one past last index
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   828
        private final int cs;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   829
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   830
        CharsSpliterator(byte[] array, int acs) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   831
            this(array, 0, array.length >> 1, acs);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   832
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   833
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   834
        CharsSpliterator(byte[] array, int origin, int fence, int acs) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   835
            this.array = array;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   836
            this.index = origin;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   837
            this.fence = fence;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   838
            this.cs = acs | Spliterator.ORDERED | Spliterator.SIZED
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   839
                      | Spliterator.SUBSIZED;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   840
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   841
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   842
        @Override
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   843
        public OfInt trySplit() {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   844
            int lo = index, mid = (lo + fence) >>> 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   845
            return (lo >= mid)
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   846
                   ? null
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   847
                   : new CharsSpliterator(array, lo, index = mid, cs);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   848
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   849
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   850
        @Override
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   851
        public void forEachRemaining(IntConsumer action) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   852
            byte[] a; int i, hi; // hoist accesses and checks from loop
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   853
            if (action == null)
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   854
                throw new NullPointerException();
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   855
            if (((a = array).length >> 1) >= (hi = fence) &&
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   856
                (i = index) >= 0 && i < (index = hi)) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   857
                do { action.accept(getChar(a, i)); } while (++i < hi);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   858
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   859
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   860
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   861
        @Override
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   862
        public boolean tryAdvance(IntConsumer action) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   863
            if (action == null)
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   864
                throw new NullPointerException();
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   865
            if (index >= 0 && index < fence) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   866
                action.accept(getChar(array, index++));
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   867
                return true;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   868
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   869
            return false;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   870
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   871
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   872
        @Override
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   873
        public long estimateSize() { return (long)(fence - index); }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   874
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   875
        @Override
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   876
        public int characteristics() {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   877
            return cs;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   878
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   879
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   880
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   881
    static class CodePointsSpliterator implements Spliterator.OfInt {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   882
        private final byte[] array;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   883
        private int index;        // current index, modified on advance/split
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   884
        private final int fence;  // one past last index
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   885
        private final int cs;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   886
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   887
        CodePointsSpliterator(byte[] array, int acs) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   888
            this(array, 0, array.length >> 1, acs);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   889
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   890
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   891
        CodePointsSpliterator(byte[] array, int origin, int fence, int acs) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   892
            this.array = array;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   893
            this.index = origin;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   894
            this.fence = fence;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   895
            this.cs = acs | Spliterator.ORDERED;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   896
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   897
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   898
        @Override
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   899
        public OfInt trySplit() {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   900
            int lo = index, mid = (lo + fence) >>> 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   901
            if (lo >= mid)
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   902
                return null;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   903
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   904
            int midOneLess;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   905
            // If the mid-point intersects a surrogate pair
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   906
            if (Character.isLowSurrogate(getChar(array, mid)) &&
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   907
                Character.isHighSurrogate(getChar(array, midOneLess = (mid -1)))) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   908
                // If there is only one pair it cannot be split
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   909
                if (lo >= midOneLess)
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   910
                    return null;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   911
                // Shift the mid-point to align with the surrogate pair
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   912
                return new CodePointsSpliterator(array, lo, index = midOneLess, cs);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   913
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   914
            return new CodePointsSpliterator(array, lo, index = mid, cs);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   915
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   916
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   917
        @Override
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   918
        public void forEachRemaining(IntConsumer action) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   919
            byte[] a; int i, hi; // hoist accesses and checks from loop
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   920
            if (action == null)
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   921
                throw new NullPointerException();
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   922
            if (((a = array).length >> 1) >= (hi = fence) &&
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   923
                (i = index) >= 0 && i < (index = hi)) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   924
                do {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   925
                    i = advance(a, i, hi, action);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   926
                } while (i < hi);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   927
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   928
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   929
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   930
        @Override
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   931
        public boolean tryAdvance(IntConsumer action) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   932
            if (action == null)
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   933
                throw new NullPointerException();
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   934
            if (index >= 0 && index < fence) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   935
                index = advance(array, index, fence, action);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   936
                return true;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   937
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   938
            return false;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   939
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   940
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   941
        // Advance one code point from the index, i, and return the next
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   942
        // index to advance from
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   943
        private static int advance(byte[] a, int i, int hi, IntConsumer action) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   944
            char c1 = getChar(a, i++);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   945
            int cp = c1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   946
            if (Character.isHighSurrogate(c1) && i < hi) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   947
                char c2 = getChar(a, i);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   948
                if (Character.isLowSurrogate(c2)) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   949
                    i++;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   950
                    cp = Character.toCodePoint(c1, c2);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   951
                }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   952
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   953
            action.accept(cp);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   954
            return i;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   955
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   956
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   957
        @Override
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   958
        public long estimateSize() { return (long)(fence - index); }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   959
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   960
        @Override
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   961
        public int characteristics() {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   962
            return cs;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   963
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   964
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   965
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   966
    ////////////////////////////////////////////////////////////////
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   967
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   968
    public static void putCharSB(byte[] val, int index, int c) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   969
        checkIndex(index, val.length >> 1);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   970
        putChar(val, index, c);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   971
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   972
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   973
    public static void putCharsSB(byte[] val, int index, char[] ca, int off, int end) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   974
        checkOffset(index + end - off, val.length >> 1);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   975
        putChars(val, index, ca, off, end);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   976
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   977
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   978
    public static void putCharsSB(byte[] val, int index, CharSequence s, int off, int end) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   979
        checkOffset(index + end - off, val.length >> 1);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   980
        for (int i = off; i < end; i++) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   981
            putChar(val, index++, s.charAt(i));
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   982
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   983
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   984
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   985
    public static int codePointAtSB(byte[] val, int index, int end) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   986
        checkOffset(end, val.length >> 1);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   987
        return codePointAt(val, index, end);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   988
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   989
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   990
    public static int codePointBeforeSB(byte[] val, int index) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   991
        checkOffset(index, val.length >> 1);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   992
        return codePointBefore(val, index);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   993
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   994
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   995
    public static int codePointCountSB(byte[] val, int beginIndex, int endIndex) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   996
        checkOffset(endIndex, val.length >> 1);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   997
        return codePointCount(val, beginIndex, endIndex);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   998
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   999
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
  1000
    ////////////////////////////////////////////////////////////////
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
  1001
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
  1002
    // Native query for the platform byte order.
    private static native boolean isBigEndian();

    // Bit shifts for the high and low byte of a char, fixed once at class
    // initialization from the platform byte order: (8, 0) when
    // isBigEndian() reports true, (0, 8) otherwise.
    static final int HI_BYTE_SHIFT;
    static final int LO_BYTE_SHIFT;
    static {
        final boolean bigEndian = isBigEndian();
        HI_BYTE_SHIFT = bigEndian ? 8 : 0;
        LO_BYTE_SHIFT = bigEndian ? 0 : 8;
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
  1015
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
  1016
    // Half of Integer.MAX_VALUE. Presumably the largest char count a byte[]
    // can hold at two bytes per char -- confirm against the users of this
    // constant.
    static final int MAX_LENGTH = Integer.MAX_VALUE >> 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
  1017
}