jdk/src/java.base/share/classes/java/lang/StringUTF16.java
author psandoz
Thu, 01 Dec 2016 17:52:59 -0800
changeset 42346 c0c6d5d20c35
parent 39157 bba1e4c5c547
child 44642 331e669007f7
permissions -rw-r--r--
8170155: StringBuffer and StringBuilder stream methods are not late-binding Reviewed-by: sherman
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
33663
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
     1
/*
39157
bba1e4c5c547 8160264: Reuse Latin1/UTF16 compare routines
igerasim
parents: 38790
diff changeset
     2
 * Copyright (c) 2015, 2016, Oracle and/or its affiliates. All rights reserved.
33663
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
     3
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
     4
 *
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
     5
 * This code is free software; you can redistribute it and/or modify it
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
     6
 * under the terms of the GNU General Public License version 2 only, as
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
     7
 * published by the Free Software Foundation.  Oracle designates this
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
     8
 * particular file as subject to the "Classpath" exception as provided
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
     9
 * by Oracle in the LICENSE file that accompanied this code.
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    10
 *
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    11
 * This code is distributed in the hope that it will be useful, but WITHOUT
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    12
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    13
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    14
 * version 2 for more details (a copy is included in the LICENSE file that
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    15
 * accompanied this code).
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    16
 *
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    17
 * You should have received a copy of the GNU General Public License version
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    18
 * 2 along with this work; if not, write to the Free Software Foundation,
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    19
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    20
 *
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    21
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    22
 * or visit www.oracle.com if you need additional information or have any
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    23
 * questions.
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    24
 */
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    25
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    26
package java.lang;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    27
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    28
import java.util.Arrays;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    29
import java.util.Locale;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    30
import java.util.Spliterator;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    31
import java.util.function.IntConsumer;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    32
import jdk.internal.HotSpotIntrinsicCandidate;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    33
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    34
import static java.lang.String.UTF16;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    35
import static java.lang.String.LATIN1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    36
import static java.lang.String.checkIndex;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    37
import static java.lang.String.checkOffset;
34517
c6e795a80c80 8142303: C2 compilation fails with "bad AD file"
thartmann
parents: 33663
diff changeset
    38
import static java.lang.String.checkBoundsOffCount;
33663
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    39
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    40
final class StringUTF16 {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    41
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    42
    public static byte[] newBytesFor(int len) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    43
        if (len < 0) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    44
            throw new NegativeArraySizeException();
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    45
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    46
        if (len > MAX_LENGTH) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    47
            throw new OutOfMemoryError("UTF16 String size is " + len +
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    48
                                       ", should be less than " + MAX_LENGTH);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    49
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    50
        return new byte[len << 1];
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    51
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    52
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    53
    @HotSpotIntrinsicCandidate
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    54
    public static void putChar(byte[] val, int index, int c) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    55
        index <<= 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    56
        val[index++] = (byte)(c >> HI_BYTE_SHIFT);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    57
        val[index]   = (byte)(c >> LO_BYTE_SHIFT);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    58
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    59
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    60
    @HotSpotIntrinsicCandidate
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    61
    public static char getChar(byte[] val, int index) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    62
        index <<= 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    63
        return (char)(((val[index++] & 0xff) << HI_BYTE_SHIFT) |
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    64
                      ((val[index]   & 0xff) << LO_BYTE_SHIFT));
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    65
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    66
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    67
    public static char charAt(byte[] value, int index) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    68
        if (index < 0 || index >= value.length >> 1) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    69
            throw new StringIndexOutOfBoundsException(index);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    70
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    71
        return getChar(value, index);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    72
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    73
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    74
    public static int length(byte[] value) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    75
        return value.length >> 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    76
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    77
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    78
    public static int codePointAt(byte[] value, int index, int end) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    79
        char c1 = getChar(value, index);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    80
        if (Character.isHighSurrogate(c1) && ++index < end) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    81
            char c2 = getChar(value, index);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    82
            if (Character.isLowSurrogate(c2)) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    83
               return Character.toCodePoint(c1, c2);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    84
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    85
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    86
        return c1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    87
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    88
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    89
    public static int codePointBefore(byte[] value, int index) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    90
        char c2 = getChar(value, --index);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    91
        if (Character.isLowSurrogate(c2) && index > 0) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    92
            char c1 = getChar(value, --index);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    93
            if (Character.isHighSurrogate(c1)) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    94
               return Character.toCodePoint(c1, c2);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    95
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    96
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    97
        return c2;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    98
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
    99
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   100
    public static int codePointCount(byte[] value, int beginIndex, int endIndex) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   101
        int count = endIndex - beginIndex;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   102
        for (int i = beginIndex; i < endIndex; ) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   103
            if (Character.isHighSurrogate(getChar(value, i++)) &&
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   104
                i < endIndex &&
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   105
                Character.isLowSurrogate(getChar(value, i))) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   106
                count--;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   107
                i++;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   108
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   109
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   110
        return count;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   111
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   112
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   113
    public static char[] toChars(byte[] value) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   114
        char[] dst = new char[value.length >> 1];
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   115
        getChars(value, 0, dst.length, dst, 0);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   116
        return dst;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   117
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   118
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   119
    @HotSpotIntrinsicCandidate
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   120
    public static byte[] toBytes(char[] value, int off, int len) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   121
        byte[] val = newBytesFor(len);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   122
        for (int i = 0; i < len; i++) {
34711
65544417508e 8145428: Optimize StringUTF16 compress/copy methods for C1
shade
parents: 34517
diff changeset
   123
            putChar(val, i, value[off]);
65544417508e 8145428: Optimize StringUTF16 compress/copy methods for C1
shade
parents: 34517
diff changeset
   124
            off++;
33663
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   125
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   126
        return val;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   127
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   128
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   129
    public static byte[] compress(char[] val, int off, int len) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   130
        byte[] ret = new byte[len];
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   131
        if (compress(val, off, ret, 0, len) == len) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   132
            return ret;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   133
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   134
        return null;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   135
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   136
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   137
    public static byte[] compress(byte[] val, int off, int len) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   138
        byte[] ret = new byte[len];
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   139
        if (compress(val, off, ret, 0, len) == len) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   140
            return ret;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   141
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   142
        return null;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   143
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   144
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   145
    // compressedCopy char[] -> byte[]
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   146
    @HotSpotIntrinsicCandidate
38790
b74a24c96491 8155608: String intrinsic range checks are not strict enough
thartmann
parents: 36411
diff changeset
   147
    public static int compress(char[] src, int srcOff, byte[] dst, int dstOff, int len) {
33663
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   148
        for (int i = 0; i < len; i++) {
34711
65544417508e 8145428: Optimize StringUTF16 compress/copy methods for C1
shade
parents: 34517
diff changeset
   149
            char c = src[srcOff];
65544417508e 8145428: Optimize StringUTF16 compress/copy methods for C1
shade
parents: 34517
diff changeset
   150
            if (c > 0xFF) {
65544417508e 8145428: Optimize StringUTF16 compress/copy methods for C1
shade
parents: 34517
diff changeset
   151
                len = 0;
65544417508e 8145428: Optimize StringUTF16 compress/copy methods for C1
shade
parents: 34517
diff changeset
   152
                break;
33663
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   153
            }
34711
65544417508e 8145428: Optimize StringUTF16 compress/copy methods for C1
shade
parents: 34517
diff changeset
   154
            dst[dstOff] = (byte)c;
65544417508e 8145428: Optimize StringUTF16 compress/copy methods for C1
shade
parents: 34517
diff changeset
   155
            srcOff++;
65544417508e 8145428: Optimize StringUTF16 compress/copy methods for C1
shade
parents: 34517
diff changeset
   156
            dstOff++;
33663
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   157
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   158
        return len;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   159
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   160
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   161
    // compressedCopy byte[] -> byte[]
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   162
    @HotSpotIntrinsicCandidate
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   163
    public static int compress(byte[] src, int srcOff, byte[] dst, int dstOff, int len) {
34517
c6e795a80c80 8142303: C2 compilation fails with "bad AD file"
thartmann
parents: 33663
diff changeset
   164
        // We need a range check here because 'getChar' has no checks
38790
b74a24c96491 8155608: String intrinsic range checks are not strict enough
thartmann
parents: 36411
diff changeset
   165
        checkBoundsOffCount(srcOff << 1, len << 1, src.length);
33663
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   166
        for (int i = 0; i < len; i++) {
34711
65544417508e 8145428: Optimize StringUTF16 compress/copy methods for C1
shade
parents: 34517
diff changeset
   167
            char c = getChar(src, srcOff);
65544417508e 8145428: Optimize StringUTF16 compress/copy methods for C1
shade
parents: 34517
diff changeset
   168
            if (c > 0xFF) {
65544417508e 8145428: Optimize StringUTF16 compress/copy methods for C1
shade
parents: 34517
diff changeset
   169
                len = 0;
65544417508e 8145428: Optimize StringUTF16 compress/copy methods for C1
shade
parents: 34517
diff changeset
   170
                break;
33663
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   171
            }
34711
65544417508e 8145428: Optimize StringUTF16 compress/copy methods for C1
shade
parents: 34517
diff changeset
   172
            dst[dstOff] = (byte)c;
65544417508e 8145428: Optimize StringUTF16 compress/copy methods for C1
shade
parents: 34517
diff changeset
   173
            srcOff++;
65544417508e 8145428: Optimize StringUTF16 compress/copy methods for C1
shade
parents: 34517
diff changeset
   174
            dstOff++;
33663
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   175
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   176
        return len;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   177
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   178
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   179
    public static byte[] toBytes(int[] val, int index, int len) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   180
        final int end = index + len;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   181
        // Pass 1: Compute precise size of char[]
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   182
        int n = len;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   183
        for (int i = index; i < end; i++) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   184
            int cp = val[i];
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   185
            if (Character.isBmpCodePoint(cp))
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   186
                continue;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   187
            else if (Character.isValidCodePoint(cp))
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   188
                n++;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   189
            else throw new IllegalArgumentException(Integer.toString(cp));
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   190
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   191
        // Pass 2: Allocate and fill in <high, low> pair
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   192
        byte[] buf = newBytesFor(n);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   193
        for (int i = index, j = 0; i < end; i++, j++) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   194
            int cp = val[i];
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   195
            if (Character.isBmpCodePoint(cp)) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   196
                putChar(buf, j, cp);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   197
            } else {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   198
                putChar(buf, j++, Character.highSurrogate(cp));
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   199
                putChar(buf, j, Character.lowSurrogate(cp));
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   200
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   201
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   202
        return buf;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   203
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   204
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   205
    public static byte[] toBytes(char c) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   206
        byte[] result = new byte[2];
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   207
        putChar(result, 0, c);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   208
        return result;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   209
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   210
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   211
    @HotSpotIntrinsicCandidate
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   212
    public static void getChars(byte[] value, int srcBegin, int srcEnd, char dst[], int dstBegin) {
34517
c6e795a80c80 8142303: C2 compilation fails with "bad AD file"
thartmann
parents: 33663
diff changeset
   213
        // We need a range check here because 'getChar' has no checks
38790
b74a24c96491 8155608: String intrinsic range checks are not strict enough
thartmann
parents: 36411
diff changeset
   214
        if (srcBegin < srcEnd) {
b74a24c96491 8155608: String intrinsic range checks are not strict enough
thartmann
parents: 36411
diff changeset
   215
            checkBoundsOffCount(srcBegin << 1, (srcEnd - srcBegin) << 1, value.length);
b74a24c96491 8155608: String intrinsic range checks are not strict enough
thartmann
parents: 36411
diff changeset
   216
        }
33663
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   217
        for (int i = srcBegin; i < srcEnd; i++) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   218
            dst[dstBegin++] = getChar(value, i);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   219
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   220
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   221
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   222
    /* @see java.lang.String.getBytes(int, int, byte[], int) */
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   223
    public static void getBytes(byte[] value, int srcBegin, int srcEnd, byte dst[], int dstBegin) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   224
        srcBegin <<= 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   225
        srcEnd <<= 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   226
        for (int i = srcBegin + (1 >> LO_BYTE_SHIFT); i < srcEnd; i += 2) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   227
            dst[dstBegin++] = value[i];
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   228
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   229
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   230
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   231
    @HotSpotIntrinsicCandidate
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   232
    public static boolean equals(byte[] value, byte[] other) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   233
        if (value.length == other.length) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   234
            int len = value.length >> 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   235
            for (int i = 0; i < len; i++) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   236
                if (getChar(value, i) != getChar(other, i)) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   237
                    return false;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   238
                }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   239
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   240
            return true;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   241
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   242
        return false;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   243
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   244
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   245
    @HotSpotIntrinsicCandidate
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   246
    public static int compareTo(byte[] value, byte[] other) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   247
        int len1 = length(value);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   248
        int len2 = length(other);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   249
        int lim = Math.min(len1, len2);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   250
        for (int k = 0; k < lim; k++) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   251
            char c1 = getChar(value, k);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   252
            char c2 = getChar(other, k);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   253
            if (c1 != c2) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   254
                return c1 - c2;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   255
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   256
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   257
        return len1 - len2;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   258
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   259
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   260
    @HotSpotIntrinsicCandidate
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   261
    public static int compareToLatin1(byte[] value, byte[] other) {
39157
bba1e4c5c547 8160264: Reuse Latin1/UTF16 compare routines
igerasim
parents: 38790
diff changeset
   262
        return -StringLatin1.compareToUTF16(other, value);
33663
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   263
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   264
36411
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   265
    public static int compareToCI(byte[] value, byte[] other) {
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   266
        int len1 = length(value);
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   267
        int len2 = length(other);
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   268
        int lim = Math.min(len1, len2);
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   269
        for (int k = 0; k < lim; k++) {
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   270
            char c1 = getChar(value, k);
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   271
            char c2 = getChar(other, k);
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   272
            if (c1 != c2) {
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   273
                c1 = Character.toUpperCase(c1);
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   274
                c2 = Character.toUpperCase(c2);
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   275
                if (c1 != c2) {
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   276
                    c1 = Character.toLowerCase(c1);
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   277
                    c2 = Character.toLowerCase(c2);
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   278
                    if (c1 != c2) {
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   279
                        return c1 - c2;
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   280
                    }
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   281
                }
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   282
            }
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   283
        }
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   284
        return len1 - len2;
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   285
    }
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   286
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   287
    public static int compareToCI_Latin1(byte[] value, byte[] other) {
39157
bba1e4c5c547 8160264: Reuse Latin1/UTF16 compare routines
igerasim
parents: 38790
diff changeset
   288
        return -StringLatin1.compareToCI_UTF16(other, value);
36411
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   289
    }
f0cd8358b5ea 8151384: Improve String.CASE_INSENSITIVE_ORDER and remove sun.misc.ASCIICaseInsensitiveComparator
chegar
parents: 34711
diff changeset
   290
33663
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   291
    public static int hashCode(byte[] value) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   292
        int h = 0;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   293
        int length = value.length >> 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   294
        for (int i = 0; i < length; i++) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   295
            h = 31 * h + getChar(value, i);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   296
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   297
        return h;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   298
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   299
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   300
    public static int indexOf(byte[] value, int ch, int fromIndex) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   301
        int max = value.length >> 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   302
        if (fromIndex < 0) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   303
            fromIndex = 0;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   304
        } else if (fromIndex >= max) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   305
            // Note: fromIndex might be near -1>>>1.
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   306
            return -1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   307
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   308
        if (ch < Character.MIN_SUPPLEMENTARY_CODE_POINT) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   309
            // handle most cases here (ch is a BMP code point or a
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   310
            // negative value (invalid code point))
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   311
            return indexOfChar(value, ch, fromIndex, max);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   312
        } else {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   313
            return indexOfSupplementary(value, ch, fromIndex, max);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   314
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   315
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   316
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   317
    @HotSpotIntrinsicCandidate
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   318
    public static int indexOf(byte[] value, byte[] str) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   319
        if (str.length == 0) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   320
            return 0;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   321
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   322
        if (value.length == 0) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   323
            return -1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   324
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   325
        return indexOf(value, length(value), str, length(str), 0);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   326
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   327
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   328
    @HotSpotIntrinsicCandidate
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   329
    public static int indexOf(byte[] value, int valueCount, byte[] str, int strCount, int fromIndex) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   330
        char first = getChar(str, 0);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   331
        int max = (valueCount - strCount);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   332
        for (int i = fromIndex; i <= max; i++) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   333
            // Look for first character.
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   334
            if (getChar(value, i) != first) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   335
                while (++i <= max && getChar(value, i) != first);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   336
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   337
            // Found first character, now look at the rest of value
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   338
            if (i <= max) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   339
                int j = i + 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   340
                int end = j + strCount - 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   341
                for (int k = 1; j < end && getChar(value, j) == getChar(str, k); j++, k++);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   342
                if (j == end) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   343
                    // Found whole string.
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   344
                    return i;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   345
                }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   346
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   347
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   348
        return -1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   349
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   350
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   351
    /**
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   352
     * Handles indexOf Latin1 substring in UTF16 string.
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   353
     */
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   354
    @HotSpotIntrinsicCandidate
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   355
    public static int indexOfLatin1(byte[] value, byte[] str) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   356
        if (str.length == 0) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   357
            return 0;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   358
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   359
        if (value.length == 0) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   360
            return -1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   361
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   362
        return indexOfLatin1(value, length(value), str, str.length, 0);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   363
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   364
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   365
    @HotSpotIntrinsicCandidate
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   366
    public static int indexOfLatin1(byte[] src, int srcCount, byte[] tgt, int tgtCount, int fromIndex) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   367
        char first = (char)(tgt[0] & 0xff);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   368
        int max = (srcCount - tgtCount);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   369
        for (int i = fromIndex; i <= max; i++) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   370
            // Look for first character.
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   371
            if (getChar(src, i) != first) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   372
                while (++i <= max && getChar(src, i) != first);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   373
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   374
            // Found first character, now look at the rest of v2
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   375
            if (i <= max) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   376
                int j = i + 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   377
                int end = j + tgtCount - 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   378
                for (int k = 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   379
                     j < end && getChar(src, j) == (tgt[k] & 0xff);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   380
                     j++, k++);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   381
                if (j == end) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   382
                    // Found whole string.
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   383
                    return i;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   384
                }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   385
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   386
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   387
        return -1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   388
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   389
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   390
    @HotSpotIntrinsicCandidate
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   391
    private static int indexOfChar(byte[] value, int ch, int fromIndex, int max) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   392
        for (int i = fromIndex; i < max; i++) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   393
            if (getChar(value, i) == ch) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   394
                return i;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   395
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   396
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   397
        return -1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   398
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   399
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   400
    /**
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   401
     * Handles (rare) calls of indexOf with a supplementary character.
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   402
     */
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   403
    private static int indexOfSupplementary(byte[] value, int ch, int fromIndex, int max) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   404
        if (Character.isValidCodePoint(ch)) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   405
            final char hi = Character.highSurrogate(ch);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   406
            final char lo = Character.lowSurrogate(ch);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   407
            for (int i = fromIndex; i < max - 1; i++) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   408
                if (getChar(value, i) == hi && getChar(value, i + 1 ) == lo) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   409
                    return i;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   410
                }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   411
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   412
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   413
        return -1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   414
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   415
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   416
    public static int lastIndexOf(byte[] src, int srcCount,
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   417
                                  byte[] tgt, int tgtCount, int fromIndex) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   418
        int min = tgtCount - 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   419
        int i = min + fromIndex;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   420
        int strLastIndex = tgtCount - 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   421
        char strLastChar = getChar(tgt, strLastIndex);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   422
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   423
    startSearchForLastChar:
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   424
        while (true) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   425
            while (i >= min && getChar(src, i) != strLastChar) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   426
                i--;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   427
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   428
            if (i < min) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   429
                return -1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   430
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   431
            int j = i - 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   432
            int start = j - strLastIndex;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   433
            int k = strLastIndex - 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   434
            while (j > start) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   435
                if (getChar(src, j--) != getChar(tgt, k--)) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   436
                    i--;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   437
                    continue startSearchForLastChar;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   438
                }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   439
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   440
            return start + 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   441
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   442
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   443
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   444
    public static int lastIndexOf(byte[] value, int ch, int fromIndex) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   445
        if (ch < Character.MIN_SUPPLEMENTARY_CODE_POINT) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   446
            // handle most cases here (ch is a BMP code point or a
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   447
            // negative value (invalid code point))
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   448
            int i = Math.min(fromIndex, (value.length >> 1) - 1);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   449
            for (; i >= 0; i--) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   450
                if (getChar(value, i) == ch) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   451
                    return i;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   452
                }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   453
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   454
            return -1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   455
        } else {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   456
            return lastIndexOfSupplementary(value, ch, fromIndex);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   457
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   458
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   459
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   460
    /**
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   461
     * Handles (rare) calls of lastIndexOf with a supplementary character.
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   462
     */
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   463
    private static int lastIndexOfSupplementary(final byte[] value, int ch, int fromIndex) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   464
        if (Character.isValidCodePoint(ch)) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   465
            char hi = Character.highSurrogate(ch);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   466
            char lo = Character.lowSurrogate(ch);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   467
            int i = Math.min(fromIndex, (value.length >> 1) - 2);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   468
            for (; i >= 0; i--) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   469
                if (getChar(value, i) == hi && getChar(value, i + 1) == lo) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   470
                    return i;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   471
                }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   472
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   473
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   474
        return -1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   475
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   476
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   477
    public static String replace(byte[] value, char oldChar, char newChar) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   478
        int len = value.length >> 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   479
        int i = -1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   480
        while (++i < len) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   481
            if (getChar(value, i) == oldChar) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   482
                break;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   483
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   484
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   485
        if (i < len) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   486
            byte buf[] = new byte[value.length];
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   487
            for (int j = 0; j < i; j++) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   488
                putChar(buf, j, getChar(value, j)); // TBD:arraycopy?
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   489
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   490
            while (i < len) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   491
                char c = getChar(value, i);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   492
                putChar(buf, i, c == oldChar ? newChar : c);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   493
                i++;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   494
           }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   495
           // Check if we should try to compress to latin1
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   496
           if (String.COMPACT_STRINGS &&
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   497
               !StringLatin1.canEncode(oldChar) &&
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   498
               StringLatin1.canEncode(newChar)) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   499
               byte[] val = compress(buf, 0, len);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   500
               if (val != null) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   501
                   return new String(val, LATIN1);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   502
               }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   503
           }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   504
           return new String(buf, UTF16);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   505
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   506
        return null;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   507
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   508
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   509
    public static boolean regionMatchesCI(byte[] value, int toffset,
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   510
                                          byte[] other, int ooffset, int len) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   511
        int last = toffset + len;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   512
        while (toffset < last) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   513
            char c1 = getChar(value, toffset++);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   514
            char c2 = getChar(other, ooffset++);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   515
            if (c1 == c2) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   516
                continue;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   517
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   518
            // try converting both characters to uppercase.
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   519
            // If the results match, then the comparison scan should
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   520
            // continue.
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   521
            char u1 = Character.toUpperCase(c1);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   522
            char u2 = Character.toUpperCase(c2);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   523
            if (u1 == u2) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   524
                continue;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   525
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   526
            // Unfortunately, conversion to uppercase does not work properly
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   527
            // for the Georgian alphabet, which has strange rules about case
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   528
            // conversion.  So we need to make one last check before
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   529
            // exiting.
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   530
            if (Character.toLowerCase(u1) == Character.toLowerCase(u2)) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   531
                continue;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   532
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   533
            return false;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   534
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   535
        return true;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   536
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   537
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   538
    public static boolean regionMatchesCI_Latin1(byte[] value, int toffset,
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   539
                                                 byte[] other, int ooffset,
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   540
                                                 int len) {
39157
bba1e4c5c547 8160264: Reuse Latin1/UTF16 compare routines
igerasim
parents: 38790
diff changeset
   541
        return StringLatin1.regionMatchesCI_UTF16(other, ooffset, value, toffset, len);
33663
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   542
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   543
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   544
    public static String toLowerCase(String str, byte[] value, Locale locale) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   545
        if (locale == null) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   546
            throw new NullPointerException();
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   547
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   548
        int first;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   549
        boolean hasSurr = false;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   550
        final int len = value.length >> 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   551
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   552
        // Now check if there are any characters that need to be changed, or are surrogate
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   553
        for (first = 0 ; first < len; first++) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   554
            int cp = (int)getChar(value, first);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   555
            if (Character.isSurrogate((char)cp)) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   556
                hasSurr = true;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   557
                break;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   558
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   559
            if (cp != Character.toLowerCase(cp)) {  // no need to check Character.ERROR
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   560
                break;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   561
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   562
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   563
        if (first == len)
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   564
            return str;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   565
        byte[] result = new byte[value.length];
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   566
        System.arraycopy(value, 0, result, 0, first << 1);  // Just copy the first few
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   567
                                                            // lowerCase characters.
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   568
        String lang = locale.getLanguage();
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   569
        if (lang == "tr" || lang == "az" || lang == "lt") {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   570
            return toLowerCaseEx(str, value, result, first, locale, true);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   571
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   572
        if (hasSurr) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   573
            return toLowerCaseEx(str, value, result, first, locale, false);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   574
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   575
        int bits = 0;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   576
        for (int i = first; i < len; i++) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   577
            int cp = (int)getChar(value, i);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   578
            if (cp == '\u03A3' ||                       // GREEK CAPITAL LETTER SIGMA
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   579
                Character.isSurrogate((char)cp)) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   580
                return toLowerCaseEx(str, value, result, i, locale, false);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   581
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   582
            if (cp == '\u0130') {                       // LATIN CAPITAL LETTER I WITH DOT ABOVE
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   583
                return toLowerCaseEx(str, value, result, i, locale, true);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   584
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   585
            cp = Character.toLowerCase(cp);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   586
            if (!Character.isBmpCodePoint(cp)) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   587
                return toLowerCaseEx(str, value, result, i, locale, false);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   588
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   589
            bits |= cp;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   590
            putChar(result, i, cp);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   591
        }
34711
65544417508e 8145428: Optimize StringUTF16 compress/copy methods for C1
shade
parents: 34517
diff changeset
   592
        if (bits > 0xFF) {
33663
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   593
            return new String(result, UTF16);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   594
        } else {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   595
            return newString(result, 0, len);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   596
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   597
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   598
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   599
    private static String toLowerCaseEx(String str, byte[] value,
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   600
                                        byte[] result, int first, Locale locale,
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   601
                                        boolean localeDependent) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   602
        int resultOffset = first;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   603
        int length = value.length >> 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   604
        int srcCount;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   605
        for (int i = first; i < length; i += srcCount) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   606
            int srcChar = getChar(value, i);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   607
            int lowerChar;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   608
            char[] lowerCharArray;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   609
            srcCount = 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   610
            if (Character.isSurrogate((char)srcChar)) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   611
                srcChar = codePointAt(value, i, length);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   612
                srcCount = Character.charCount(srcChar);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   613
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   614
            if (localeDependent ||
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   615
                srcChar == '\u03A3' ||  // GREEK CAPITAL LETTER SIGMA
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   616
                srcChar == '\u0130') {  // LATIN CAPITAL LETTER I WITH DOT ABOVE
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   617
                lowerChar = ConditionalSpecialCasing.toLowerCaseEx(str, i, locale);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   618
            } else {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   619
                lowerChar = Character.toLowerCase(srcChar);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   620
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   621
            if (Character.isBmpCodePoint(lowerChar)) {    // Character.ERROR is not a bmp
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   622
                putChar(result, resultOffset++, lowerChar);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   623
            } else {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   624
                if (lowerChar == Character.ERROR) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   625
                    lowerCharArray = ConditionalSpecialCasing.toLowerCaseCharArray(str, i, locale);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   626
                } else {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   627
                    lowerCharArray = Character.toChars(lowerChar);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   628
                }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   629
                /* Grow result if needed */
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   630
                int mapLen = lowerCharArray.length;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   631
                if (mapLen > srcCount) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   632
                    byte[] result2 = newBytesFor((result.length >> 1) + mapLen - srcCount);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   633
                    System.arraycopy(result, 0, result2, 0, resultOffset << 1);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   634
                    result = result2;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   635
                }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   636
                for (int x = 0; x < mapLen; ++x) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   637
                    putChar(result, resultOffset++, lowerCharArray[x]);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   638
                }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   639
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   640
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   641
        return newString(result, 0, resultOffset);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   642
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   643
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   644
    public static String toUpperCase(String str, byte[] value, Locale locale) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   645
        if (locale == null) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   646
            throw new NullPointerException();
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   647
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   648
        int first;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   649
        boolean hasSurr = false;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   650
        final int len = value.length >> 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   651
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   652
        // Now check if there are any characters that need to be changed, or are surrogate
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   653
        for (first = 0 ; first < len; first++) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   654
            int cp = (int)getChar(value, first);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   655
            if (Character.isSurrogate((char)cp)) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   656
                hasSurr = true;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   657
                break;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   658
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   659
            if (cp != Character.toUpperCaseEx(cp)) {   // no need to check Character.ERROR
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   660
                break;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   661
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   662
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   663
        if (first == len) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   664
            return str;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   665
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   666
        byte[] result = new byte[value.length];
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   667
        System.arraycopy(value, 0, result, 0, first << 1); // Just copy the first few
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   668
                                                           // upperCase characters.
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   669
        String lang = locale.getLanguage();
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   670
        if (lang == "tr" || lang == "az" || lang == "lt") {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   671
            return toUpperCaseEx(str, value, result, first, locale, true);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   672
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   673
        if (hasSurr) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   674
            return toUpperCaseEx(str, value, result, first, locale, false);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   675
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   676
        int bits = 0;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   677
        for (int i = first; i < len; i++) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   678
            int cp = (int)getChar(value, i);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   679
            if (Character.isSurrogate((char)cp)) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   680
                return toUpperCaseEx(str, value, result, i, locale, false);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   681
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   682
            cp = Character.toUpperCaseEx(cp);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   683
            if (!Character.isBmpCodePoint(cp)) {    // Character.ERROR is not bmp
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   684
                return toUpperCaseEx(str, value, result, i, locale, false);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   685
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   686
            bits |= cp;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   687
            putChar(result, i, cp);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   688
        }
34711
65544417508e 8145428: Optimize StringUTF16 compress/copy methods for C1
shade
parents: 34517
diff changeset
   689
        if (bits > 0xFF) {
33663
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   690
            return new String(result, UTF16);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   691
        } else {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   692
            return newString(result, 0, len);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   693
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   694
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   695
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   696
    private static String toUpperCaseEx(String str, byte[] value,
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   697
                                        byte[] result, int first,
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   698
                                        Locale locale, boolean localeDependent)
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   699
    {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   700
        int resultOffset = first;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   701
        int length = value.length >> 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   702
        int srcCount;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   703
        for (int i = first; i < length; i += srcCount) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   704
            int srcChar = getChar(value, i);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   705
            int upperChar;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   706
            char[] upperCharArray;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   707
            srcCount = 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   708
            if (Character.isSurrogate((char)srcChar)) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   709
                srcChar = codePointAt(value, i, length);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   710
                srcCount = Character.charCount(srcChar);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   711
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   712
            if (localeDependent) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   713
                upperChar = ConditionalSpecialCasing.toUpperCaseEx(str, i, locale);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   714
            } else {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   715
                upperChar = Character.toUpperCaseEx(srcChar);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   716
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   717
            if (Character.isBmpCodePoint(upperChar)) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   718
                putChar(result, resultOffset++, upperChar);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   719
            } else {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   720
                if (upperChar == Character.ERROR) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   721
                    if (localeDependent) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   722
                        upperCharArray =
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   723
                            ConditionalSpecialCasing.toUpperCaseCharArray(str, i, locale);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   724
                    } else {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   725
                        upperCharArray = Character.toUpperCaseCharArray(srcChar);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   726
                    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   727
                } else {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   728
                    upperCharArray = Character.toChars(upperChar);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   729
                }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   730
                /* Grow result if needed */
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   731
                int mapLen = upperCharArray.length;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   732
                if (mapLen > srcCount) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   733
                    byte[] result2 = newBytesFor((result.length >> 1) + mapLen - srcCount);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   734
                    System.arraycopy(result, 0, result2, 0, resultOffset << 1);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   735
                    result = result2;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   736
                 }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   737
                 for (int x = 0; x < mapLen; ++x) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   738
                    putChar(result, resultOffset++, upperCharArray[x]);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   739
                 }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   740
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   741
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   742
        return newString(result, 0, resultOffset);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   743
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   744
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   745
    public static String trim(byte[] value) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   746
        int length = value.length >> 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   747
        int len = length;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   748
        int st = 0;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   749
        while (st < len && getChar(value, st) <= ' ') {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   750
            st++;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   751
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   752
        while (st < len && getChar(value, len - 1) <= ' ') {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   753
            len--;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   754
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   755
        return ((st > 0) || (len < length )) ?
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   756
            new String(Arrays.copyOfRange(value, st << 1, len << 1), UTF16) :
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   757
            null;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   758
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   759
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   760
    public static void putChars(byte[] val, int index, char[] str, int off, int end) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   761
        while (off < end) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   762
            putChar(val, index++, str[off++]);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   763
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   764
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   765
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   766
    public static String newString(byte[] val, int index, int len) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   767
        if (String.COMPACT_STRINGS) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   768
            byte[] buf = compress(val, index, len);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   769
            if (buf != null) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   770
                return new String(buf, LATIN1);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   771
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   772
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   773
        int last = index + len;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   774
        return new String(Arrays.copyOfRange(val, index << 1, last << 1), UTF16);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   775
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   776
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   777
    public static void fillNull(byte[] val, int index, int end) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   778
        Arrays.fill(val, index << 1, end << 1, (byte)0);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   779
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   780
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   781
    static class CharsSpliterator implements Spliterator.OfInt {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   782
        private final byte[] array;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   783
        private int index;        // current index, modified on advance/split
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   784
        private final int fence;  // one past last index
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   785
        private final int cs;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   786
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   787
        CharsSpliterator(byte[] array, int acs) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   788
            this(array, 0, array.length >> 1, acs);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   789
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   790
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   791
        CharsSpliterator(byte[] array, int origin, int fence, int acs) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   792
            this.array = array;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   793
            this.index = origin;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   794
            this.fence = fence;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   795
            this.cs = acs | Spliterator.ORDERED | Spliterator.SIZED
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   796
                      | Spliterator.SUBSIZED;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   797
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   798
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   799
        @Override
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   800
        public OfInt trySplit() {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   801
            int lo = index, mid = (lo + fence) >>> 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   802
            return (lo >= mid)
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   803
                   ? null
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   804
                   : new CharsSpliterator(array, lo, index = mid, cs);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   805
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   806
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   807
        @Override
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   808
        public void forEachRemaining(IntConsumer action) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   809
            byte[] a; int i, hi; // hoist accesses and checks from loop
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   810
            if (action == null)
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   811
                throw new NullPointerException();
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   812
            if (((a = array).length >> 1) >= (hi = fence) &&
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   813
                (i = index) >= 0 && i < (index = hi)) {
42346
c0c6d5d20c35 8170155: StringBuffer and StringBuilder stream methods are not late-binding
psandoz
parents: 39157
diff changeset
   814
                do {
c0c6d5d20c35 8170155: StringBuffer and StringBuilder stream methods are not late-binding
psandoz
parents: 39157
diff changeset
   815
                    action.accept(charAt(a, i));
c0c6d5d20c35 8170155: StringBuffer and StringBuilder stream methods are not late-binding
psandoz
parents: 39157
diff changeset
   816
                } while (++i < hi);
33663
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   817
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   818
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   819
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   820
        @Override
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   821
        public boolean tryAdvance(IntConsumer action) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   822
            if (action == null)
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   823
                throw new NullPointerException();
42346
c0c6d5d20c35 8170155: StringBuffer and StringBuilder stream methods are not late-binding
psandoz
parents: 39157
diff changeset
   824
            int i = index;
c0c6d5d20c35 8170155: StringBuffer and StringBuilder stream methods are not late-binding
psandoz
parents: 39157
diff changeset
   825
            if (i >= 0 && i < fence) {
c0c6d5d20c35 8170155: StringBuffer and StringBuilder stream methods are not late-binding
psandoz
parents: 39157
diff changeset
   826
                action.accept(charAt(array, i));
c0c6d5d20c35 8170155: StringBuffer and StringBuilder stream methods are not late-binding
psandoz
parents: 39157
diff changeset
   827
                index++;
33663
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   828
                return true;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   829
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   830
            return false;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   831
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   832
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   833
        @Override
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   834
        public long estimateSize() { return (long)(fence - index); }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   835
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   836
        @Override
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   837
        public int characteristics() {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   838
            return cs;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   839
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   840
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   841
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   842
    static class CodePointsSpliterator implements Spliterator.OfInt {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   843
        private final byte[] array;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   844
        private int index;        // current index, modified on advance/split
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   845
        private final int fence;  // one past last index
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   846
        private final int cs;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   847
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   848
        CodePointsSpliterator(byte[] array, int acs) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   849
            this(array, 0, array.length >> 1, acs);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   850
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   851
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   852
        CodePointsSpliterator(byte[] array, int origin, int fence, int acs) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   853
            this.array = array;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   854
            this.index = origin;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   855
            this.fence = fence;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   856
            this.cs = acs | Spliterator.ORDERED;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   857
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   858
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   859
        @Override
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   860
        public OfInt trySplit() {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   861
            int lo = index, mid = (lo + fence) >>> 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   862
            if (lo >= mid)
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   863
                return null;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   864
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   865
            int midOneLess;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   866
            // If the mid-point intersects a surrogate pair
42346
c0c6d5d20c35 8170155: StringBuffer and StringBuilder stream methods are not late-binding
psandoz
parents: 39157
diff changeset
   867
            if (Character.isLowSurrogate(charAt(array, mid)) &&
c0c6d5d20c35 8170155: StringBuffer and StringBuilder stream methods are not late-binding
psandoz
parents: 39157
diff changeset
   868
                Character.isHighSurrogate(charAt(array, midOneLess = (mid -1)))) {
33663
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   869
                // If there is only one pair it cannot be split
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   870
                if (lo >= midOneLess)
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   871
                    return null;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   872
                // Shift the mid-point to align with the surrogate pair
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   873
                return new CodePointsSpliterator(array, lo, index = midOneLess, cs);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   874
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   875
            return new CodePointsSpliterator(array, lo, index = mid, cs);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   876
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   877
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   878
        @Override
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   879
        public void forEachRemaining(IntConsumer action) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   880
            byte[] a; int i, hi; // hoist accesses and checks from loop
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   881
            if (action == null)
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   882
                throw new NullPointerException();
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   883
            if (((a = array).length >> 1) >= (hi = fence) &&
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   884
                (i = index) >= 0 && i < (index = hi)) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   885
                do {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   886
                    i = advance(a, i, hi, action);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   887
                } while (i < hi);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   888
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   889
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   890
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   891
        @Override
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   892
        public boolean tryAdvance(IntConsumer action) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   893
            if (action == null)
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   894
                throw new NullPointerException();
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   895
            if (index >= 0 && index < fence) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   896
                index = advance(array, index, fence, action);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   897
                return true;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   898
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   899
            return false;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   900
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   901
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   902
        // Advance one code point from the index, i, and return the next
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   903
        // index to advance from
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   904
        private static int advance(byte[] a, int i, int hi, IntConsumer action) {
42346
c0c6d5d20c35 8170155: StringBuffer and StringBuilder stream methods are not late-binding
psandoz
parents: 39157
diff changeset
   905
            char c1 = charAt(a, i++);
33663
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   906
            int cp = c1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   907
            if (Character.isHighSurrogate(c1) && i < hi) {
42346
c0c6d5d20c35 8170155: StringBuffer and StringBuilder stream methods are not late-binding
psandoz
parents: 39157
diff changeset
   908
                char c2 = charAt(a, i);
33663
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   909
                if (Character.isLowSurrogate(c2)) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   910
                    i++;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   911
                    cp = Character.toCodePoint(c1, c2);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   912
                }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   913
            }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   914
            action.accept(cp);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   915
            return i;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   916
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   917
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   918
        @Override
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   919
        public long estimateSize() { return (long)(fence - index); }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   920
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   921
        @Override
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   922
        public int characteristics() {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   923
            return cs;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   924
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   925
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   926
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   927
    ////////////////////////////////////////////////////////////////
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   928
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   929
    public static void putCharSB(byte[] val, int index, int c) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   930
        checkIndex(index, val.length >> 1);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   931
        putChar(val, index, c);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   932
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   933
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   934
    public static void putCharsSB(byte[] val, int index, char[] ca, int off, int end) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   935
        checkOffset(index + end - off, val.length >> 1);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   936
        putChars(val, index, ca, off, end);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   937
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   938
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   939
    public static void putCharsSB(byte[] val, int index, CharSequence s, int off, int end) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   940
        checkOffset(index + end - off, val.length >> 1);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   941
        for (int i = off; i < end; i++) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   942
            putChar(val, index++, s.charAt(i));
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   943
        }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   944
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   945
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   946
    public static int codePointAtSB(byte[] val, int index, int end) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   947
        checkOffset(end, val.length >> 1);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   948
        return codePointAt(val, index, end);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   949
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   950
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   951
    public static int codePointBeforeSB(byte[] val, int index) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   952
        checkOffset(index, val.length >> 1);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   953
        return codePointBefore(val, index);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   954
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   955
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   956
    public static int codePointCountSB(byte[] val, int beginIndex, int endIndex) {
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   957
        checkOffset(endIndex, val.length >> 1);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   958
        return codePointCount(val, beginIndex, endIndex);
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   959
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   960
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   961
    ////////////////////////////////////////////////////////////////
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   962
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   963
    // Implemented natively; reports whether the platform is big-endian.
    private static native boolean isBigEndian();

    // Shift amounts selected once, at class initialization, from the
    // platform byte order: (8, 0) on big-endian, (0, 8) otherwise.
    static final int HI_BYTE_SHIFT;
    static final int LO_BYTE_SHIFT;
    static {
        final boolean bigEndian = isBigEndian();
        HI_BYTE_SHIFT = bigEndian ? 8 : 0;
        LO_BYTE_SHIFT = bigEndian ? 0 : 8;
    }
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   976
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   977
    // Half of Integer.MAX_VALUE.
    // NOTE(review): presumably the largest char count representable here,
    // since each char takes two bytes of the backing byte[] — confirm
    // against the callers that consult this limit.
    static final int MAX_LENGTH = Integer.MAX_VALUE >> 1;
2cd62a4bd471 8141132: JEP 254: Compact Strings
thartmann
parents:
diff changeset
   978
}