langtools/src/jdk.compiler/share/classes/com/sun/tools/javac/parser/UnicodeReader.java
author jlahoda
Thu, 15 Jun 2017 13:44:42 +0200
changeset 45504 ea7475564d07
parent 25874 83c19f00452c
permissions -rw-r--r--
8170326: Inconsistencies between code, compiler.properties and comments Summary: Converting uses of Log and JCDiagnostic.Factory methods to use CompilerProperties instead of plain Strings, fixing inconsistencies, adding crules analyzer to ensure CompilerProperties are used whenever possible. Reviewed-by: mcimadamore
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
10815
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
     1
/*
15385
ee1eebe7e210 8006775: JSR 308: Compiler changes in JDK8
jjg
parents: 14259
diff changeset
     2
 * Copyright (c) 2011, 2013, Oracle and/or its affiliates. All rights reserved.
10815
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
     3
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
     4
 *
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
     5
 * This code is free software; you can redistribute it and/or modify it
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
     6
 * under the terms of the GNU General Public License version 2 only, as
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
     7
 * published by the Free Software Foundation.  Oracle designates this
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
     8
 * particular file as subject to the "Classpath" exception as provided
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
     9
 * by Oracle in the LICENSE file that accompanied this code.
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    10
 *
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    11
 * This code is distributed in the hope that it will be useful, but WITHOUT
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    12
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    13
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    14
 * version 2 for more details (a copy is included in the LICENSE file that
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    15
 * accompanied this code).
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    16
 *
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    17
 * You should have received a copy of the GNU General Public License version
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    18
 * 2 along with this work; if not, write to the Free Software Foundation,
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    19
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    20
 *
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    21
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    22
 * or visit www.oracle.com if you need additional information or have any
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    23
 * questions.
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    24
 */
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    25
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    26
package com.sun.tools.javac.parser;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    27
14049
3207422a0f9b 7193657: provide internal ArrayUtils class to simplify common usage of arrays in javac
jjg
parents: 10948
diff changeset
    28
import java.nio.CharBuffer;
3207422a0f9b 7193657: provide internal ArrayUtils class to simplify common usage of arrays in javac
jjg
parents: 10948
diff changeset
    29
import java.util.Arrays;
3207422a0f9b 7193657: provide internal ArrayUtils class to simplify common usage of arrays in javac
jjg
parents: 10948
diff changeset
    30
10815
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    31
import com.sun.tools.javac.file.JavacFileManager;
45504
ea7475564d07 8170326: Inconsistencies between code, compiler.properties and comments
jlahoda
parents: 25874
diff changeset
    32
import com.sun.tools.javac.resources.CompilerProperties.Errors;
14049
3207422a0f9b 7193657: provide internal ArrayUtils class to simplify common usage of arrays in javac
jjg
parents: 10948
diff changeset
    33
import com.sun.tools.javac.util.ArrayUtils;
10948
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
    34
import com.sun.tools.javac.util.Log;
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
    35
import com.sun.tools.javac.util.Name;
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
    36
import com.sun.tools.javac.util.Names;
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
    37
10815
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    38
import static com.sun.tools.javac.util.LayoutCharacters.*;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    39
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    40
/** The char reader used by the javac lexer/tokenizer. Returns the sequence of
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    41
 * characters contained in the input stream, handling unicode escape accordingly.
15385
ee1eebe7e210 8006775: JSR 308: Compiler changes in JDK8
jjg
parents: 14259
diff changeset
    42
 * Additionally, it provides features for saving chars into a buffer and to retrieve
10815
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    43
 * them at a later stage.
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    44
 *
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    45
 *  <p><b>This is NOT part of any supported API.
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    46
 *  If you write code that depends on this, you do so at your own risk.
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    47
 *  This code and its internal interfaces are subject to change or
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    48
 *  deletion without notice.</b>
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    49
 */
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    50
public class UnicodeReader {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    51
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    52
    /** The input buffer, index of next character to be read,
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    53
     *  index of one past last character in buffer.
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    54
     */
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    55
    protected char[] buf;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    56
    protected int bp;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    57
    protected final int buflen;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    58
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    59
    /** The current character.
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    60
     */
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    61
    protected char ch;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    62
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    63
    /** The buffer index of the last converted unicode character
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    64
     */
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    65
    protected int unicodeConversionBp = -1;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    66
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    67
    protected Log log;
10948
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
    68
    protected Names names;
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
    69
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
    70
    /** A character buffer for saved chars.
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
    71
     */
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
    72
    protected char[] sbuf = new char[128];
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
    73
    protected int sp;
10815
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    74
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    75
    /**
     * Create a reader over the contents of a character buffer.  The
     * buffer is turned into an array with
     * {@code JavacFileManager.toArray(buffer)} and {@code buffer.limit()}
     * is used as the input length.
     *
     * @param sf the factory which created this Scanner
     * @param buffer the input, might be modified
     */
    protected UnicodeReader(ScannerFactory sf, CharBuffer buffer) {
        this(sf, JavacFileManager.toArray(buffer), buffer.limit());
    }

    /**
     * Create a reader from the input array.  This constructor might
     * modify the array.  To avoid copying the input array, ensure
     * that {@code inputLength < input.length} or
     * {@code input[input.length - 1]} is a white space character.
     *
     * @param sf the factory which created this Scanner
     * @param input the input, might be modified
     * @param inputLength the number of characters of {@code input} to read.
     * Must be non-negative and less than or equal to input.length.
     */
    protected UnicodeReader(ScannerFactory sf, char[] input, int inputLength) {
        log = sf.log;
        names = sf.names;
        // One slot past the input is needed for the EOI sentinel.  When the
        // array is exactly full, either give up a trailing whitespace
        // character for it or copy into an array one element longer.
        if (inputLength == input.length) {
            if (input.length > 0 && Character.isWhitespace(input[input.length - 1])) {
                inputLength--;
            } else {
                input = Arrays.copyOf(input, inputLength + 1);
            }
        }
        buf = input;
        buflen = inputLength;
        buf[buflen] = EOI;
        // scanChar() pre-increments bp, so start just before the first char.
        bp = -1;
        scanChar();
    }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   105
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   106
    /** Read next character.
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   107
     */
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   108
    protected void scanChar() {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   109
        if (bp < buflen) {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   110
            ch = buf[++bp];
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   111
            if (ch == '\\') {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   112
                convertUnicode();
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   113
            }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   114
        }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   115
    }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   116
10948
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   117
    /** Read next character in comment, skipping over double '\' characters.
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   118
     */
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   119
    protected void scanCommentChar() {
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   120
        scanChar();
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   121
        if (ch == '\\') {
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   122
            if (peekChar() == '\\' && !isUnicode()) {
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   123
                skipChar();
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   124
            } else {
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   125
                convertUnicode();
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   126
            }
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   127
        }
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   128
    }
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   129
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   130
    /** Append a character to sbuf.
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   131
     */
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   132
    protected void putChar(char ch, boolean scan) {
14049
3207422a0f9b 7193657: provide internal ArrayUtils class to simplify common usage of arrays in javac
jjg
parents: 10948
diff changeset
   133
        sbuf = ArrayUtils.ensureCapacity(sbuf, sp);
10948
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   134
        sbuf[sp++] = ch;
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   135
        if (scan)
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   136
            scanChar();
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   137
    }
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   138
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   139
    protected void putChar(char ch) {
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   140
        putChar(ch, false);
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   141
    }
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   142
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   143
    protected void putChar(boolean scan) {
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   144
        putChar(ch, scan);
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   145
    }
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   146
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   147
    Name name() {
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   148
        return names.fromChars(sbuf, 0, sp);
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   149
    }
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   150
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   151
    String chars() {
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   152
        return new String(sbuf, 0, sp);
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   153
    }
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   154
10815
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   155
    /** Convert unicode escape; bp points to initial '\' character
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   156
     *  (Spec 3.3).
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   157
     */
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   158
    protected void convertUnicode() {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   159
        if (ch == '\\' && unicodeConversionBp != bp) {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   160
            bp++; ch = buf[bp];
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   161
            if (ch == 'u') {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   162
                do {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   163
                    bp++; ch = buf[bp];
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   164
                } while (ch == 'u');
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   165
                int limit = bp + 3;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   166
                if (limit < buflen) {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   167
                    int d = digit(bp, 16);
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   168
                    int code = d;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   169
                    while (bp < limit && d >= 0) {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   170
                        bp++; ch = buf[bp];
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   171
                        d = digit(bp, 16);
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   172
                        code = (code << 4) + d;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   173
                    }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   174
                    if (d >= 0) {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   175
                        ch = (char)code;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   176
                        unicodeConversionBp = bp;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   177
                        return;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   178
                    }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   179
                }
45504
ea7475564d07 8170326: Inconsistencies between code, compiler.properties and comments
jlahoda
parents: 25874
diff changeset
   180
                log.error(bp, Errors.IllegalUnicodeEsc);
10815
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   181
            } else {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   182
                bp--;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   183
                ch = '\\';
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   184
            }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   185
        }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   186
    }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   187
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   188
    /** Are surrogates supported?
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   189
     */
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   190
    final static boolean surrogatesSupported = surrogatesSupported();
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   191
    private static boolean surrogatesSupported() {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   192
        try {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   193
            Character.isHighSurrogate('a');
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   194
            return true;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   195
        } catch (NoSuchMethodError ex) {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   196
            return false;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   197
        }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   198
    }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   199
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   200
    /** Scan surrogate pairs.  If 'ch' is a high surrogate and
25600
7f93cb0536fd 8048805: Request to investigate and update lexer error recovery in javac
jlahoda
parents: 15385
diff changeset
   201
     *  the next character is a low surrogate, returns the code point
7f93cb0536fd 8048805: Request to investigate and update lexer error recovery in javac
jlahoda
parents: 15385
diff changeset
   202
     *  constructed from these surrogates. Otherwise, returns -1.
7f93cb0536fd 8048805: Request to investigate and update lexer error recovery in javac
jlahoda
parents: 15385
diff changeset
   203
     *  This method will not consume any of the characters.
10815
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   204
     */
25600
7f93cb0536fd 8048805: Request to investigate and update lexer error recovery in javac
jlahoda
parents: 15385
diff changeset
   205
    protected int peekSurrogates() {
10815
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   206
        if (surrogatesSupported && Character.isHighSurrogate(ch)) {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   207
            char high = ch;
25600
7f93cb0536fd 8048805: Request to investigate and update lexer error recovery in javac
jlahoda
parents: 15385
diff changeset
   208
            int prevBP = bp;
10815
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   209
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   210
            scanChar();
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   211
25600
7f93cb0536fd 8048805: Request to investigate and update lexer error recovery in javac
jlahoda
parents: 15385
diff changeset
   212
            char low = ch;
10815
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   213
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   214
            ch = high;
25600
7f93cb0536fd 8048805: Request to investigate and update lexer error recovery in javac
jlahoda
parents: 15385
diff changeset
   215
            bp = prevBP;
7f93cb0536fd 8048805: Request to investigate and update lexer error recovery in javac
jlahoda
parents: 15385
diff changeset
   216
7f93cb0536fd 8048805: Request to investigate and update lexer error recovery in javac
jlahoda
parents: 15385
diff changeset
   217
            if (Character.isLowSurrogate(low)) {
7f93cb0536fd 8048805: Request to investigate and update lexer error recovery in javac
jlahoda
parents: 15385
diff changeset
   218
                return Character.toCodePoint(high, low);
7f93cb0536fd 8048805: Request to investigate and update lexer error recovery in javac
jlahoda
parents: 15385
diff changeset
   219
            }
10815
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   220
        }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   221
25600
7f93cb0536fd 8048805: Request to investigate and update lexer error recovery in javac
jlahoda
parents: 15385
diff changeset
   222
        return -1;
10815
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   223
    }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   224
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   225
    /** Convert an ASCII digit from its base (8, 10, or 16)
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   226
     *  to its value.
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   227
     */
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   228
    protected int digit(int pos, int base) {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   229
        char c = ch;
25600
7f93cb0536fd 8048805: Request to investigate and update lexer error recovery in javac
jlahoda
parents: 15385
diff changeset
   230
        if ('0' <= c && c <= '9')
7f93cb0536fd 8048805: Request to investigate and update lexer error recovery in javac
jlahoda
parents: 15385
diff changeset
   231
            return Character.digit(c, base); //a fast common case
7f93cb0536fd 8048805: Request to investigate and update lexer error recovery in javac
jlahoda
parents: 15385
diff changeset
   232
        int codePoint = peekSurrogates();
7f93cb0536fd 8048805: Request to investigate and update lexer error recovery in javac
jlahoda
parents: 15385
diff changeset
   233
        int result = codePoint >= 0 ? Character.digit(codePoint, base) : Character.digit(c, base);
10815
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   234
        if (result >= 0 && c > 0x7f) {
45504
ea7475564d07 8170326: Inconsistencies between code, compiler.properties and comments
jlahoda
parents: 25874
diff changeset
   235
            log.error(pos + 1, Errors.IllegalNonasciiDigit);
25600
7f93cb0536fd 8048805: Request to investigate and update lexer error recovery in javac
jlahoda
parents: 15385
diff changeset
   236
            if (codePoint >= 0)
7f93cb0536fd 8048805: Request to investigate and update lexer error recovery in javac
jlahoda
parents: 15385
diff changeset
   237
                scanChar();
10815
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   238
            ch = "0123456789abcdef".charAt(result);
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   239
        }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   240
        return result;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   241
    }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   242
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   243
    protected boolean isUnicode() {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   244
        return unicodeConversionBp == bp;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   245
    }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   246
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   247
    protected void skipChar() {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   248
        bp++;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   249
    }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   250
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   251
    protected char peekChar() {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   252
        return buf[bp + 1];
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   253
    }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   254
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   255
    /**
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   256
     * Returns a copy of the input buffer, up to its inputLength.
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   257
     * Unicode escape sequences are not translated.
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   258
     */
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   259
    public char[] getRawCharacters() {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   260
        char[] chars = new char[buflen];
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   261
        System.arraycopy(buf, 0, chars, 0, buflen);
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   262
        return chars;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   263
    }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   264
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   265
    /**
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   266
     * Returns a copy of a character array subset of the input buffer.
14259
fb94a1df0d53 8000208: fix langtools javadoc comment issues
jjg
parents: 14049
diff changeset
   267
     * The returned array begins at the {@code beginIndex} and
fb94a1df0d53 8000208: fix langtools javadoc comment issues
jjg
parents: 14049
diff changeset
   268
     * extends to the character at index {@code endIndex - 1}.
fb94a1df0d53 8000208: fix langtools javadoc comment issues
jjg
parents: 14049
diff changeset
   269
     * Thus the length of the substring is {@code endIndex-beginIndex}.
10815
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   270
     * This behavior is like
14259
fb94a1df0d53 8000208: fix langtools javadoc comment issues
jjg
parents: 14049
diff changeset
   271
     * {@code String.substring(beginIndex, endIndex)}.
10815
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   272
     * Unicode escape sequences are not translated.
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   273
     *
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   274
     * @param beginIndex the beginning index, inclusive.
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   275
     * @param endIndex the ending index, exclusive.
14259
fb94a1df0d53 8000208: fix langtools javadoc comment issues
jjg
parents: 14049
diff changeset
   276
     * @throws ArrayIndexOutOfBoundsException if either offset is outside of the
10815
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   277
     *         array bounds
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   278
     */
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   279
    public char[] getRawCharacters(int beginIndex, int endIndex) {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   280
        int length = endIndex - beginIndex;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   281
        char[] chars = new char[length];
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   282
        System.arraycopy(buf, beginIndex, chars, 0, length);
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   283
        return chars;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   284
    }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   285
}