langtools/src/share/classes/com/sun/tools/javac/parser/UnicodeReader.java
author mcimadamore
Fri, 04 Nov 2011 12:36:40 +0000
changeset 10948 063463f6535f
parent 10815 a719aa5f1631
child 14049 3207422a0f9b
permissions -rw-r--r--
7104201: Refactor DocCommentScanner Summary: Add new Comment helper class to parse contents of comments in source code Reviewed-by: jjg
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
10815
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
     1
/*
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
     2
 * Copyright (c) 2011, Oracle and/or its affiliates. All rights reserved.
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
     3
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
     4
 *
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
     5
 * This code is free software; you can redistribute it and/or modify it
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
     6
 * under the terms of the GNU General Public License version 2 only, as
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
     7
 * published by the Free Software Foundation.  Oracle designates this
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
     8
 * particular file as subject to the "Classpath" exception as provided
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
     9
 * by Oracle in the LICENSE file that accompanied this code.
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    10
 *
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    11
 * This code is distributed in the hope that it will be useful, but WITHOUT
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    12
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    13
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    14
 * version 2 for more details (a copy is included in the LICENSE file that
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    15
 * accompanied this code).
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    16
 *
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    17
 * You should have received a copy of the GNU General Public License version
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    18
 * 2 along with this work; if not, write to the Free Software Foundation,
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    19
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    20
 *
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    21
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    22
 * or visit www.oracle.com if you need additional information or have any
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    23
 * questions.
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    24
 */
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    25
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    26
package com.sun.tools.javac.parser;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    27
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    28
import com.sun.tools.javac.file.JavacFileManager;
10948
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
    29
import com.sun.tools.javac.util.Log;
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
    30
import com.sun.tools.javac.util.Name;
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
    31
import com.sun.tools.javac.util.Names;
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
    32
10815
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    33
import java.nio.CharBuffer;
10948
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
    34
10815
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    35
import static com.sun.tools.javac.util.LayoutCharacters.*;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    36
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    37
/** The char reader used by the javac lexer/tokenizer. Returns the sequence of
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    38
 * characters contained in the input stream, handling unicode escape accordingly.
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    39
 * Additionally, it provides features for saving chars into a buffer and for retrieving
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    40
 * them at a later stage.
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    41
 *
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    42
 *  <p><b>This is NOT part of any supported API.
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    43
 *  If you write code that depends on this, you do so at your own risk.
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    44
 *  This code and its internal interfaces are subject to change or
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    45
 *  deletion without notice.</b>
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    46
 */
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    47
public class UnicodeReader {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    48
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    49
    /** The input buffer.  The constructor stores a sentinel (EOI) at
     *  {@code buf[buflen]}, so the array holds at least {@code buflen + 1} chars.
     */
    protected char[] buf;

    /** Index into {@code buf} of the current character; starts at -1 and is
     *  advanced by {@code scanChar} before each read.
     */
    protected int bp;

    /** Index of one past the last input character in {@code buf}.
     */
    protected final int buflen;

    /** The current character.
     */
    protected char ch;

    /** The buffer index of the last converted unicode character
     *  (-1 until a unicode escape has been converted).
     */
    protected int unicodeConversionBp = -1;

    /** Log taken from the scanner factory; used to report lexical errors.
     */
    protected Log log;

    /** Name table taken from the scanner factory; used by {@code name()}.
     */
    protected Names names;

    /** A character buffer for saved chars.  It is doubled in size by
     *  {@code putChar} whenever it is full.
     */
    protected char[] sbuf = new char[128];

    /** Number of chars currently saved in {@code sbuf}.
     */
    protected int sp;
10815
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    71
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    72
    /**
     * Create a scanner from the contents of a char buffer.  The buffer is
     * converted to an array with {@code JavacFileManager.toArray} and handed,
     * together with {@code buffer.limit()} as the input length, to the
     * array-based constructor.  That constructor might modify the array; it
     * avoids copying the array when the input length is less than the
     * array length or the last array element is a white space character.
     *
     * @param sf the factory which created this Scanner
     * @param buffer the input; the array obtained from it might be modified
     */
    protected UnicodeReader(ScannerFactory sf, CharBuffer buffer) {
        this(sf, JavacFileManager.toArray(buffer), buffer.limit());
    }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    86
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    87
    protected UnicodeReader(ScannerFactory sf, char[] input, int inputLength) {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    88
        log = sf.log;
10948
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
    89
        names = sf.names;
10815
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    90
        if (inputLength == input.length) {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    91
            if (input.length > 0 && Character.isWhitespace(input[input.length - 1])) {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    92
                inputLength--;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    93
            } else {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    94
                char[] newInput = new char[inputLength + 1];
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    95
                System.arraycopy(input, 0, newInput, 0, input.length);
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    96
                input = newInput;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    97
            }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    98
        }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
    99
        buf = input;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   100
        buflen = inputLength;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   101
        buf[buflen] = EOI;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   102
        bp = -1;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   103
        scanChar();
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   104
    }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   105
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   106
    /** Read next character.
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   107
     */
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   108
    protected void scanChar() {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   109
        if (bp < buflen) {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   110
            ch = buf[++bp];
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   111
            if (ch == '\\') {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   112
                convertUnicode();
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   113
            }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   114
        }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   115
    }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   116
10948
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   117
    /** Read next character in comment, skipping over double '\' characters.
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   118
     */
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   119
    protected void scanCommentChar() {
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   120
        scanChar();
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   121
        if (ch == '\\') {
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   122
            if (peekChar() == '\\' && !isUnicode()) {
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   123
                skipChar();
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   124
            } else {
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   125
                convertUnicode();
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   126
            }
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   127
        }
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   128
    }
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   129
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   130
    /** Append a character to sbuf.
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   131
     */
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   132
    protected void putChar(char ch, boolean scan) {
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   133
        if (sp == sbuf.length) {
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   134
            char[] newsbuf = new char[sbuf.length * 2];
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   135
            System.arraycopy(sbuf, 0, newsbuf, 0, sbuf.length);
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   136
            sbuf = newsbuf;
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   137
        }
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   138
        sbuf[sp++] = ch;
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   139
        if (scan)
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   140
            scanChar();
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   141
    }
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   142
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   143
    protected void putChar(char ch) {
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   144
        putChar(ch, false);
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   145
    }
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   146
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   147
    protected void putChar(boolean scan) {
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   148
        putChar(ch, scan);
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   149
    }
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   150
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   151
    Name name() {
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   152
        return names.fromChars(sbuf, 0, sp);
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   153
    }
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   154
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   155
    String chars() {
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   156
        return new String(sbuf, 0, sp);
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   157
    }
063463f6535f 7104201: Refactor DocCommentScanner
mcimadamore
parents: 10815
diff changeset
   158
10815
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   159
    /** Convert unicode escape; bp points to initial '\' character
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   160
     *  (Spec 3.3).
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   161
     */
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   162
    protected void convertUnicode() {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   163
        if (ch == '\\' && unicodeConversionBp != bp) {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   164
            bp++; ch = buf[bp];
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   165
            if (ch == 'u') {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   166
                do {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   167
                    bp++; ch = buf[bp];
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   168
                } while (ch == 'u');
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   169
                int limit = bp + 3;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   170
                if (limit < buflen) {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   171
                    int d = digit(bp, 16);
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   172
                    int code = d;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   173
                    while (bp < limit && d >= 0) {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   174
                        bp++; ch = buf[bp];
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   175
                        d = digit(bp, 16);
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   176
                        code = (code << 4) + d;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   177
                    }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   178
                    if (d >= 0) {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   179
                        ch = (char)code;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   180
                        unicodeConversionBp = bp;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   181
                        return;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   182
                    }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   183
                }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   184
                log.error(bp, "illegal.unicode.esc");
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   185
            } else {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   186
                bp--;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   187
                ch = '\\';
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   188
            }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   189
        }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   190
    }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   191
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   192
    /** Are surrogates supported?
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   193
     */
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   194
    final static boolean surrogatesSupported = surrogatesSupported();
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   195
    private static boolean surrogatesSupported() {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   196
        try {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   197
            Character.isHighSurrogate('a');
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   198
            return true;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   199
        } catch (NoSuchMethodError ex) {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   200
            return false;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   201
        }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   202
    }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   203
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   204
    /** Scan surrogate pairs.  If 'ch' is a high surrogate and
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   205
     *  the next character is a low surrogate, then put the low
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   206
     *  surrogate in 'ch', and return the high surrogate.
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   207
     *  otherwise, just return 0.
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   208
     */
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   209
    protected char scanSurrogates() {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   210
        if (surrogatesSupported && Character.isHighSurrogate(ch)) {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   211
            char high = ch;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   212
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   213
            scanChar();
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   214
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   215
            if (Character.isLowSurrogate(ch)) {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   216
                return high;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   217
            }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   218
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   219
            ch = high;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   220
        }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   221
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   222
        return 0;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   223
    }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   224
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   225
    /** Convert an ASCII digit from its base (8, 10, or 16)
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   226
     *  to its value.
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   227
     */
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   228
    protected int digit(int pos, int base) {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   229
        char c = ch;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   230
        int result = Character.digit(c, base);
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   231
        if (result >= 0 && c > 0x7f) {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   232
            log.error(pos + 1, "illegal.nonascii.digit");
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   233
            ch = "0123456789abcdef".charAt(result);
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   234
        }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   235
        return result;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   236
    }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   237
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   238
    protected boolean isUnicode() {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   239
        return unicodeConversionBp == bp;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   240
    }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   241
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   242
    protected void skipChar() {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   243
        bp++;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   244
    }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   245
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   246
    protected char peekChar() {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   247
        return buf[bp + 1];
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   248
    }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   249
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   250
    /**
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   251
     * Returns a copy of the input buffer, up to its inputLength.
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   252
     * Unicode escape sequences are not translated.
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   253
     */
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   254
    public char[] getRawCharacters() {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   255
        char[] chars = new char[buflen];
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   256
        System.arraycopy(buf, 0, chars, 0, buflen);
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   257
        return chars;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   258
    }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   259
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   260
    /**
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   261
     * Returns a copy of a character array subset of the input buffer.
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   262
     * The returned array begins at the <code>beginIndex</code> and
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   263
     * extends to the character at index <code>endIndex - 1</code>.
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   264
     * Thus the length of the substring is <code>endIndex-beginIndex</code>.
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   265
     * This behavior is like
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   266
     * <code>String.substring(beginIndex, endIndex)</code>.
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   267
     * Unicode escape sequences are not translated.
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   268
     *
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   269
     * @param beginIndex the beginning index, inclusive.
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   270
     * @param endIndex the ending index, exclusive.
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   271
     * @throws IndexOutOfBounds if either offset is outside of the
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   272
     *         array bounds
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   273
     */
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   274
    public char[] getRawCharacters(int beginIndex, int endIndex) {
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   275
        int length = endIndex - beginIndex;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   276
        char[] chars = new char[length];
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   277
        System.arraycopy(buf, beginIndex, chars, 0, length);
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   278
        return chars;
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   279
    }
a719aa5f1631 7096014: Javac tokens should retain state
mcimadamore
parents:
diff changeset
   280
}