nashorn/src/jdk/nashorn/internal/runtime/regexp/RegExp.java
author hannesw
Thu, 22 Aug 2013 17:23:50 +0200
changeset 19621 1b2a79d8924c
parent 16525 1409942e618e
child 24778 2ff5d7041566
permissions -rw-r--r--
8023531: new RegExp('').toString() should return '/(?:)/' Reviewed-by: sundar, jlaskey
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
16147
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
     1
/*
16151
97c1e756ae1e 8005663: Update copyright year to 2013
jlaskey
parents: 16147
diff changeset
     2
 * Copyright (c) 2010, 2013, Oracle and/or its affiliates. All rights reserved.
16147
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
     3
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
     4
 *
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
     5
 * This code is free software; you can redistribute it and/or modify it
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
     6
 * under the terms of the GNU General Public License version 2 only, as
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
     7
 * published by the Free Software Foundation.  Oracle designates this
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
     8
 * particular file as subject to the "Classpath" exception as provided
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
     9
 * by Oracle in the LICENSE file that accompanied this code.
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    10
 *
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    11
 * This code is distributed in the hope that it will be useful, but WITHOUT
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    12
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    13
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    14
 * version 2 for more details (a copy is included in the LICENSE file that
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    15
 * accompanied this code).
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    16
 *
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    17
 * You should have received a copy of the GNU General Public License version
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    18
 * 2 along with this work; if not, write to the Free Software Foundation,
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    19
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    20
 *
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    21
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    22
 * or visit www.oracle.com if you need additional information or have any
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    23
 * questions.
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    24
 */
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    25
16258
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
    26
package jdk.nashorn.internal.runtime.regexp;
16147
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    27
16258
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
    28
import jdk.nashorn.internal.runtime.BitVector;
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
    29
import jdk.nashorn.internal.runtime.ECMAErrors;
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
    30
import jdk.nashorn.internal.runtime.ParserException;
16147
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    31
16258
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
    32
import java.util.regex.MatchResult;
16147
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    33
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    34
/**
16258
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
    35
 * This is the base class for representing a parsed regular expression.
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
    36
 *
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
    37
 * Instances of this class are created by a {@link RegExpFactory}.
16147
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    38
 */
16258
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
    39
public abstract class RegExp {
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
    40
16147
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    41
    /** Pattern string. */
16258
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
    42
    private final String source;
16147
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    43
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    44
    /** Global search flag for this regexp.*/
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    45
    private boolean global;
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    46
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    47
    /** Case insensitive flag for this regexp */
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    48
    private boolean ignoreCase;
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    49
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    50
    /** Multi-line flag for this regexp */
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    51
    private boolean multiline;
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    52
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    53
    /** BitVector that keeps track of groups in negative lookahead */
16258
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
    54
    protected BitVector groupsInNegativeLookahead;
16147
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    55
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    56
    /**
16258
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
    57
     * Constructor.
16147
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    58
     *
16258
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
    59
     * @param source the source string
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
    60
     * @param flags the flags string
16147
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    61
     */
16258
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
    62
    protected RegExp(final String source, final String flags) {
19621
1b2a79d8924c 8023531: new RegExp('').toString() should return '/(?:)/'
hannesw
parents: 16525
diff changeset
    63
        this.source = source.length() == 0 ? "(?:)" : source;
16258
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
    64
        for (int i = 0; i < flags.length(); i++) {
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
    65
            final char ch = flags.charAt(i);
16147
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    66
            switch (ch) {
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    67
            case 'g':
16258
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
    68
                if (this.global) {
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
    69
                    throwParserException("repeated.flag", "g");
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
    70
                }
16147
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    71
                this.global = true;
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    72
                break;
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    73
            case 'i':
16258
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
    74
                if (this.ignoreCase) {
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
    75
                    throwParserException("repeated.flag", "i");
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
    76
                }
16147
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    77
                this.ignoreCase = true;
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    78
                break;
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    79
            case 'm':
16258
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
    80
                if (this.multiline) {
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
    81
                    throwParserException("repeated.flag", "m");
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
    82
                }
16147
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    83
                this.multiline = true;
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    84
                break;
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    85
            default:
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    86
                throwParserException("unsupported.flag", Character.toString(ch));
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    87
            }
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    88
        }
16258
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
    89
    }
16147
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    90
16258
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
    91
    /**
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
    92
     * Get the source pattern of this regular expression.
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
    93
     *
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
    94
     * @return the source string
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
    95
     */
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
    96
    public String getSource() {
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
    97
        return source;
16147
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    98
    }
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
    99
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
   100
    /**
16258
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
   101
     * Set the global flag of this regular expression to {@code global}.
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
   102
     *
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
   103
     * @param global the new global flag
16147
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
   104
     */
16258
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
   105
    public void setGlobal(final boolean global) {
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
   106
        this.global = global;
16147
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
   107
    }
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
   108
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
   109
    /**
16258
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
   110
     * Get the global flag of this regular expression.
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
   111
     *
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
   112
     * @return the global flag
16147
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
   113
     */
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
   114
    public boolean isGlobal() {
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
   115
        return global;
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
   116
    }
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
   117
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
   118
    /**
16258
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
   119
     * Get the ignore-case flag of this regular expression.
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
   120
     *
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
   121
     * @return the ignore-case flag
16147
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
   122
     */
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
   123
    public boolean isIgnoreCase() {
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
   124
        return ignoreCase;
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
   125
    }
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
   126
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
   127
    /**
16258
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
   128
     * Get the multiline flag of this regular expression.
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
   129
     *
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
   130
     * @return the multiline flag
16147
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
   131
     */
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
   132
    public boolean isMultiline() {
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
   133
        return multiline;
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
   134
    }
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
   135
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
   136
    /**
16258
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
   137
     * Get a bitset indicating which of the groups in this regular expression are inside a negative lookahead.
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
   138
     *
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
   139
     * @return the groups-in-negative-lookahead bitset
16147
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
   140
     */
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
   141
    public BitVector getGroupsInNegativeLookahead() {
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
   142
        return groupsInNegativeLookahead;
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
   143
    }
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
   144
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
   145
    /**
16258
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
   146
     * Match this regular expression against {@code str}, starting at index {@code start}
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
   147
     * and return a {@link MatchResult} with the result.
16147
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
   148
     *
16258
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
   149
     * @param str the string
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
   150
     * @return the matcher
16147
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
   151
     */
16258
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
   152
    public abstract RegExpMatcher match(String str);
16147
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
   153
16258
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
   154
    /**
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
   155
     * Throw a regexp parser exception.
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
   156
     *
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
   157
     * @param key the message key
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
   158
     * @param str string argument
16525
1409942e618e 8009982: Lazy execution bugfix. Added lazy sunspider unit test. Added mandreel to compile-octane test. Fixed warnings
lagergren
parents: 16258
diff changeset
   159
     * @throws jdk.nashorn.internal.runtime.ParserException unconditionally
16258
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
   160
     */
0e25f785df4d 8008093: Make RegExp engine pluggable
hannesw
parents: 16226
diff changeset
   161
    protected static void throwParserException(final String key, final String str) throws ParserException {
16147
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
   162
        throw new ParserException(ECMAErrors.getMessage("parser.error.regex." + key, str));
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
   163
    }
e63b63819133 8005403: Open-source Nashorn
jlaskey
parents:
diff changeset
   164
}