test/jdk/java/util/regex/RegExTest.java
author naoto
Thu, 23 May 2019 12:21:21 -0700
changeset 55013 8dae495a59e7
parent 49763 1ccf5fae9664
child 55096 234673929e0a
child 58678 9cf78a70fa4f
permissions -rw-r--r--
8221431: Support for Unicode 12.1 Reviewed-by: erikj, rriggs
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
     1
/*
48491
7f11a1699ef6 8194667: Regex: Serialization doesn't work with match flags
sherman
parents: 47216
diff changeset
     2
 * Copyright (c) 1999, 2018, Oracle and/or its affiliates. All rights reserved.
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
     3
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
     4
 *
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
     5
 * This code is free software; you can redistribute it and/or modify it
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
     6
 * under the terms of the GNU General Public License version 2 only, as
21596
0e3a39f29dbc 8027696: Incorrect copyright header in the tests
serb
parents: 19604
diff changeset
     7
 * published by the Free Software Foundation.
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
     8
 *
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
     9
 * This code is distributed in the hope that it will be useful, but WITHOUT
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    10
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    11
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    12
 * version 2 for more details (a copy is included in the LICENSE file that
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    13
 * accompanied this code).
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    14
 *
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    15
 * You should have received a copy of the GNU General Public License version
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    16
 * 2 along with this work; if not, write to the Free Software Foundation,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    17
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    18
 *
5506
202f599c92aa 6943119: Rebrand source copyright notices
ohair
parents: 5295
diff changeset
    19
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
202f599c92aa 6943119: Rebrand source copyright notices
ohair
parents: 5295
diff changeset
    20
 * or visit www.oracle.com if you need additional information or have any
202f599c92aa 6943119: Rebrand source copyright notices
ohair
parents: 5295
diff changeset
    21
 * questions.
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    22
 */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    23
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    24
/**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    25
 * @test
30370
984bf40cdc67 8079419: Update to RegEx test to use random number library
darcy
parents: 30046
diff changeset
    26
 * @summary tests RegExp framework (use -Dseed=X to set PRNG seed)
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    27
 * @author Mike McCloskey
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    28
 * @bug 4481568 4482696 4495089 4504687 4527731 4599621 4631553 4619345
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    29
 * 4630911 4672616 4711773 4727935 4750573 4792284 4803197 4757029 4808962
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    30
 * 4872664 4803179 4892980 4900747 4945394 4938995 4979006 4994840 4997476
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    31
 * 5013885 5003322 4988891 5098443 5110268 6173522 4829857 5027748 6376940
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    32
 * 6358731 6178785 6284152 6231989 6497148 6486934 6233084 6504326 6635133
11287
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
    33
 * 6350801 6676425 6878475 6919132 6931676 6948903 6990617 7014645 7039066
21668
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
    34
 * 7067045 7014640 7189363 8007395 8013252 8013254 8012646 8023647 6559590
35783
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
    35
 * 8027645 8035076 8039124 8035975 8074678 6854417 8143854 8147531 7071819
45888
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
    36
 * 8151481 4867170 7080302 6728861 6995635 6736245 4916384 6328855 6192895
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
    37
 * 6345469 6988218 6693451 7006761 8140212 8143282 8158482 8176029 8184706
55013
8dae495a59e7 8221431: Support for Unicode 12.1
naoto
parents: 49763
diff changeset
    38
 * 8194667 8197462 8184692 8221431
37882
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
    39
 *
45288
58be10a068c2 8180805: move RandomFactory to the top level testlibrary
iignatyev
parents: 44122
diff changeset
    40
 * @library /test/lib
55013
8dae495a59e7 8221431: Support for Unicode 12.1
naoto
parents: 49763
diff changeset
    41
 * @library /lib/testlibrary/java/lang
45466
faf1c55d2046 8181759: add explicit @build actions for jdk.test.lib classes in all :tier1 tests
iignatyev
parents: 45288
diff changeset
    42
 * @build jdk.test.lib.RandomFactory
30370
984bf40cdc67 8079419: Update to RegEx test to use random number library
darcy
parents: 30046
diff changeset
    43
 * @run main RegExTest
31645
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
    44
 * @key randomness
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    45
 */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    46
29243
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
    47
import java.util.function.Function;
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    48
import java.util.regex.*;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    49
import java.util.Random;
35783
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
    50
import java.util.Scanner;
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    51
import java.io.*;
35783
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
    52
import java.nio.file.*;
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    53
import java.util.*;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    54
import java.nio.CharBuffer;
17447
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
    55
import java.util.function.Predicate;
45288
58be10a068c2 8180805: move RandomFactory to the top level testlibrary
iignatyev
parents: 44122
diff changeset
    56
import jdk.test.lib.RandomFactory;
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    57
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    58
/**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    59
 * This is a test class created to check the operation of
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    60
 * the Pattern and Matcher classes.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    61
 */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    62
public class RegExTest {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    63
30370
984bf40cdc67 8079419: Update to RegEx test to use random number library
darcy
parents: 30046
diff changeset
    64
    private static Random generator = RandomFactory.getRandom();
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    65
    private static boolean failure = false;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    66
    private static int failCount = 0;
11287
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
    67
    private static String firstFailure = null;
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    68
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    69
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    70
     * Main to interpret arguments and run several tests.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    71
     *
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    72
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    73
    public static void main(String[] args) throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    74
        // Most of the tests are in a file
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    75
        processFile("TestCases.txt");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    76
        //processFile("PerlCases.txt");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    77
        processFile("BMPTestCases.txt");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    78
        processFile("SupplementaryTestCases.txt");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    79
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    80
        // These test many randomly generated char patterns
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    81
        bm();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    82
        slice();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    83
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    84
        // These are hard to put into the file
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    85
        escapes();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    86
        blankInput();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    87
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    88
        // Substitition tests on randomly generated sequences
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    89
        globalSubstitute();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    90
        stringbufferSubstitute();
23734
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
    91
        stringbuilderSubstitute();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
    92
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    93
        substitutionBasher();
23734
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
    94
        substitutionBasher2();
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    95
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    96
        // Canonical Equivalence
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    97
        ceTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    98
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    99
        // Anchors
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   100
        anchorTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   101
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   102
        // boolean match calls
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   103
        matchesTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   104
        lookingAtTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   105
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   106
        // Pattern API
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   107
        patternMatchesTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   108
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   109
        // Misc
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   110
        lookbehindTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   111
        nullArgumentTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   112
        backRefTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   113
        groupCaptureTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   114
        caretTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   115
        charClassTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   116
        emptyPatternTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   117
        findIntTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   118
        group0Test();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   119
        longPatternTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   120
        octalTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   121
        ampersandTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   122
        negationTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   123
        splitTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   124
        appendTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   125
        caseFoldingTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   126
        commentsTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   127
        unixLinesTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   128
        replaceFirstTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   129
        gTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   130
        zTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   131
        serializeTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   132
        reluctantRepetitionTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   133
        multilineDollarTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   134
        dollarAtEndTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   135
        caretBetweenTerminatorsTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   136
        // This RFE rejected in Tiger numOccurrencesTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   137
        javaCharClassTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   138
        nonCaptureRepetitionTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   139
        notCapturedGroupCurlyMatchTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   140
        escapedSegmentTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   141
        literalPatternTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   142
        literalReplacementTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   143
        regionTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   144
        toStringTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   145
        negatedCharClassTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   146
        findFromTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   147
        boundsTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   148
        unicodeWordBoundsTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   149
        caretAtEndTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   150
        wordSearchTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   151
        hitEndTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   152
        toMatchResultTest();
29503
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   153
        toMatchResultTest2();
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   154
        surrogatesInClassTest();
11287
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   155
        removeQEQuotingTest();
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   156
        namedGroupCaptureTest();
4820
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
   157
        nonBmpClassComplementTest();
5610
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
   158
        unicodePropertiesTest();
8173
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
   159
        unicodeHexNotationTest();
9536
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
   160
        unicodeClassesTest();
35783
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
   161
        unicodeCharacterNameTest();
12675
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
   162
        horizontalAndVerticalWSTest();
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
   163
        linebreakTest();
13554
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
   164
        branchTest();
17183
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
   165
        groupCurlyNotFoundSuppTest();
19604
f96e3aef2081 8023647: "abc1c".matches("(\\w)+1\\1")) returns false
sherman
parents: 17447
diff changeset
   166
        groupCurlyBackoffTest();
17447
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
   167
        patternAsPredicate();
49763
1ccf5fae9664 8184692: add Pattern.asMatchPredicate
vtheeyarath
parents: 49554
diff changeset
   168
        patternAsMatchPredicate();
25523
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
   169
        invalidFlags();
38777
826eb7091523 8158482: regex UNICODE_CHARACTER_CLASS flag cannot be disabled with an embedded flag expression
sherman
parents: 38450
diff changeset
   170
        embeddedFlags();
35783
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
   171
        grapheme();
37882
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
   172
        expoBacktracking();
48853
84b4ffbba8b0 8197462: Inconsistent exception messages for invalid capturing group names
igerasim
parents: 48491
diff changeset
   173
        invalidGroupName();
21668
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
   174
11287
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   175
        if (failure) {
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   176
            throw new
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   177
                RuntimeException("RegExTest failed, 1st failure: " +
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   178
                                 firstFailure);
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   179
        } else {
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   180
            System.err.println("OKAY: All tests passed.");
11287
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   181
        }
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   182
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   183
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   184
    // Utility functions
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   185
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   186
    private static String getRandomAlphaString(int length) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   187
        StringBuffer buf = new StringBuffer(length);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   188
        for (int i=0; i<length; i++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   189
            char randChar = (char)(97 + generator.nextInt(26));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   190
            buf.append(randChar);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   191
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   192
        return buf.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   193
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   194
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   195
    private static void check(Matcher m, String expected) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   196
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   197
        if (!m.group().equals(expected))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   198
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   199
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   200
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   201
    private static void check(Matcher m, String result, boolean expected) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   202
        m.find();
8173
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
   203
        if (m.group().equals(result) != expected)
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
   204
            failCount++;
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   205
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   206
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   207
    private static void check(Pattern p, String s, boolean expected) {
8173
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
   208
        if (p.matcher(s).find() != expected)
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
   209
            failCount++;
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
   210
    }
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
   211
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
   212
    private static void check(String p, String s, boolean expected) {
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
   213
        Matcher matcher = Pattern.compile(p).matcher(s);
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
   214
        if (matcher.find() != expected)
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
   215
            failCount++;
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   216
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   217
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   218
    private static void check(String p, char c, boolean expected) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   219
        String propertyPattern = expected ? "\\p" + p : "\\P" + p;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   220
        Pattern pattern = Pattern.compile(propertyPattern);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   221
        char[] ca = new char[1]; ca[0] = c;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   222
        Matcher matcher = pattern.matcher(new String(ca));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   223
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   224
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   225
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   226
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   227
    private static void check(String p, int codePoint, boolean expected) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   228
        String propertyPattern = expected ? "\\p" + p : "\\P" + p;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   229
        Pattern pattern = Pattern.compile(propertyPattern);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   230
        char[] ca = Character.toChars(codePoint);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   231
        Matcher matcher = pattern.matcher(new String(ca));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   232
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   233
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   234
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   235
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   236
    private static void check(String p, int flag, String input, String s,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   237
                              boolean expected)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   238
    {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   239
        Pattern pattern = Pattern.compile(p, flag);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   240
        Matcher matcher = pattern.matcher(input);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   241
        if (expected)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   242
            check(matcher, s, expected);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   243
        else
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   244
            check(pattern, input, false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   245
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   246
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   247
    private static void report(String testName) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   248
        int spacesToAdd = 30 - testName.length();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   249
        StringBuffer paddedNameBuffer = new StringBuffer(testName);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   250
        for (int i=0; i<spacesToAdd; i++)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   251
            paddedNameBuffer.append(" ");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   252
        String paddedName = paddedNameBuffer.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   253
        System.err.println(paddedName + ": " +
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   254
                           (failCount==0 ? "Passed":"Failed("+failCount+")"));
11287
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   255
        if (failCount > 0) {
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   256
            failure = true;
11287
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   257
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   258
            if (firstFailure == null) {
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   259
                firstFailure = testName;
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   260
            }
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   261
        }
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   262
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   263
        failCount = 0;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   264
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   265
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   266
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   267
     * Converts ASCII alphabet characters [A-Za-z] in the given 's' to
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   268
     * supplementary characters. This method does NOT fully take care
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   269
     * of the regex syntax.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   270
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   271
    private static String toSupplementaries(String s) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   272
        int length = s.length();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   273
        StringBuffer sb = new StringBuffer(length * 2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   274
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   275
        for (int i = 0; i < length; ) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   276
            char c = s.charAt(i++);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   277
            if (c == '\\') {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   278
                sb.append(c);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   279
                if (i < length) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   280
                    c = s.charAt(i++);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   281
                    sb.append(c);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   282
                    if (c == 'u') {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   283
                        // assume no syntax error
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   284
                        sb.append(s.charAt(i++));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   285
                        sb.append(s.charAt(i++));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   286
                        sb.append(s.charAt(i++));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   287
                        sb.append(s.charAt(i++));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   288
                    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   289
                }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   290
            } else if ((c >= 'A' && c <= 'Z') || (c >= 'a' && c <= 'z')) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   291
                sb.append('\ud800').append((char)('\udc00'+c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   292
            } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   293
                sb.append(c);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   294
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   295
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   296
        return sb.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   297
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   298
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   299
    // Regular expression tests
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   300
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   301
    // This is for bug 6178785
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   302
    // Test if an expected NPE gets thrown when passing in a null argument
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   303
    private static boolean check(Runnable test) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   304
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   305
            test.run();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   306
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   307
            return false;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   308
        } catch (NullPointerException npe) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   309
            return true;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   310
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   311
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   312
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   313
    private static void nullArgumentTest() {
29243
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   314
        check(() -> Pattern.compile(null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   315
        check(() -> Pattern.matches(null, null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   316
        check(() -> Pattern.matches("xyz", null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   317
        check(() -> Pattern.quote(null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   318
        check(() -> Pattern.compile("xyz").split(null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   319
        check(() -> Pattern.compile("xyz").matcher(null));
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   320
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   321
        final Matcher m = Pattern.compile("xyz").matcher("xyz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   322
        m.matches();
29243
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   323
        check(() -> m.appendTail((StringBuffer) null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   324
        check(() -> m.appendTail((StringBuilder)null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   325
        check(() -> m.replaceAll((String) null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   326
        check(() -> m.replaceAll((Function<MatchResult, String>)null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   327
        check(() -> m.replaceFirst((String)null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   328
        check(() -> m.replaceFirst((Function<MatchResult, String>) null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   329
        check(() -> m.appendReplacement((StringBuffer)null, null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   330
        check(() -> m.appendReplacement((StringBuilder)null, null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   331
        check(() -> m.reset(null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   332
        check(() -> Matcher.quoteReplacement(null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   333
        //check(() -> m.usePattern(null));
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   334
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   335
        report("Null Argument");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   336
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   337
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   338
    // This is for bug6635133
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   339
    // Test if surrogate pair in Unicode escapes can be handled correctly.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   340
    private static void surrogatesInClassTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   341
        Pattern pattern = Pattern.compile("[\\ud834\\udd21-\\ud834\\udd24]");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   342
        Matcher matcher = pattern.matcher("\ud834\udd22");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   343
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   344
            failCount++;
11287
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   345
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   346
        report("Surrogate pair in Unicode escape");
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   347
    }
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   348
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   349
    // This is for bug6990617
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   350
    // Test if Pattern.RemoveQEQuoting works correctly if the octal unicode
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   351
    // char encoding is only 2 or 3 digits instead of 4 and the first quoted
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   352
    // char is an octal digit.
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   353
    private static void removeQEQuotingTest() throws Exception {
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   354
        Pattern pattern =
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   355
            Pattern.compile("\\011\\Q1sometext\\E\\011\\Q2sometext\\E");
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   356
        Matcher matcher = pattern.matcher("\t1sometext\t2sometext");
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   357
        if (!matcher.find())
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   358
            failCount++;
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   359
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   360
        report("Remove Q/E Quoting");
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   361
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   362
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   363
    // This is for bug 4988891
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   364
    // Test toMatchResult to see that it is a copy of the Matcher
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   365
    // that is not affected by subsequent operations on the original
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   366
    private static void toMatchResultTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   367
        Pattern pattern = Pattern.compile("squid");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   368
        Matcher matcher = pattern.matcher(
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   369
            "agiantsquidofdestinyasmallsquidoffate");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   370
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   371
        int matcherStart1 = matcher.start();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   372
        MatchResult mr = matcher.toMatchResult();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   373
        if (mr == matcher)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   374
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   375
        int resultStart1 = mr.start();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   376
        if (matcherStart1 != resultStart1)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   377
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   378
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   379
        int matcherStart2 = matcher.start();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   380
        int resultStart2 = mr.start();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   381
        if (matcherStart2 == resultStart2)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   382
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   383
        if (resultStart1 != resultStart2)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   384
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   385
        MatchResult mr2 = matcher.toMatchResult();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   386
        if (mr == mr2)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   387
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   388
        if (mr2.start() != matcherStart2)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   389
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   390
        report("toMatchResult is a copy");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   391
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   392
29503
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   393
    private static void checkExpectedISE(Runnable test) {
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   394
        try {
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   395
            test.run();
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   396
            failCount++;
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   397
        } catch (IllegalStateException x) {
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   398
        } catch (IndexOutOfBoundsException xx) {
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   399
            failCount++;
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   400
        }
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   401
    }
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   402
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   403
    private static void checkExpectedIOOE(Runnable test) {
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   404
        try {
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   405
            test.run();
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   406
            failCount++;
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   407
        } catch (IndexOutOfBoundsException x) {}
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   408
    }
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   409
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   410
    // This is for bug 8074678
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   411
    // Test the result of toMatchResult throws ISE if no match is availble
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   412
    private static void toMatchResultTest2() throws Exception {
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   413
        Matcher matcher = Pattern.compile("nomatch").matcher("hello world");
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   414
        matcher.find();
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   415
        MatchResult mr = matcher.toMatchResult();
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   416
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   417
        checkExpectedISE(() -> mr.start());
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   418
        checkExpectedISE(() -> mr.start(2));
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   419
        checkExpectedISE(() -> mr.end());
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   420
        checkExpectedISE(() -> mr.end(2));
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   421
        checkExpectedISE(() -> mr.group());
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   422
        checkExpectedISE(() -> mr.group(2));
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   423
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   424
        matcher = Pattern.compile("(match)").matcher("there is a match");
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   425
        matcher.find();
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   426
        MatchResult mr2 = matcher.toMatchResult();
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   427
        checkExpectedIOOE(() -> mr2.start(2));
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   428
        checkExpectedIOOE(() -> mr2.end(2));
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   429
        checkExpectedIOOE(() -> mr2.group(2));
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   430
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   431
        report("toMatchResult2 appropriate exceptions");
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   432
    }
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   433
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   434
    // This is for bug 5013885
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   435
    // Must test a slice to see if it reports hitEnd correctly
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   436
    private static void hitEndTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   437
        // Basic test of Slice node
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   438
        Pattern p = Pattern.compile("^squidattack");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   439
        Matcher m = p.matcher("squack");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   440
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   441
        if (m.hitEnd())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   442
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   443
        m.reset("squid");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   444
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   445
        if (!m.hitEnd())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   446
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   447
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   448
        // Test Slice, SliceA and SliceU nodes
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   449
        for (int i=0; i<3; i++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   450
            int flags = 0;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   451
            if (i==1) flags = Pattern.CASE_INSENSITIVE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   452
            if (i==2) flags = Pattern.UNICODE_CASE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   453
            p = Pattern.compile("^abc", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   454
            m = p.matcher("ad");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   455
            m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   456
            if (m.hitEnd())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   457
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   458
            m.reset("ab");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   459
            m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   460
            if (!m.hitEnd())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   461
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   462
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   463
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   464
        // Test Boyer-Moore node
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   465
        p = Pattern.compile("catattack");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   466
        m = p.matcher("attack");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   467
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   468
        if (!m.hitEnd())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   469
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   470
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   471
        p = Pattern.compile("catattack");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   472
        m = p.matcher("attackattackattackcatatta");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   473
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   474
        if (!m.hitEnd())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   475
            failCount++;
45888
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
   476
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
   477
        // 8184706: Matching u+0d at EOL against \R should hit-end
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
   478
        p = Pattern.compile("...\\R");
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
   479
        m = p.matcher("cat" + (char)0x0a);
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
   480
        m.find();
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
   481
        if (m.hitEnd())
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
   482
            failCount++;
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
   483
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
   484
        m = p.matcher("cat" + (char)0x0d);
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
   485
        m.find();
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
   486
        if (!m.hitEnd())
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
   487
            failCount++;
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
   488
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
   489
        m = p.matcher("cat" + (char)0x0d + (char)0x0a);
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
   490
        m.find();
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
   491
        if (m.hitEnd())
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
   492
            failCount++;
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
   493
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
   494
        report("hitEnd");
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   495
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   496
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   497
    // This is for bug 4997476
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   498
    // It is weird code submitted by customer demonstrating a regression
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   499
    private static void wordSearchTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   500
        String testString = new String("word1 word2 word3");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   501
        Pattern p = Pattern.compile("\\b");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   502
        Matcher m = p.matcher(testString);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   503
        int position = 0;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   504
        int start = 0;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   505
        while (m.find(position)) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   506
            start = m.start();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   507
            if (start == testString.length())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   508
                break;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   509
            if (m.find(start+1)) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   510
                position = m.start();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   511
            } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   512
                position = testString.length();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   513
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   514
            if (testString.substring(start, position).equals(" "))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   515
                continue;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   516
            if (!testString.substring(start, position-1).startsWith("word"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   517
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   518
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   519
        report("Customer word search");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   520
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   521
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   522
    // This is for bug 4994840
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   523
    private static void caretAtEndTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   524
        // Problem only occurs with multiline patterns
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   525
        // containing a beginning-of-line caret "^" followed
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   526
        // by an expression that also matches the empty string.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   527
        Pattern pattern = Pattern.compile("^x?", Pattern.MULTILINE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   528
        Matcher matcher = pattern.matcher("\r");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   529
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   530
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   531
        report("Caret at end");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   532
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   533
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   534
    // This test is for 4979006
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   535
    // Check to see if word boundary construct properly handles unicode
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   536
    // non spacing marks
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   537
    private static void unicodeWordBoundsTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   538
        String spaces = "  ";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   539
        String wordChar = "a";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   540
        String nsm = "\u030a";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   541
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   542
        assert (Character.getType('\u030a') == Character.NON_SPACING_MARK);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   543
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   544
        Pattern pattern = Pattern.compile("\\b");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   545
        Matcher matcher = pattern.matcher("");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   546
        // S=other B=word character N=non spacing mark .=word boundary
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   547
        // SS.BB.SS
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   548
        String input = spaces + wordChar + wordChar + spaces;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   549
        twoFindIndexes(input, matcher, 2, 4);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   550
        // SS.BBN.SS
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   551
        input = spaces + wordChar +wordChar + nsm + spaces;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   552
        twoFindIndexes(input, matcher, 2, 5);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   553
        // SS.BN.SS
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   554
        input = spaces + wordChar + nsm + spaces;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   555
        twoFindIndexes(input, matcher, 2, 4);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   556
        // SS.BNN.SS
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   557
        input = spaces + wordChar + nsm + nsm + spaces;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   558
        twoFindIndexes(input, matcher, 2, 5);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   559
        // SSN.BB.SS
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   560
        input = spaces + nsm + wordChar + wordChar + spaces;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   561
        twoFindIndexes(input, matcher, 3, 5);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   562
        // SS.BNB.SS
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   563
        input = spaces + wordChar + nsm + wordChar + spaces;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   564
        twoFindIndexes(input, matcher, 2, 5);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   565
        // SSNNSS
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   566
        input = spaces + nsm + nsm + spaces;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   567
        matcher.reset(input);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   568
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   569
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   570
        // SSN.BBN.SS
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   571
        input = spaces + nsm + wordChar + wordChar + nsm + spaces;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   572
        twoFindIndexes(input, matcher, 3, 6);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   573
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   574
        report("Unicode word boundary");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   575
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   576
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   577
    private static void twoFindIndexes(String input, Matcher matcher, int a,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   578
                                       int b) throws Exception
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   579
    {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   580
        matcher.reset(input);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   581
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   582
        if (matcher.start() != a)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   583
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   584
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   585
        if (matcher.start() != b)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   586
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   587
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   588
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   589
    // This test is for 6284152
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   590
    static void check(String regex, String input, String[] expected) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   591
        List<String> result = new ArrayList<String>();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   592
        Pattern p = Pattern.compile(regex);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   593
        Matcher m = p.matcher(input);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   594
        while (m.find()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   595
            result.add(m.group());
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   596
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   597
        if (!Arrays.asList(expected).equals(result))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   598
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   599
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   600
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   601
    private static void lookbehindTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   602
        //Positive
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   603
        check("(?<=%.{0,5})foo\\d",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   604
              "%foo1\n%bar foo2\n%bar  foo3\n%blahblah foo4\nfoo5",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   605
              new String[]{"foo1", "foo2", "foo3"});
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   606
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   607
        //boundary at end of the lookbehind sub-regex should work consistently
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   608
        //with the boundary just after the lookbehind sub-regex
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   609
        check("(?<=.*\\b)foo", "abcd foo", new String[]{"foo"});
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   610
        check("(?<=.*)\\bfoo", "abcd foo", new String[]{"foo"});
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   611
        check("(?<!abc )\\bfoo", "abc foo", new String[0]);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   612
        check("(?<!abc \\b)foo", "abc foo", new String[0]);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   613
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   614
        //Negative
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   615
        check("(?<!%.{0,5})foo\\d",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   616
              "%foo1\n%bar foo2\n%bar  foo3\n%blahblah foo4\nfoo5",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   617
              new String[] {"foo4", "foo5"});
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   618
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   619
        //Positive greedy
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   620
        check("(?<=%b{1,4})foo", "%bbbbfoo", new String[] {"foo"});
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   621
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   622
        //Positive reluctant
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   623
        check("(?<=%b{1,4}?)foo", "%bbbbfoo", new String[] {"foo"});
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   624
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   625
        //supplementary
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   626
        check("(?<=%b{1,4})fo\ud800\udc00o", "%bbbbfo\ud800\udc00o",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   627
              new String[] {"fo\ud800\udc00o"});
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   628
        check("(?<=%b{1,4}?)fo\ud800\udc00o", "%bbbbfo\ud800\udc00o",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   629
              new String[] {"fo\ud800\udc00o"});
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   630
        check("(?<!%b{1,4})fo\ud800\udc00o", "%afo\ud800\udc00o",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   631
              new String[] {"fo\ud800\udc00o"});
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   632
        check("(?<!%b{1,4}?)fo\ud800\udc00o", "%afo\ud800\udc00o",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   633
              new String[] {"fo\ud800\udc00o"});
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   634
        report("Lookbehind");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   635
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   636
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   637
    // This test is for 4938995
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   638
    // Check to see if weak region boundaries are transparent to
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   639
    // lookahead and lookbehind constructs
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   640
    private static void boundsTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   641
        String fullMessage = "catdogcat";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   642
        Pattern pattern = Pattern.compile("(?<=cat)dog(?=cat)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   643
        Matcher matcher = pattern.matcher("catdogca");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   644
        matcher.useTransparentBounds(true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   645
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   646
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   647
        matcher.reset("atdogcat");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   648
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   649
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   650
        matcher.reset(fullMessage);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   651
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   652
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   653
        matcher.reset(fullMessage);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   654
        matcher.region(0,9);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   655
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   656
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   657
        matcher.reset(fullMessage);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   658
        matcher.region(0,6);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   659
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   660
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   661
        matcher.reset(fullMessage);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   662
        matcher.region(3,6);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   663
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   664
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   665
        matcher.useTransparentBounds(false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   666
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   667
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   668
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   669
        // Negative lookahead/lookbehind
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   670
        pattern = Pattern.compile("(?<!cat)dog(?!cat)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   671
        matcher = pattern.matcher("dogcat");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   672
        matcher.useTransparentBounds(true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   673
        matcher.region(0,3);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   674
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   675
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   676
        matcher.reset("catdog");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   677
        matcher.region(3,6);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   678
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   679
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   680
        matcher.useTransparentBounds(false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   681
        matcher.reset("dogcat");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   682
        matcher.region(0,3);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   683
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   684
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   685
        matcher.reset("catdog");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   686
        matcher.region(3,6);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   687
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   688
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   689
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   690
        report("Region bounds transparency");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   691
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   692
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   693
    // This test is for 4945394
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   694
    private static void findFromTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   695
        String message = "This is 40 $0 message.";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   696
        Pattern pat = Pattern.compile("\\$0");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   697
        Matcher match = pat.matcher(message);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   698
        if (!match.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   699
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   700
        if (match.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   701
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   702
        if (match.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   703
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   704
        report("Check for alternating find");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   705
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   706
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   707
    // This test is for 4872664 and 4892980
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   708
    private static void negatedCharClassTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   709
        Pattern pattern = Pattern.compile("[^>]");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   710
        Matcher matcher = pattern.matcher("\u203A");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   711
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   712
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   713
        pattern = Pattern.compile("[^fr]");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   714
        matcher = pattern.matcher("a");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   715
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   716
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   717
        matcher.reset("\u203A");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   718
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   719
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   720
        String s = "for";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   721
        String result[] = s.split("[^fr]");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   722
        if (!result[0].equals("f"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   723
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   724
        if (!result[1].equals("r"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   725
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   726
        s = "f\u203Ar";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   727
        result = s.split("[^fr]");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   728
        if (!result[0].equals("f"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   729
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   730
        if (!result[1].equals("r"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   731
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   732
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   733
        // Test adding to bits, subtracting a node, then adding to bits again
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   734
        pattern = Pattern.compile("[^f\u203Ar]");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   735
        matcher = pattern.matcher("a");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   736
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   737
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   738
        matcher.reset("f");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   739
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   740
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   741
        matcher.reset("\u203A");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   742
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   743
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   744
        matcher.reset("r");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   745
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   746
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   747
        matcher.reset("\u203B");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   748
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   749
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   750
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   751
        // Test subtracting a node, adding to bits, subtracting again
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   752
        pattern = Pattern.compile("[^\u203Ar\u203B]");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   753
        matcher = pattern.matcher("a");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   754
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   755
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   756
        matcher.reset("\u203A");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   757
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   758
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   759
        matcher.reset("r");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   760
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   761
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   762
        matcher.reset("\u203B");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   763
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   764
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   765
        matcher.reset("\u203C");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   766
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   767
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   768
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   769
        report("Negated Character Class");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   770
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   771
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   772
    // This test is for 4628291
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   773
    private static void toStringTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   774
        Pattern pattern = Pattern.compile("b+");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   775
        if (pattern.toString() != "b+")
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   776
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   777
        Matcher matcher = pattern.matcher("aaabbbccc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   778
        String matcherString = matcher.toString(); // unspecified
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   779
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   780
        matcherString = matcher.toString(); // unspecified
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   781
        matcher.region(0,3);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   782
        matcherString = matcher.toString(); // unspecified
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   783
        matcher.reset();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   784
        matcherString = matcher.toString(); // unspecified
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   785
        report("toString");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   786
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   787
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   788
    // This test is for 4808962
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   789
    private static void literalPatternTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   790
        int flags = Pattern.LITERAL;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   791
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   792
        Pattern pattern = Pattern.compile("abc\\t$^", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   793
        check(pattern, "abc\\t$^", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   794
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   795
        pattern = Pattern.compile(Pattern.quote("abc\\t$^"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   796
        check(pattern, "abc\\t$^", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   797
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   798
        pattern = Pattern.compile("\\Qa^$bcabc\\E", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   799
        check(pattern, "\\Qa^$bcabc\\E", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   800
        check(pattern, "a^$bcabc", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   801
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   802
        pattern = Pattern.compile("\\\\Q\\\\E");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   803
        check(pattern, "\\Q\\E", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   804
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   805
        pattern = Pattern.compile("\\Qabc\\Eefg\\\\Q\\\\Ehij");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   806
        check(pattern, "abcefg\\Q\\Ehij", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   807
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   808
        pattern = Pattern.compile("\\\\\\Q\\\\E");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   809
        check(pattern, "\\\\\\\\", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   810
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   811
        pattern = Pattern.compile(Pattern.quote("\\Qa^$bcabc\\E"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   812
        check(pattern, "\\Qa^$bcabc\\E", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   813
        check(pattern, "a^$bcabc", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   814
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   815
        pattern = Pattern.compile(Pattern.quote("\\Qabc\\Edef"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   816
        check(pattern, "\\Qabc\\Edef", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   817
        check(pattern, "abcdef", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   818
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   819
        pattern = Pattern.compile(Pattern.quote("abc\\Edef"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   820
        check(pattern, "abc\\Edef", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   821
        check(pattern, "abcdef", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   822
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   823
        pattern = Pattern.compile(Pattern.quote("\\E"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   824
        check(pattern, "\\E", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   825
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   826
        pattern = Pattern.compile("((((abc.+?:)", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   827
        check(pattern, "((((abc.+?:)", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   828
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   829
        flags |= Pattern.MULTILINE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   830
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   831
        pattern = Pattern.compile("^cat$", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   832
        check(pattern, "abc^cat$def", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   833
        check(pattern, "cat", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   834
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   835
        flags |= Pattern.CASE_INSENSITIVE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   836
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   837
        pattern = Pattern.compile("abcdef", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   838
        check(pattern, "ABCDEF", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   839
        check(pattern, "AbCdEf", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   840
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   841
        flags |= Pattern.DOTALL;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   842
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   843
        pattern = Pattern.compile("a...b", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   844
        check(pattern, "A...b", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   845
        check(pattern, "Axxxb", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   846
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   847
        flags |= Pattern.CANON_EQ;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   848
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   849
        Pattern p = Pattern.compile("testa\u030a", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   850
        check(pattern, "testa\u030a", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   851
        check(pattern, "test\u00e5", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   852
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   853
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   854
        flags = Pattern.LITERAL;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   855
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   856
        pattern = Pattern.compile(toSupplementaries("abc\\t$^"), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   857
        check(pattern, toSupplementaries("abc\\t$^"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   858
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   859
        pattern = Pattern.compile(Pattern.quote(toSupplementaries("abc\\t$^")));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   860
        check(pattern, toSupplementaries("abc\\t$^"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   861
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   862
        pattern = Pattern.compile(toSupplementaries("\\Qa^$bcabc\\E"), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   863
        check(pattern, toSupplementaries("\\Qa^$bcabc\\E"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   864
        check(pattern, toSupplementaries("a^$bcabc"), false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   865
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   866
        pattern = Pattern.compile(Pattern.quote(toSupplementaries("\\Qa^$bcabc\\E")));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   867
        check(pattern, toSupplementaries("\\Qa^$bcabc\\E"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   868
        check(pattern, toSupplementaries("a^$bcabc"), false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   869
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   870
        pattern = Pattern.compile(Pattern.quote(toSupplementaries("\\Qabc\\Edef")));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   871
        check(pattern, toSupplementaries("\\Qabc\\Edef"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   872
        check(pattern, toSupplementaries("abcdef"), false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   873
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   874
        pattern = Pattern.compile(Pattern.quote(toSupplementaries("abc\\Edef")));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   875
        check(pattern, toSupplementaries("abc\\Edef"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   876
        check(pattern, toSupplementaries("abcdef"), false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   877
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   878
        pattern = Pattern.compile(toSupplementaries("((((abc.+?:)"), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   879
        check(pattern, toSupplementaries("((((abc.+?:)"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   880
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   881
        flags |= Pattern.MULTILINE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   882
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   883
        pattern = Pattern.compile(toSupplementaries("^cat$"), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   884
        check(pattern, toSupplementaries("abc^cat$def"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   885
        check(pattern, toSupplementaries("cat"), false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   886
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   887
        flags |= Pattern.DOTALL;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   888
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   889
        // note: this is case-sensitive.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   890
        pattern = Pattern.compile(toSupplementaries("a...b"), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   891
        check(pattern, toSupplementaries("a...b"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   892
        check(pattern, toSupplementaries("axxxb"), false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   893
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   894
        flags |= Pattern.CANON_EQ;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   895
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   896
        String t = toSupplementaries("test");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   897
        p = Pattern.compile(t + "a\u030a", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   898
        check(pattern, t + "a\u030a", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   899
        check(pattern, t + "\u00e5", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   900
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   901
        report("Literal pattern");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   902
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   903
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   904
    // This test is for 4803179
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   905
    // This test is also for 4808962, replacement parts
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   906
    private static void literalReplacementTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   907
        int flags = Pattern.LITERAL;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   908
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   909
        Pattern pattern = Pattern.compile("abc", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   910
        Matcher matcher = pattern.matcher("zzzabczzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   911
        String replaceTest = "$0";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   912
        String result = matcher.replaceAll(replaceTest);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   913
        if (!result.equals("zzzabczzz"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   914
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   915
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   916
        matcher.reset();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   917
        String literalReplacement = matcher.quoteReplacement(replaceTest);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   918
        result = matcher.replaceAll(literalReplacement);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   919
        if (!result.equals("zzz$0zzz"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   920
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   921
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   922
        matcher.reset();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   923
        replaceTest = "\\t$\\$";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   924
        literalReplacement = matcher.quoteReplacement(replaceTest);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   925
        result = matcher.replaceAll(literalReplacement);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   926
        if (!result.equals("zzz\\t$\\$zzz"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   927
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   928
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   929
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   930
        pattern = Pattern.compile(toSupplementaries("abc"), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   931
        matcher = pattern.matcher(toSupplementaries("zzzabczzz"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   932
        replaceTest = "$0";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   933
        result = matcher.replaceAll(replaceTest);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   934
        if (!result.equals(toSupplementaries("zzzabczzz")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   935
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   936
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   937
        matcher.reset();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   938
        literalReplacement = matcher.quoteReplacement(replaceTest);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   939
        result = matcher.replaceAll(literalReplacement);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   940
        if (!result.equals(toSupplementaries("zzz$0zzz")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   941
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   942
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   943
        matcher.reset();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   944
        replaceTest = "\\t$\\$";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   945
        literalReplacement = matcher.quoteReplacement(replaceTest);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   946
        result = matcher.replaceAll(literalReplacement);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   947
        if (!result.equals(toSupplementaries("zzz\\t$\\$zzz")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   948
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   949
12432
748fcaa0e0c1 7067045: replaceAll("\u20ac", "$"); causses java.lang.StringIndexOutOfBoundsExceptio
sherman
parents: 11287
diff changeset
   950
        // IAE should be thrown if backslash or '$' is the last character
748fcaa0e0c1 7067045: replaceAll("\u20ac", "$"); causses java.lang.StringIndexOutOfBoundsExceptio
sherman
parents: 11287
diff changeset
   951
        // in replacement string
748fcaa0e0c1 7067045: replaceAll("\u20ac", "$"); causses java.lang.StringIndexOutOfBoundsExceptio
sherman
parents: 11287
diff changeset
   952
        try {
748fcaa0e0c1 7067045: replaceAll("\u20ac", "$"); causses java.lang.StringIndexOutOfBoundsExceptio
sherman
parents: 11287
diff changeset
   953
            "\uac00".replaceAll("\uac00", "$");
12675
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
   954
            failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
   955
        } catch (IllegalArgumentException iie) {
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
   956
        } catch (Exception e) {
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
   957
            failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
   958
        }
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
   959
        try {
12432
748fcaa0e0c1 7067045: replaceAll("\u20ac", "$"); causses java.lang.StringIndexOutOfBoundsExceptio
sherman
parents: 11287
diff changeset
   960
            "\uac00".replaceAll("\uac00", "\\");
748fcaa0e0c1 7067045: replaceAll("\u20ac", "$"); causses java.lang.StringIndexOutOfBoundsExceptio
sherman
parents: 11287
diff changeset
   961
            failCount++;
748fcaa0e0c1 7067045: replaceAll("\u20ac", "$"); causses java.lang.StringIndexOutOfBoundsExceptio
sherman
parents: 11287
diff changeset
   962
        } catch (IllegalArgumentException iie) {
748fcaa0e0c1 7067045: replaceAll("\u20ac", "$"); causses java.lang.StringIndexOutOfBoundsExceptio
sherman
parents: 11287
diff changeset
   963
        } catch (Exception e) {
748fcaa0e0c1 7067045: replaceAll("\u20ac", "$"); causses java.lang.StringIndexOutOfBoundsExceptio
sherman
parents: 11287
diff changeset
   964
            failCount++;
748fcaa0e0c1 7067045: replaceAll("\u20ac", "$"); causses java.lang.StringIndexOutOfBoundsExceptio
sherman
parents: 11287
diff changeset
   965
        }
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   966
        report("Literal replacement");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   967
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   968
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   969
    // This test is for 4757029
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   970
    private static void regionTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   971
        Pattern pattern = Pattern.compile("abc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   972
        Matcher matcher = pattern.matcher("abcdefabc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   973
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   974
        matcher.region(0,9);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   975
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   976
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   977
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   978
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   979
        matcher.region(0,3);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   980
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   981
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   982
        matcher.region(3,6);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   983
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   984
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   985
        matcher.region(0,2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   986
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   987
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   988
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   989
        expectRegionFail(matcher, 1, -1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   990
        expectRegionFail(matcher, -1, -1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   991
        expectRegionFail(matcher, -1, 1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   992
        expectRegionFail(matcher, 5, 3);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   993
        expectRegionFail(matcher, 5, 12);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   994
        expectRegionFail(matcher, 12, 12);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   995
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   996
        pattern = Pattern.compile("^abc$");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   997
        matcher = pattern.matcher("zzzabczzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   998
        matcher.region(0,9);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   999
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1000
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1001
        matcher.region(3,6);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1002
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1003
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1004
        matcher.region(3,6);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1005
        matcher.useAnchoringBounds(false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1006
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1007
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1008
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1009
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1010
        pattern = Pattern.compile(toSupplementaries("abc"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1011
        matcher = pattern.matcher(toSupplementaries("abcdefabc"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1012
        matcher.region(0,9*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1013
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1014
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1015
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1016
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1017
        matcher.region(0,3*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1018
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1019
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1020
        matcher.region(1,3*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1021
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1022
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1023
        matcher.region(3*2,6*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1024
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1025
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1026
        matcher.region(0,2*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1027
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1028
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1029
        matcher.region(0,2*2+1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1030
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1031
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1032
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1033
        expectRegionFail(matcher, 1*2, -1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1034
        expectRegionFail(matcher, -1, -1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1035
        expectRegionFail(matcher, -1, 1*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1036
        expectRegionFail(matcher, 5*2, 3*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1037
        expectRegionFail(matcher, 5*2, 12*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1038
        expectRegionFail(matcher, 12*2, 12*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1039
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1040
        pattern = Pattern.compile(toSupplementaries("^abc$"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1041
        matcher = pattern.matcher(toSupplementaries("zzzabczzz"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1042
        matcher.region(0,9*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1043
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1044
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1045
        matcher.region(3*2,6*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1046
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1047
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1048
        matcher.region(3*2+1,6*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1049
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1050
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1051
        matcher.region(3*2,6*2-1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1052
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1053
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1054
        matcher.region(3*2,6*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1055
        matcher.useAnchoringBounds(false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1056
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1057
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1058
        report("Regions");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1059
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1060
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1061
    private static void expectRegionFail(Matcher matcher, int index1,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1062
                                         int index2)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1063
    {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1064
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1065
            matcher.region(index1, index2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1066
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1067
        } catch (IndexOutOfBoundsException ioobe) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1068
            // Correct result
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1069
        } catch (IllegalStateException ise) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1070
            // Correct result
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1071
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1072
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1073
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1074
    // This test is for 4803197
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1075
    private static void escapedSegmentTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1076
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1077
        Pattern pattern = Pattern.compile("\\Qdir1\\dir2\\E");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1078
        check(pattern, "dir1\\dir2", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1079
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1080
        pattern = Pattern.compile("\\Qdir1\\dir2\\\\E");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1081
        check(pattern, "dir1\\dir2\\", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1082
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1083
        pattern = Pattern.compile("(\\Qdir1\\dir2\\\\E)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1084
        check(pattern, "dir1\\dir2\\", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1085
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1086
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1087
        pattern = Pattern.compile(toSupplementaries("\\Qdir1\\dir2\\E"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1088
        check(pattern, toSupplementaries("dir1\\dir2"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1089
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1090
        pattern = Pattern.compile(toSupplementaries("\\Qdir1\\dir2")+"\\\\E");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1091
        check(pattern, toSupplementaries("dir1\\dir2\\"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1092
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1093
        pattern = Pattern.compile(toSupplementaries("(\\Qdir1\\dir2")+"\\\\E)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1094
        check(pattern, toSupplementaries("dir1\\dir2\\"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1095
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1096
        report("Escaped segment");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1097
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1098
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1099
    // This test is for 4792284
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1100
    private static void nonCaptureRepetitionTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1101
        String input = "abcdefgh;";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1102
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1103
        String[] patterns = new String[] {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1104
            "(?:\\w{4})+;",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1105
            "(?:\\w{8})*;",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1106
            "(?:\\w{2}){2,4};",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1107
            "(?:\\w{4}){2,};",   // only matches the
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1108
            ".*?(?:\\w{5})+;",   //     specified minimum
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1109
            ".*?(?:\\w{9})*;",   //     number of reps - OK
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1110
            "(?:\\w{4})+?;",     // lazy repetition - OK
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1111
            "(?:\\w{4})++;",     // possessive repetition - OK
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1112
            "(?:\\w{2,}?)+;",    // non-deterministic - OK
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1113
            "(\\w{4})+;",        // capturing group - OK
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1114
        };
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1115
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1116
        for (int i = 0; i < patterns.length; i++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1117
            // Check find()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1118
            check(patterns[i], 0, input, input, true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1119
            // Check matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1120
            Pattern p = Pattern.compile(patterns[i]);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1121
            Matcher m = p.matcher(input);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1122
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1123
            if (m.matches()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1124
                if (!m.group(0).equals(input))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1125
                    failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1126
            } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1127
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1128
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1129
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1130
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1131
        report("Non capturing repetition");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1132
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1133
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1134
    // This test is for 6358731
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1135
    private static void notCapturedGroupCurlyMatchTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1136
        Pattern pattern = Pattern.compile("(abc)+|(abcd)+");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1137
        Matcher matcher = pattern.matcher("abcd");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1138
        if (!matcher.matches() ||
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1139
             matcher.group(1) != null ||
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1140
             !matcher.group(2).equals("abcd")) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1141
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1142
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1143
        report("Not captured GroupCurly");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1144
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1145
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1146
    // This test is for 4706545
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1147
    private static void javaCharClassTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1148
        for (int i=0; i<1000; i++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1149
            char c = (char)generator.nextInt();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1150
            check("{javaLowerCase}", c, Character.isLowerCase(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1151
            check("{javaUpperCase}", c, Character.isUpperCase(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1152
            check("{javaUpperCase}+", c, Character.isUpperCase(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1153
            check("{javaTitleCase}", c, Character.isTitleCase(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1154
            check("{javaDigit}", c, Character.isDigit(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1155
            check("{javaDefined}", c, Character.isDefined(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1156
            check("{javaLetter}", c, Character.isLetter(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1157
            check("{javaLetterOrDigit}", c, Character.isLetterOrDigit(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1158
            check("{javaJavaIdentifierStart}", c,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1159
                  Character.isJavaIdentifierStart(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1160
            check("{javaJavaIdentifierPart}", c,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1161
                  Character.isJavaIdentifierPart(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1162
            check("{javaUnicodeIdentifierStart}", c,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1163
                  Character.isUnicodeIdentifierStart(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1164
            check("{javaUnicodeIdentifierPart}", c,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1165
                  Character.isUnicodeIdentifierPart(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1166
            check("{javaIdentifierIgnorable}", c,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1167
                  Character.isIdentifierIgnorable(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1168
            check("{javaSpaceChar}", c, Character.isSpaceChar(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1169
            check("{javaWhitespace}", c, Character.isWhitespace(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1170
            check("{javaISOControl}", c, Character.isISOControl(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1171
            check("{javaMirrored}", c, Character.isMirrored(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1172
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1173
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1174
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1175
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1176
        for (int i=0; i<1000; i++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1177
            int c = generator.nextInt(Character.MAX_CODE_POINT
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1178
                                      - Character.MIN_SUPPLEMENTARY_CODE_POINT)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1179
                        + Character.MIN_SUPPLEMENTARY_CODE_POINT;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1180
            check("{javaLowerCase}", c, Character.isLowerCase(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1181
            check("{javaUpperCase}", c, Character.isUpperCase(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1182
            check("{javaUpperCase}+", c, Character.isUpperCase(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1183
            check("{javaTitleCase}", c, Character.isTitleCase(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1184
            check("{javaDigit}", c, Character.isDigit(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1185
            check("{javaDefined}", c, Character.isDefined(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1186
            check("{javaLetter}", c, Character.isLetter(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1187
            check("{javaLetterOrDigit}", c, Character.isLetterOrDigit(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1188
            check("{javaJavaIdentifierStart}", c,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1189
                  Character.isJavaIdentifierStart(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1190
            check("{javaJavaIdentifierPart}", c,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1191
                  Character.isJavaIdentifierPart(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1192
            check("{javaUnicodeIdentifierStart}", c,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1193
                  Character.isUnicodeIdentifierStart(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1194
            check("{javaUnicodeIdentifierPart}", c,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1195
                  Character.isUnicodeIdentifierPart(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1196
            check("{javaIdentifierIgnorable}", c,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1197
                  Character.isIdentifierIgnorable(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1198
            check("{javaSpaceChar}", c, Character.isSpaceChar(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1199
            check("{javaWhitespace}", c, Character.isWhitespace(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1200
            check("{javaISOControl}", c, Character.isISOControl(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1201
            check("{javaMirrored}", c, Character.isMirrored(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1202
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1203
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1204
        report("Java character classes");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1205
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1206
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1207
    // This test is for 4523620
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1208
    /*
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1209
    private static void numOccurrencesTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1210
        Pattern pattern = Pattern.compile("aaa");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1211
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1212
        if (pattern.numOccurrences("aaaaaa", false) != 2)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1213
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1214
        if (pattern.numOccurrences("aaaaaa", true) != 4)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1215
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1216
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1217
        pattern = Pattern.compile("^");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1218
        if (pattern.numOccurrences("aaaaaa", false) != 1)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1219
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1220
        if (pattern.numOccurrences("aaaaaa", true) != 1)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1221
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1222
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1223
        report("Number of Occurrences");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1224
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1225
    */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1226
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1227
    // This test is for 4776374
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1228
    private static void caretBetweenTerminatorsTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1229
        int flags1 = Pattern.DOTALL;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1230
        int flags2 = Pattern.DOTALL | Pattern.UNIX_LINES;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1231
        int flags3 = Pattern.DOTALL | Pattern.UNIX_LINES | Pattern.MULTILINE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1232
        int flags4 = Pattern.DOTALL | Pattern.MULTILINE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1233
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1234
        check("^....", flags1, "test\ntest", "test", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1235
        check(".....^", flags1, "test\ntest", "test", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1236
        check(".....^", flags1, "test\n", "test", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1237
        check("....^", flags1, "test\r\n", "test", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1238
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1239
        check("^....", flags2, "test\ntest", "test", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1240
        check("....^", flags2, "test\ntest", "test", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1241
        check(".....^", flags2, "test\n", "test", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1242
        check("....^", flags2, "test\r\n", "test", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1243
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1244
        check("^....", flags3, "test\ntest", "test", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1245
        check(".....^", flags3, "test\ntest", "test\n", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1246
        check(".....^", flags3, "test\u0085test", "test\u0085", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1247
        check(".....^", flags3, "test\n", "test", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1248
        check(".....^", flags3, "test\r\n", "test", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1249
        check("......^", flags3, "test\r\ntest", "test\r\n", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1250
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1251
        check("^....", flags4, "test\ntest", "test", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1252
        check(".....^", flags3, "test\ntest", "test\n", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1253
        check(".....^", flags4, "test\u0085test", "test\u0085", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1254
        check(".....^", flags4, "test\n", "test\n", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1255
        check(".....^", flags4, "test\r\n", "test\r", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1256
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1257
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1258
        String t = toSupplementaries("test");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1259
        check("^....", flags1, t+"\n"+t, t, true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1260
        check(".....^", flags1, t+"\n"+t, t, false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1261
        check(".....^", flags1, t+"\n", t, false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1262
        check("....^", flags1, t+"\r\n", t, false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1263
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1264
        check("^....", flags2, t+"\n"+t, t, true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1265
        check("....^", flags2, t+"\n"+t, t, false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1266
        check(".....^", flags2, t+"\n", t, false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1267
        check("....^", flags2, t+"\r\n", t, false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1268
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1269
        check("^....", flags3, t+"\n"+t, t, true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1270
        check(".....^", flags3, t+"\n"+t, t+"\n", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1271
        check(".....^", flags3, t+"\u0085"+t, t+"\u0085", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1272
        check(".....^", flags3, t+"\n", t, false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1273
        check(".....^", flags3, t+"\r\n", t, false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1274
        check("......^", flags3, t+"\r\n"+t, t+"\r\n", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1275
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1276
        check("^....", flags4, t+"\n"+t, t, true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1277
        check(".....^", flags3, t+"\n"+t, t+"\n", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1278
        check(".....^", flags4, t+"\u0085"+t, t+"\u0085", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1279
        check(".....^", flags4, t+"\n", t+"\n", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1280
        check(".....^", flags4, t+"\r\n", t+"\r", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1281
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1282
        report("Caret between terminators");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1283
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1284
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1285
    // This test is for 4727935
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1286
    private static void dollarAtEndTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1287
        int flags1 = Pattern.DOTALL;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1288
        int flags2 = Pattern.DOTALL | Pattern.UNIX_LINES;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1289
        int flags3 = Pattern.DOTALL | Pattern.MULTILINE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1290
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1291
        check("....$", flags1, "test\n", "test", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1292
        check("....$", flags1, "test\r\n", "test", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1293
        check(".....$", flags1, "test\n", "test\n", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1294
        check(".....$", flags1, "test\u0085", "test\u0085", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1295
        check("....$", flags1, "test\u0085", "test", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1296
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1297
        check("....$", flags2, "test\n", "test", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1298
        check(".....$", flags2, "test\n", "test\n", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1299
        check(".....$", flags2, "test\u0085", "test\u0085", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1300
        check("....$", flags2, "test\u0085", "est\u0085", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1301
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1302
        check("....$.blah", flags3, "test\nblah", "test\nblah", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1303
        check(".....$.blah", flags3, "test\n\nblah", "test\n\nblah", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1304
        check("....$blah", flags3, "test\nblah", "!!!!", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1305
        check(".....$blah", flags3, "test\nblah", "!!!!", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1306
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1307
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1308
        String t = toSupplementaries("test");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1309
        String b = toSupplementaries("blah");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1310
        check("....$", flags1, t+"\n", t, true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1311
        check("....$", flags1, t+"\r\n", t, true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1312
        check(".....$", flags1, t+"\n", t+"\n", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1313
        check(".....$", flags1, t+"\u0085", t+"\u0085", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1314
        check("....$", flags1, t+"\u0085", t, true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1315
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1316
        check("....$", flags2, t+"\n", t, true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1317
        check(".....$", flags2, t+"\n", t+"\n", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1318
        check(".....$", flags2, t+"\u0085", t+"\u0085", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1319
        check("....$", flags2, t+"\u0085", toSupplementaries("est\u0085"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1320
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1321
        check("....$."+b, flags3, t+"\n"+b, t+"\n"+b, true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1322
        check(".....$."+b, flags3, t+"\n\n"+b, t+"\n\n"+b, true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1323
        check("....$"+b, flags3, t+"\n"+b, "!!!!", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1324
        check(".....$"+b, flags3, t+"\n"+b, "!!!!", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1325
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1326
        report("Dollar at End");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1327
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1328
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1329
    // This test is for 4711773
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1330
    private static void multilineDollarTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1331
        Pattern findCR = Pattern.compile("$", Pattern.MULTILINE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1332
        Matcher matcher = findCR.matcher("first bit\nsecond bit");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1333
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1334
        if (matcher.start(0) != 9)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1335
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1336
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1337
        if (matcher.start(0) != 20)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1338
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1339
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1340
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1341
        matcher = findCR.matcher(toSupplementaries("first  bit\n second  bit")); // double BMP chars
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1342
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1343
        if (matcher.start(0) != 9*2)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1344
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1345
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1346
        if (matcher.start(0) != 20*2)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1347
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1348
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1349
        report("Multiline Dollar");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1350
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1351
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1352
    private static void reluctantRepetitionTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1353
        Pattern p = Pattern.compile("1(\\s\\S+?){1,3}?[\\s,]2");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1354
        check(p, "1 word word word 2", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1355
        check(p, "1 wor wo w 2", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1356
        check(p, "1 word word 2", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1357
        check(p, "1 word 2", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1358
        check(p, "1 wo w w 2", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1359
        check(p, "1 wo w 2", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1360
        check(p, "1 wor w 2", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1361
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1362
        p = Pattern.compile("([a-z])+?c");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1363
        Matcher m = p.matcher("ababcdefdec");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1364
        check(m, "ababc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1365
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1366
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1367
        p = Pattern.compile(toSupplementaries("([a-z])+?c"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1368
        m = p.matcher(toSupplementaries("ababcdefdec"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1369
        check(m, toSupplementaries("ababc"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1370
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1371
        report("Reluctant Repetition");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1372
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1373
48491
7f11a1699ef6 8194667: Regex: Serialization doesn't work with match flags
sherman
parents: 47216
diff changeset
  1374
    private static Pattern serializedPattern(Pattern p) throws Exception {
7f11a1699ef6 8194667: Regex: Serialization doesn't work with match flags
sherman
parents: 47216
diff changeset
  1375
        ByteArrayOutputStream baos = new ByteArrayOutputStream();
7f11a1699ef6 8194667: Regex: Serialization doesn't work with match flags
sherman
parents: 47216
diff changeset
  1376
        ObjectOutputStream oos = new ObjectOutputStream(baos);
7f11a1699ef6 8194667: Regex: Serialization doesn't work with match flags
sherman
parents: 47216
diff changeset
  1377
        oos.writeObject(p);
7f11a1699ef6 8194667: Regex: Serialization doesn't work with match flags
sherman
parents: 47216
diff changeset
  1378
        oos.close();
7f11a1699ef6 8194667: Regex: Serialization doesn't work with match flags
sherman
parents: 47216
diff changeset
  1379
        try (ObjectInputStream ois = new ObjectInputStream(
7f11a1699ef6 8194667: Regex: Serialization doesn't work with match flags
sherman
parents: 47216
diff changeset
  1380
                new ByteArrayInputStream(baos.toByteArray()))) {
7f11a1699ef6 8194667: Regex: Serialization doesn't work with match flags
sherman
parents: 47216
diff changeset
  1381
            return (Pattern)ois.readObject();
7f11a1699ef6 8194667: Regex: Serialization doesn't work with match flags
sherman
parents: 47216
diff changeset
  1382
        }
7f11a1699ef6 8194667: Regex: Serialization doesn't work with match flags
sherman
parents: 47216
diff changeset
  1383
    }
7f11a1699ef6 8194667: Regex: Serialization doesn't work with match flags
sherman
parents: 47216
diff changeset
  1384
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1385
    private static void serializeTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1386
        String patternStr = "(b)";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1387
        String matchStr = "b";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1388
        Pattern pattern = Pattern.compile(patternStr);
48491
7f11a1699ef6 8194667: Regex: Serialization doesn't work with match flags
sherman
parents: 47216
diff changeset
  1389
        Pattern serializedPattern = serializedPattern(pattern);
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1390
        Matcher matcher = serializedPattern.matcher(matchStr);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1391
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1392
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1393
        if (matcher.groupCount() != 1)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1394
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1395
48491
7f11a1699ef6 8194667: Regex: Serialization doesn't work with match flags
sherman
parents: 47216
diff changeset
  1396
        pattern = Pattern.compile("a(?-i)b", Pattern.CASE_INSENSITIVE);
7f11a1699ef6 8194667: Regex: Serialization doesn't work with match flags
sherman
parents: 47216
diff changeset
  1397
        serializedPattern = serializedPattern(pattern);
7f11a1699ef6 8194667: Regex: Serialization doesn't work with match flags
sherman
parents: 47216
diff changeset
  1398
        if (!serializedPattern.matcher("Ab").matches())
7f11a1699ef6 8194667: Regex: Serialization doesn't work with match flags
sherman
parents: 47216
diff changeset
  1399
            failCount++;
7f11a1699ef6 8194667: Regex: Serialization doesn't work with match flags
sherman
parents: 47216
diff changeset
  1400
        if (serializedPattern.matcher("AB").matches())
7f11a1699ef6 8194667: Regex: Serialization doesn't work with match flags
sherman
parents: 47216
diff changeset
  1401
            failCount++;
7f11a1699ef6 8194667: Regex: Serialization doesn't work with match flags
sherman
parents: 47216
diff changeset
  1402
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1403
        report("Serialization");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1404
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1405
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1406
    private static void gTest() {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1407
        Pattern pattern = Pattern.compile("\\G\\w");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1408
        Matcher matcher = pattern.matcher("abc#x#x");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1409
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1410
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1411
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1412
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1413
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1414
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1415
        pattern = Pattern.compile("\\GA*");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1416
        matcher = pattern.matcher("1A2AA3");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1417
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1418
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1419
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1420
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1421
        pattern = Pattern.compile("\\GA*");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1422
        matcher = pattern.matcher("1A2AA3");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1423
        if (!matcher.find(1))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1424
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1425
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1426
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1427
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1428
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1429
        report("\\G");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1430
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1431
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1432
    private static void zTest() {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1433
        Pattern pattern = Pattern.compile("foo\\Z");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1434
        // Positives
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1435
        check(pattern, "foo\u0085", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1436
        check(pattern, "foo\u2028", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1437
        check(pattern, "foo\u2029", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1438
        check(pattern, "foo\n", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1439
        check(pattern, "foo\r", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1440
        check(pattern, "foo\r\n", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1441
        // Negatives
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1442
        check(pattern, "fooo", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1443
        check(pattern, "foo\n\r", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1444
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1445
        pattern = Pattern.compile("foo\\Z", Pattern.UNIX_LINES);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1446
        // Positives
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1447
        check(pattern, "foo", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1448
        check(pattern, "foo\n", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1449
        // Negatives
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1450
        check(pattern, "foo\r", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1451
        check(pattern, "foo\u0085", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1452
        check(pattern, "foo\u2028", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1453
        check(pattern, "foo\u2029", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1454
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1455
        report("\\Z");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1456
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1457
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1458
    private static void replaceFirstTest() {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1459
        Pattern pattern = Pattern.compile("(ab)(c*)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1460
        Matcher matcher = pattern.matcher("abccczzzabcczzzabccc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1461
        if (!matcher.replaceFirst("test").equals("testzzzabcczzzabccc"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1462
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1463
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1464
        matcher.reset("zzzabccczzzabcczzzabccczzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1465
        if (!matcher.replaceFirst("test").equals("zzztestzzzabcczzzabccczzz"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1466
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1467
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1468
        matcher.reset("zzzabccczzzabcczzzabccczzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1469
        String result = matcher.replaceFirst("$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1470
        if (!result.equals("zzzabzzzabcczzzabccczzz"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1471
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1472
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1473
        matcher.reset("zzzabccczzzabcczzzabccczzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1474
        result = matcher.replaceFirst("$2");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1475
        if (!result.equals("zzzccczzzabcczzzabccczzz"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1476
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1477
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1478
        pattern = Pattern.compile("a*");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1479
        matcher = pattern.matcher("aaaaaaaaaa");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1480
        if (!matcher.replaceFirst("test").equals("test"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1481
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1482
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1483
        pattern = Pattern.compile("a+");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1484
        matcher = pattern.matcher("zzzaaaaaaaaaa");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1485
        if (!matcher.replaceFirst("test").equals("zzztest"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1486
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1487
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1488
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1489
        pattern = Pattern.compile(toSupplementaries("(ab)(c*)"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1490
        matcher = pattern.matcher(toSupplementaries("abccczzzabcczzzabccc"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1491
        if (!matcher.replaceFirst(toSupplementaries("test"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1492
                .equals(toSupplementaries("testzzzabcczzzabccc")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1493
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1494
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1495
        matcher.reset(toSupplementaries("zzzabccczzzabcczzzabccczzz"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1496
        if (!matcher.replaceFirst(toSupplementaries("test")).
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1497
            equals(toSupplementaries("zzztestzzzabcczzzabccczzz")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1498
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1499
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1500
        matcher.reset(toSupplementaries("zzzabccczzzabcczzzabccczzz"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1501
        result = matcher.replaceFirst("$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1502
        if (!result.equals(toSupplementaries("zzzabzzzabcczzzabccczzz")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1503
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1504
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1505
        matcher.reset(toSupplementaries("zzzabccczzzabcczzzabccczzz"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1506
        result = matcher.replaceFirst("$2");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1507
        if (!result.equals(toSupplementaries("zzzccczzzabcczzzabccczzz")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1508
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1509
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1510
        pattern = Pattern.compile(toSupplementaries("a*"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1511
        matcher = pattern.matcher(toSupplementaries("aaaaaaaaaa"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1512
        if (!matcher.replaceFirst(toSupplementaries("test")).equals(toSupplementaries("test")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1513
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1514
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1515
        pattern = Pattern.compile(toSupplementaries("a+"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1516
        matcher = pattern.matcher(toSupplementaries("zzzaaaaaaaaaa"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1517
        if (!matcher.replaceFirst(toSupplementaries("test")).equals(toSupplementaries("zzztest")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1518
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1519
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1520
        report("Replace First");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1521
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1522
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1523
    private static void unixLinesTest() {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1524
        Pattern pattern = Pattern.compile(".*");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1525
        Matcher matcher = pattern.matcher("aa\u2028blah");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1526
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1527
        if (!matcher.group(0).equals("aa"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1528
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1529
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1530
        pattern = Pattern.compile(".*", Pattern.UNIX_LINES);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1531
        matcher = pattern.matcher("aa\u2028blah");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1532
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1533
        if (!matcher.group(0).equals("aa\u2028blah"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1534
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1535
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1536
        pattern = Pattern.compile("[az]$",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1537
                                  Pattern.MULTILINE | Pattern.UNIX_LINES);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1538
        matcher = pattern.matcher("aa\u2028zz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1539
        check(matcher, "a\u2028", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1540
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1541
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1542
        pattern = Pattern.compile(".*");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1543
        matcher = pattern.matcher(toSupplementaries("aa\u2028blah"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1544
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1545
        if (!matcher.group(0).equals(toSupplementaries("aa")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1546
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1547
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1548
        pattern = Pattern.compile(".*", Pattern.UNIX_LINES);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1549
        matcher = pattern.matcher(toSupplementaries("aa\u2028blah"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1550
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1551
        if (!matcher.group(0).equals(toSupplementaries("aa\u2028blah")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1552
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1553
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1554
        pattern = Pattern.compile(toSupplementaries("[az]$"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1555
                                  Pattern.MULTILINE | Pattern.UNIX_LINES);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1556
        matcher = pattern.matcher(toSupplementaries("aa\u2028zz"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1557
        check(matcher, toSupplementaries("a\u2028"), false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1558
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1559
        report("Unix Lines");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1560
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1561
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1562
    private static void commentsTest() {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1563
        int flags = Pattern.COMMENTS;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1564
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1565
        Pattern pattern = Pattern.compile("aa \\# aa", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1566
        Matcher matcher = pattern.matcher("aa#aa");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1567
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1568
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1569
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1570
        pattern = Pattern.compile("aa  # blah", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1571
        matcher = pattern.matcher("aa");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1572
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1573
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1574
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1575
        pattern = Pattern.compile("aa blah", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1576
        matcher = pattern.matcher("aablah");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1577
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1578
             failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1579
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1580
        pattern = Pattern.compile("aa  # blah blech  ", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1581
        matcher = pattern.matcher("aa");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1582
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1583
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1584
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1585
        pattern = Pattern.compile("aa  # blah\n  ", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1586
        matcher = pattern.matcher("aa");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1587
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1588
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1589
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1590
        pattern = Pattern.compile("aa  # blah\nbc # blech", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1591
        matcher = pattern.matcher("aabc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1592
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1593
             failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1594
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1595
        pattern = Pattern.compile("aa  # blah\nbc# blech", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1596
        matcher = pattern.matcher("aabc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1597
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1598
             failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1599
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1600
        pattern = Pattern.compile("aa  # blah\nbc\\# blech", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1601
        matcher = pattern.matcher("aabc#blech");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1602
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1603
             failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1604
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1605
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1606
        pattern = Pattern.compile(toSupplementaries("aa \\# aa"), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1607
        matcher = pattern.matcher(toSupplementaries("aa#aa"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1608
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1609
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1610
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1611
        pattern = Pattern.compile(toSupplementaries("aa  # blah"), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1612
        matcher = pattern.matcher(toSupplementaries("aa"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1613
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1614
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1615
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1616
        pattern = Pattern.compile(toSupplementaries("aa blah"), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1617
        matcher = pattern.matcher(toSupplementaries("aablah"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1618
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1619
             failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1620
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1621
        pattern = Pattern.compile(toSupplementaries("aa  # blah blech  "), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1622
        matcher = pattern.matcher(toSupplementaries("aa"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1623
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1624
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1625
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1626
        pattern = Pattern.compile(toSupplementaries("aa  # blah\n  "), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1627
        matcher = pattern.matcher(toSupplementaries("aa"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1628
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1629
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1630
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1631
        pattern = Pattern.compile(toSupplementaries("aa  # blah\nbc # blech"), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1632
        matcher = pattern.matcher(toSupplementaries("aabc"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1633
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1634
             failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1635
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1636
        pattern = Pattern.compile(toSupplementaries("aa  # blah\nbc# blech"), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1637
        matcher = pattern.matcher(toSupplementaries("aabc"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1638
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1639
             failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1640
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1641
        pattern = Pattern.compile(toSupplementaries("aa  # blah\nbc\\# blech"), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1642
        matcher = pattern.matcher(toSupplementaries("aabc#blech"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1643
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1644
             failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1645
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1646
        report("Comments");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1647
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1648
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1649
    private static void caseFoldingTest() { // bug 4504687
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1650
        int flags = Pattern.CASE_INSENSITIVE | Pattern.UNICODE_CASE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1651
        Pattern pattern = Pattern.compile("aa", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1652
        Matcher matcher = pattern.matcher("ab");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1653
        if (matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1654
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1655
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1656
        pattern = Pattern.compile("aA", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1657
        matcher = pattern.matcher("ab");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1658
        if (matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1659
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1660
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1661
        pattern = Pattern.compile("aa", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1662
        matcher = pattern.matcher("aB");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1663
        if (matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1664
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1665
        matcher = pattern.matcher("Ab");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1666
        if (matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1667
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1668
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1669
        // ASCII               "a"
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1670
        // Latin-1 Supplement  "a" + grave
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1671
        // Cyrillic            "a"
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1672
        String[] patterns = new String[] {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1673
            //single
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1674
            "a", "\u00e0", "\u0430",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1675
            //slice
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1676
            "ab", "\u00e0\u00e1", "\u0430\u0431",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1677
            //class single
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1678
            "[a]", "[\u00e0]", "[\u0430]",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1679
            //class range
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1680
            "[a-b]", "[\u00e0-\u00e5]", "[\u0430-\u0431]",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1681
            //back reference
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1682
            "(a)\\1", "(\u00e0)\\1", "(\u0430)\\1"
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1683
        };
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1684
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1685
        String[] texts = new String[] {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1686
            "A", "\u00c0", "\u0410",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1687
            "AB", "\u00c0\u00c1", "\u0410\u0411",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1688
            "A", "\u00c0", "\u0410",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1689
            "B", "\u00c2", "\u0411",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1690
            "aA", "\u00e0\u00c0", "\u0430\u0410"
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1691
        };
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1692
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1693
        boolean[] expected = new boolean[] {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1694
            true, false, false,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1695
            true, false, false,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1696
            true, false, false,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1697
            true, false, false,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1698
            true, false, false
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1699
        };
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1700
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1701
        flags = Pattern.CASE_INSENSITIVE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1702
        for (int i = 0; i < patterns.length; i++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1703
            pattern = Pattern.compile(patterns[i], flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1704
            matcher = pattern.matcher(texts[i]);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1705
            if (matcher.matches() != expected[i]) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1706
                System.out.println("<1> Failed at " + i);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1707
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1708
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1709
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1710
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1711
        flags = Pattern.CASE_INSENSITIVE | Pattern.UNICODE_CASE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1712
        for (int i = 0; i < patterns.length; i++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1713
            pattern = Pattern.compile(patterns[i], flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1714
            matcher = pattern.matcher(texts[i]);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1715
            if (!matcher.matches()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1716
                System.out.println("<2> Failed at " + i);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1717
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1718
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1719
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1720
        // flag unicode_case alone should do nothing
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1721
        flags = Pattern.UNICODE_CASE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1722
        for (int i = 0; i < patterns.length; i++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1723
            pattern = Pattern.compile(patterns[i], flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1724
            matcher = pattern.matcher(texts[i]);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1725
            if (matcher.matches()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1726
                System.out.println("<3> Failed at " + i);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1727
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1728
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1729
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1730
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1731
        // Special cases: i, I, u+0131 and u+0130
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1732
        flags = Pattern.UNICODE_CASE | Pattern.CASE_INSENSITIVE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1733
        pattern = Pattern.compile("[h-j]+", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1734
        if (!pattern.matcher("\u0131\u0130").matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1735
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1736
        report("Case Folding");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1737
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1738
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1739
    private static void appendTest() {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1740
        Pattern pattern = Pattern.compile("(ab)(cd)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1741
        Matcher matcher = pattern.matcher("abcd");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1742
        String result = matcher.replaceAll("$2$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1743
        if (!result.equals("cdab"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1744
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1745
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1746
        String  s1 = "Swap all: first = 123, second = 456";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1747
        String  s2 = "Swap one: first = 123, second = 456";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1748
        String  r  = "$3$2$1";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1749
        pattern = Pattern.compile("([a-z]+)( *= *)([0-9]+)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1750
        matcher = pattern.matcher(s1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1751
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1752
        result = matcher.replaceAll(r);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1753
        if (!result.equals("Swap all: 123 = first, 456 = second"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1754
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1755
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1756
        matcher = pattern.matcher(s2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1757
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1758
        if (matcher.find()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1759
            StringBuffer sb = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1760
            matcher.appendReplacement(sb, r);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1761
            matcher.appendTail(sb);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1762
            result = sb.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1763
            if (!result.equals("Swap one: 123 = first, second = 456"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1764
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1765
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1766
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1767
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1768
        pattern = Pattern.compile(toSupplementaries("(ab)(cd)"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1769
        matcher = pattern.matcher(toSupplementaries("abcd"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1770
        result = matcher.replaceAll("$2$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1771
        if (!result.equals(toSupplementaries("cdab")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1772
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1773
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1774
        s1 = toSupplementaries("Swap all: first = 123, second = 456");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1775
        s2 = toSupplementaries("Swap one: first = 123, second = 456");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1776
        r  = toSupplementaries("$3$2$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1777
        pattern = Pattern.compile(toSupplementaries("([a-z]+)( *= *)([0-9]+)"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1778
        matcher = pattern.matcher(s1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1779
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1780
        result = matcher.replaceAll(r);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1781
        if (!result.equals(toSupplementaries("Swap all: 123 = first, 456 = second")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1782
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1783
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1784
        matcher = pattern.matcher(s2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1785
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1786
        if (matcher.find()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1787
            StringBuffer sb = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1788
            matcher.appendReplacement(sb, r);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1789
            matcher.appendTail(sb);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1790
            result = sb.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1791
            if (!result.equals(toSupplementaries("Swap one: 123 = first, second = 456")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1792
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1793
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1794
        report("Append");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1795
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1796
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1797
    private static void splitTest() {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1798
        Pattern pattern = Pattern.compile(":");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1799
        String[] result = pattern.split("foo:and:boo", 2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1800
        if (!result[0].equals("foo"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1801
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1802
        if (!result[1].equals("and:boo"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1803
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1804
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1805
        Pattern patternX = Pattern.compile(toSupplementaries("X"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1806
        result = patternX.split(toSupplementaries("fooXandXboo"), 2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1807
        if (!result[0].equals(toSupplementaries("foo")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1808
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1809
        if (!result[1].equals(toSupplementaries("andXboo")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1810
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1811
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1812
        CharBuffer cb = CharBuffer.allocate(100);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1813
        cb.put("foo:and:boo");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1814
        cb.flip();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1815
        result = pattern.split(cb);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1816
        if (!result[0].equals("foo"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1817
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1818
        if (!result[1].equals("and"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1819
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1820
        if (!result[2].equals("boo"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1821
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1822
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1823
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1824
        CharBuffer cbs = CharBuffer.allocate(100);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1825
        cbs.put(toSupplementaries("fooXandXboo"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1826
        cbs.flip();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1827
        result = patternX.split(cbs);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1828
        if (!result[0].equals(toSupplementaries("foo")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1829
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1830
        if (!result[1].equals(toSupplementaries("and")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1831
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1832
        if (!result[2].equals(toSupplementaries("boo")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1833
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1834
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1835
        String source = "0123456789";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1836
        for (int limit=-2; limit<3; limit++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1837
            for (int x=0; x<10; x++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1838
                result = source.split(Integer.toString(x), limit);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1839
                int expectedLength = limit < 1 ? 2 : limit;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1840
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1841
                if ((limit == 0) && (x == 9)) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1842
                    // expected dropping of ""
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1843
                    if (result.length != 1)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1844
                        failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1845
                    if (!result[0].equals("012345678")) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1846
                        failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1847
                    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1848
                } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1849
                    if (result.length != expectedLength) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1850
                        failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1851
                    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1852
                    if (!result[0].equals(source.substring(0,x))) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1853
                        if (limit != 1) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1854
                            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1855
                        } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1856
                            if (!result[0].equals(source.substring(0,10))) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1857
                                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1858
                            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1859
                        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1860
                    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1861
                    if (expectedLength > 1) { // Check segment 2
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1862
                        if (!result[1].equals(source.substring(x+1,10)))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1863
                            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1864
                    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1865
                }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1866
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1867
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1868
        // Check the case for no match found
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1869
        for (int limit=-2; limit<3; limit++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1870
            result = source.split("e", limit);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1871
            if (result.length != 1)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1872
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1873
            if (!result[0].equals(source))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1874
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1875
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1876
        // Check the case for limit == 0, source = "";
21668
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1877
        // split() now returns 0-length for empty source "" see #6559590
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1878
        source = "";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1879
        result = source.split("e", 0);
21670
ca3553133ede 8028321: Fix for String.split() empty input sequence/JDK-6559590 triggers regression
sherman
parents: 21668
diff changeset
  1880
        if (result.length != 1)
ca3553133ede 8028321: Fix for String.split() empty input sequence/JDK-6559590 triggers regression
sherman
parents: 21668
diff changeset
  1881
            failCount++;
ca3553133ede 8028321: Fix for String.split() empty input sequence/JDK-6559590 triggers regression
sherman
parents: 21668
diff changeset
  1882
        if (!result[0].equals(source))
21668
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1883
            failCount++;
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1884
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1885
        // Check both split() and splitAsStraem(), especially for zero-lenth
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1886
        // input and zero-lenth match cases
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1887
        String[][] input = new String[][] {
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1888
            { " ",           "Abc Efg Hij" },   // normal non-zero-match
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1889
            { " ",           " Abc Efg Hij" },  // leading empty str for non-zero-match
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1890
            { " ",           "Abc  Efg Hij" },  // non-zero-match in the middle
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1891
            { "(?=\\p{Lu})", "AbcEfgHij" },     // no leading empty str for zero-match
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1892
            { "(?=\\p{Lu})", "AbcEfg" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1893
            { "(?=\\p{Lu})", "Abc" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1894
            { " ",           "" },              // zero-length input
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1895
            { ".*",          "" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1896
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1897
            // some tests from PatternStreamTest.java
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1898
            { "4",       "awgqwefg1fefw4vssv1vvv1" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1899
            { "\u00a3a", "afbfq\u00a3abgwgb\u00a3awngnwggw\u00a3a\u00a3ahjrnhneerh" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1900
            { "1",       "awgqwefg1fefw4vssv1vvv1" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1901
            { "1",       "a\u4ebafg1fefw\u4eba4\u9f9cvssv\u9f9c1v\u672c\u672cvv" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1902
            { "\u56da",  "1\u56da23\u56da456\u56da7890" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1903
            { "\u56da",  "1\u56da23\u9f9c\u672c\u672c\u56da456\u56da\u9f9c\u672c7890" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1904
            { "\u56da",  "" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1905
            { "[ \t,:.]","This is,testing: with\tdifferent separators." }, //multiple septs
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1906
            { "o",       "boo:and:foo" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1907
            { "o",       "booooo:and:fooooo" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1908
            { "o",       "fooooo:" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1909
        };
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1910
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1911
        String[][] expected = new String[][] {
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1912
            { "Abc", "Efg", "Hij" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1913
            { "", "Abc", "Efg", "Hij" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1914
            { "Abc", "", "Efg", "Hij" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1915
            { "Abc", "Efg", "Hij" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1916
            { "Abc", "Efg" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1917
            { "Abc" },
21670
ca3553133ede 8028321: Fix for String.split() empty input sequence/JDK-6559590 triggers regression
sherman
parents: 21668
diff changeset
  1918
            { "" },
ca3553133ede 8028321: Fix for String.split() empty input sequence/JDK-6559590 triggers regression
sherman
parents: 21668
diff changeset
  1919
            { "" },
21668
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1920
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1921
            { "awgqwefg1fefw", "vssv1vvv1" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1922
            { "afbfq", "bgwgb", "wngnwggw", "", "hjrnhneerh" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1923
            { "awgqwefg", "fefw4vssv", "vvv" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1924
            { "a\u4ebafg", "fefw\u4eba4\u9f9cvssv\u9f9c", "v\u672c\u672cvv" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1925
            { "1", "23", "456", "7890" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1926
            { "1", "23\u9f9c\u672c\u672c", "456", "\u9f9c\u672c7890" },
21670
ca3553133ede 8028321: Fix for String.split() empty input sequence/JDK-6559590 triggers regression
sherman
parents: 21668
diff changeset
  1927
            { "" },
21668
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1928
            { "This", "is", "testing", "", "with", "different", "separators" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1929
            { "b", "", ":and:f" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1930
            { "b", "", "", "", "", ":and:f" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1931
            { "f", "", "", "", "", ":" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1932
        };
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1933
        for (int i = 0; i < input.length; i++) {
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1934
            pattern = Pattern.compile(input[i][0]);
21670
ca3553133ede 8028321: Fix for String.split() empty input sequence/JDK-6559590 triggers regression
sherman
parents: 21668
diff changeset
  1935
            if (!Arrays.equals(pattern.split(input[i][1]), expected[i])) {
21668
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1936
                failCount++;
21670
ca3553133ede 8028321: Fix for String.split() empty input sequence/JDK-6559590 triggers regression
sherman
parents: 21668
diff changeset
  1937
            }
ca3553133ede 8028321: Fix for String.split() empty input sequence/JDK-6559590 triggers regression
sherman
parents: 21668
diff changeset
  1938
            if (input[i][1].length() > 0 &&  // splitAsStream() return empty resulting
ca3553133ede 8028321: Fix for String.split() empty input sequence/JDK-6559590 triggers regression
sherman
parents: 21668
diff changeset
  1939
                                             // array for zero-length input for now
ca3553133ede 8028321: Fix for String.split() empty input sequence/JDK-6559590 triggers regression
sherman
parents: 21668
diff changeset
  1940
                !Arrays.equals(pattern.splitAsStream(input[i][1]).toArray(),
ca3553133ede 8028321: Fix for String.split() empty input sequence/JDK-6559590 triggers regression
sherman
parents: 21668
diff changeset
  1941
                               expected[i])) {
21668
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1942
                failCount++;
21670
ca3553133ede 8028321: Fix for String.split() empty input sequence/JDK-6559590 triggers regression
sherman
parents: 21668
diff changeset
  1943
            }
21668
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1944
        }
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1945
        report("Split");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1946
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1947
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1948
    private static void negationTest() {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1949
        Pattern pattern = Pattern.compile("[\\[@^]+");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1950
        Matcher matcher = pattern.matcher("@@@@[[[[^^^^");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1951
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1952
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1953
        if (!matcher.group(0).equals("@@@@[[[[^^^^"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1954
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1955
        pattern = Pattern.compile("[@\\[^]+");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1956
        matcher = pattern.matcher("@@@@[[[[^^^^");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1957
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1958
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1959
        if (!matcher.group(0).equals("@@@@[[[[^^^^"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1960
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1961
        pattern = Pattern.compile("[@\\[^@]+");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1962
        matcher = pattern.matcher("@@@@[[[[^^^^");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1963
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1964
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1965
        if (!matcher.group(0).equals("@@@@[[[[^^^^"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1966
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1967
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1968
        pattern = Pattern.compile("\\)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1969
        matcher = pattern.matcher("xxx)xxx");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1970
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1971
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1972
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1973
        report("Negation");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1974
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1975
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1976
    private static void ampersandTest() {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1977
        Pattern pattern = Pattern.compile("[&@]+");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1978
        check(pattern, "@@@@&&&&", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1979
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1980
        pattern = Pattern.compile("[@&]+");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1981
        check(pattern, "@@@@&&&&", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1982
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1983
        pattern = Pattern.compile("[@\\&]+");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1984
        check(pattern, "@@@@&&&&", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1985
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1986
        report("Ampersand");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1987
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1988
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1989
    private static void octalTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1990
        Pattern pattern = Pattern.compile("\\u0007");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1991
        Matcher matcher = pattern.matcher("\u0007");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1992
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1993
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1994
        pattern = Pattern.compile("\\07");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1995
        matcher = pattern.matcher("\u0007");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1996
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1997
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1998
        pattern = Pattern.compile("\\007");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1999
        matcher = pattern.matcher("\u0007");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2000
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2001
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2002
        pattern = Pattern.compile("\\0007");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2003
        matcher = pattern.matcher("\u0007");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2004
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2005
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2006
        pattern = Pattern.compile("\\040");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2007
        matcher = pattern.matcher("\u0020");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2008
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2009
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2010
        pattern = Pattern.compile("\\0403");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2011
        matcher = pattern.matcher("\u00203");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2012
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2013
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2014
        pattern = Pattern.compile("\\0103");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2015
        matcher = pattern.matcher("\u0043");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2016
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2017
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2018
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2019
        report("Octal");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2020
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2021
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2022
    private static void longPatternTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2023
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2024
            Pattern pattern = Pattern.compile(
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2025
                "a 32-character-long pattern xxxx");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2026
            pattern = Pattern.compile("a 33-character-long pattern xxxxx");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2027
            pattern = Pattern.compile("a thirty four character long regex");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2028
            StringBuffer patternToBe = new StringBuffer(101);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2029
            for (int i=0; i<100; i++)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2030
                patternToBe.append((char)(97 + i%26));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2031
            pattern = Pattern.compile(patternToBe.toString());
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2032
        } catch (PatternSyntaxException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2033
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2034
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2035
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2036
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2037
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2038
            Pattern pattern = Pattern.compile(
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2039
                toSupplementaries("a 32-character-long pattern xxxx"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2040
            pattern = Pattern.compile(toSupplementaries("a 33-character-long pattern xxxxx"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2041
            pattern = Pattern.compile(toSupplementaries("a thirty four character long regex"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2042
            StringBuffer patternToBe = new StringBuffer(101*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2043
            for (int i=0; i<100; i++)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2044
                patternToBe.append(Character.toChars(Character.MIN_SUPPLEMENTARY_CODE_POINT
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2045
                                                     + 97 + i%26));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2046
            pattern = Pattern.compile(patternToBe.toString());
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2047
        } catch (PatternSyntaxException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2048
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2049
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2050
        report("LongPattern");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2051
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2052
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2053
    private static void group0Test() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2054
        Pattern pattern = Pattern.compile("(tes)ting");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2055
        Matcher matcher = pattern.matcher("testing");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2056
        check(matcher, "testing");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2057
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2058
        matcher.reset("testing");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2059
        if (matcher.lookingAt()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2060
            if (!matcher.group(0).equals("testing"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2061
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2062
        } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2063
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2064
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2065
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2066
        matcher.reset("testing");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2067
        if (matcher.matches()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2068
            if (!matcher.group(0).equals("testing"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2069
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2070
        } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2071
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2072
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2073
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2074
        pattern = Pattern.compile("(tes)ting");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2075
        matcher = pattern.matcher("testing");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2076
        if (matcher.lookingAt()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2077
            if (!matcher.group(0).equals("testing"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2078
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2079
        } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2080
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2081
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2082
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2083
        pattern = Pattern.compile("^(tes)ting");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2084
        matcher = pattern.matcher("testing");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2085
        if (matcher.matches()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2086
            if (!matcher.group(0).equals("testing"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2087
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2088
        } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2089
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2090
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2091
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2092
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2093
        pattern = Pattern.compile(toSupplementaries("(tes)ting"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2094
        matcher = pattern.matcher(toSupplementaries("testing"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2095
        check(matcher, toSupplementaries("testing"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2096
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2097
        matcher.reset(toSupplementaries("testing"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2098
        if (matcher.lookingAt()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2099
            if (!matcher.group(0).equals(toSupplementaries("testing")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2100
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2101
        } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2102
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2103
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2104
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2105
        matcher.reset(toSupplementaries("testing"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2106
        if (matcher.matches()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2107
            if (!matcher.group(0).equals(toSupplementaries("testing")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2108
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2109
        } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2110
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2111
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2112
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2113
        pattern = Pattern.compile(toSupplementaries("(tes)ting"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2114
        matcher = pattern.matcher(toSupplementaries("testing"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2115
        if (matcher.lookingAt()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2116
            if (!matcher.group(0).equals(toSupplementaries("testing")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2117
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2118
        } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2119
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2120
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2121
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2122
        pattern = Pattern.compile(toSupplementaries("^(tes)ting"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2123
        matcher = pattern.matcher(toSupplementaries("testing"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2124
        if (matcher.matches()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2125
            if (!matcher.group(0).equals(toSupplementaries("testing")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2126
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2127
        } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2128
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2129
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2130
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2131
        report("Group0");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2132
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2133
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2134
    private static void findIntTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2135
        Pattern p = Pattern.compile("blah");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2136
        Matcher m = p.matcher("zzzzblahzzzzzblah");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2137
        boolean result = m.find(2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2138
        if (!result)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2139
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2140
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2141
        p = Pattern.compile("$");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2142
        m = p.matcher("1234567890");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2143
        result = m.find(10);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2144
        if (!result)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2145
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2146
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2147
            result = m.find(11);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2148
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2149
        } catch (IndexOutOfBoundsException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2150
            // correct result
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2151
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2152
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2153
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2154
        p = Pattern.compile(toSupplementaries("blah"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2155
        m = p.matcher(toSupplementaries("zzzzblahzzzzzblah"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2156
        result = m.find(2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2157
        if (!result)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2158
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2159
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2160
        report("FindInt");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2161
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2162
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2163
    private static void emptyPatternTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2164
        Pattern p = Pattern.compile("");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2165
        Matcher m = p.matcher("foo");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2166
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2167
        // Should find empty pattern at beginning of input
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2168
        boolean result = m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2169
        if (result != true)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2170
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2171
        if (m.start() != 0)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2172
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2173
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2174
        // Should not match entire input if input is not empty
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2175
        m.reset();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2176
        result = m.matches();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2177
        if (result == true)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2178
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2179
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2180
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2181
            m.start(0);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2182
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2183
        } catch (IllegalStateException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2184
            // Correct result
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2185
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2186
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2187
        // Should match entire input if input is empty
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2188
        m.reset("");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2189
        result = m.matches();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2190
        if (result != true)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2191
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2192
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2193
        result = Pattern.matches("", "");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2194
        if (result != true)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2195
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2196
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2197
        result = Pattern.matches("", "foo");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2198
        if (result == true)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2199
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2200
        report("EmptyPattern");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2201
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2202
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2203
    private static void charClassTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2204
        Pattern pattern = Pattern.compile("blah[ab]]blech");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2205
        check(pattern, "blahb]blech", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2206
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2207
        pattern = Pattern.compile("[abc[def]]");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2208
        check(pattern, "b", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2209
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2210
        // Supplementary character tests
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2211
        pattern = Pattern.compile(toSupplementaries("blah[ab]]blech"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2212
        check(pattern, toSupplementaries("blahb]blech"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2213
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2214
        pattern = Pattern.compile(toSupplementaries("[abc[def]]"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2215
        check(pattern, toSupplementaries("b"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2216
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2217
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2218
            // u00ff when UNICODE_CASE
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2219
            pattern = Pattern.compile("[ab\u00ffcd]",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2220
                                      Pattern.CASE_INSENSITIVE|
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2221
                                      Pattern.UNICODE_CASE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2222
            check(pattern, "ab\u00ffcd", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2223
            check(pattern, "Ab\u0178Cd", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2224
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2225
            // u00b5 when UNICODE_CASE
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2226
            pattern = Pattern.compile("[ab\u00b5cd]",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2227
                                      Pattern.CASE_INSENSITIVE|
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2228
                                      Pattern.UNICODE_CASE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2229
            check(pattern, "ab\u00b5cd", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2230
            check(pattern, "Ab\u039cCd", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2231
        } catch (Exception e) { failCount++; }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2232
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2233
        /* Special cases
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2234
           (1)LatinSmallLetterLongS u+017f
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2235
           (2)LatinSmallLetterDotlessI u+0131
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2236
           (3)LatineCapitalLetterIWithDotAbove u+0130
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2237
           (4)KelvinSign u+212a
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2238
           (5)AngstromSign u+212b
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2239
        */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2240
        int flags = Pattern.UNICODE_CASE | Pattern.CASE_INSENSITIVE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2241
        pattern = Pattern.compile("[sik\u00c5]+", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2242
        if (!pattern.matcher("\u017f\u0130\u0131\u212a\u212b").matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2243
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2244
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2245
        report("CharClass");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2246
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2247
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2248
    private static void caretTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2249
        Pattern pattern = Pattern.compile("\\w*");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2250
        Matcher matcher = pattern.matcher("a#bc#def##g");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2251
        check(matcher, "a");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2252
        check(matcher, "");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2253
        check(matcher, "bc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2254
        check(matcher, "");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2255
        check(matcher, "def");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2256
        check(matcher, "");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2257
        check(matcher, "");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2258
        check(matcher, "g");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2259
        check(matcher, "");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2260
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2261
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2262
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2263
        pattern = Pattern.compile("^\\w*");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2264
        matcher = pattern.matcher("a#bc#def##g");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2265
        check(matcher, "a");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2266
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2267
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2268
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2269
        pattern = Pattern.compile("\\w");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2270
        matcher = pattern.matcher("abc##x");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2271
        check(matcher, "a");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2272
        check(matcher, "b");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2273
        check(matcher, "c");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2274
        check(matcher, "x");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2275
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2276
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2277
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2278
        pattern = Pattern.compile("^\\w");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2279
        matcher = pattern.matcher("abc##x");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2280
        check(matcher, "a");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2281
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2282
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2283
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2284
        pattern = Pattern.compile("\\A\\p{Alpha}{3}");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2285
        matcher = pattern.matcher("abcdef-ghi\njklmno");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2286
        check(matcher, "abc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2287
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2288
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2289
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2290
        pattern = Pattern.compile("^\\p{Alpha}{3}", Pattern.MULTILINE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2291
        matcher = pattern.matcher("abcdef-ghi\njklmno");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2292
        check(matcher, "abc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2293
        check(matcher, "jkl");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2294
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2295
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2296
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2297
        pattern = Pattern.compile("^", Pattern.MULTILINE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2298
        matcher = pattern.matcher("this is some text");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2299
        String result = matcher.replaceAll("X");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2300
        if (!result.equals("Xthis is some text"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2301
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2302
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2303
        pattern = Pattern.compile("^");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2304
        matcher = pattern.matcher("this is some text");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2305
        result = matcher.replaceAll("X");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2306
        if (!result.equals("Xthis is some text"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2307
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2308
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2309
        pattern = Pattern.compile("^", Pattern.MULTILINE | Pattern.UNIX_LINES);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2310
        matcher = pattern.matcher("this is some text\n");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2311
        result = matcher.replaceAll("X");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2312
        if (!result.equals("Xthis is some text\n"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2313
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2314
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2315
        report("Caret");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2316
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2317
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2318
    private static void groupCaptureTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2319
        // Independent group
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2320
        Pattern pattern = Pattern.compile("x+(?>y+)z+");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2321
        Matcher matcher = pattern.matcher("xxxyyyzzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2322
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2323
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2324
            String blah = matcher.group(1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2325
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2326
        } catch (IndexOutOfBoundsException ioobe) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2327
            // Good result
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2328
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2329
        // Pure group
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2330
        pattern = Pattern.compile("x+(?:y+)z+");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2331
        matcher = pattern.matcher("xxxyyyzzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2332
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2333
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2334
            String blah = matcher.group(1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2335
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2336
        } catch (IndexOutOfBoundsException ioobe) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2337
            // Good result
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2338
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2339
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2340
        // Supplementary character tests
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2341
        // Independent group
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2342
        pattern = Pattern.compile(toSupplementaries("x+(?>y+)z+"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2343
        matcher = pattern.matcher(toSupplementaries("xxxyyyzzz"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2344
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2345
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2346
            String blah = matcher.group(1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2347
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2348
        } catch (IndexOutOfBoundsException ioobe) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2349
            // Good result
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2350
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2351
        // Pure group
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2352
        pattern = Pattern.compile(toSupplementaries("x+(?:y+)z+"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2353
        matcher = pattern.matcher(toSupplementaries("xxxyyyzzz"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2354
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2355
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2356
            String blah = matcher.group(1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2357
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2358
        } catch (IndexOutOfBoundsException ioobe) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2359
            // Good result
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2360
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2361
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2362
        report("GroupCapture");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2363
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2364
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2365
    private static void backRefTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2366
        Pattern pattern = Pattern.compile("(a*)bc\\1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2367
        check(pattern, "zzzaabcazzz", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2368
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2369
        pattern = Pattern.compile("(a*)bc\\1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2370
        check(pattern, "zzzaabcaazzz", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2371
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2372
        pattern = Pattern.compile("(abc)(def)\\1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2373
        check(pattern, "abcdefabc", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2374
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2375
        pattern = Pattern.compile("(abc)(def)\\3");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2376
        check(pattern, "abcdefabc", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2377
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2378
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2379
            for (int i = 1; i < 10; i++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2380
                // Make sure backref 1-9 are always accepted
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2381
                pattern = Pattern.compile("abcdef\\" + i);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2382
                // and fail to match if the target group does not exit
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2383
                check(pattern, "abcdef", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2384
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2385
        } catch(PatternSyntaxException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2386
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2387
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2388
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2389
        pattern = Pattern.compile("(a)(b)(c)(d)(e)(f)(g)(h)(i)(j)\\11");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2390
        check(pattern, "abcdefghija", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2391
        check(pattern, "abcdefghija1", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2392
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2393
        pattern = Pattern.compile("(a)(b)(c)(d)(e)(f)(g)(h)(i)(j)(k)\\11");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2394
        check(pattern, "abcdefghijkk", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2395
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2396
        pattern = Pattern.compile("(a)bcdefghij\\11");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2397
        check(pattern, "abcdefghija1", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2398
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2399
        // Supplementary character tests
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2400
        pattern = Pattern.compile(toSupplementaries("(a*)bc\\1"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2401
        check(pattern, toSupplementaries("zzzaabcazzz"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2402
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2403
        pattern = Pattern.compile(toSupplementaries("(a*)bc\\1"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2404
        check(pattern, toSupplementaries("zzzaabcaazzz"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2405
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2406
        pattern = Pattern.compile(toSupplementaries("(abc)(def)\\1"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2407
        check(pattern, toSupplementaries("abcdefabc"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2408
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2409
        pattern = Pattern.compile(toSupplementaries("(abc)(def)\\3"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2410
        check(pattern, toSupplementaries("abcdefabc"), false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2411
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2412
        pattern = Pattern.compile(toSupplementaries("(a)(b)(c)(d)(e)(f)(g)(h)(i)(j)\\11"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2413
        check(pattern, toSupplementaries("abcdefghija"), false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2414
        check(pattern, toSupplementaries("abcdefghija1"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2415
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2416
        pattern = Pattern.compile(toSupplementaries("(a)(b)(c)(d)(e)(f)(g)(h)(i)(j)(k)\\11"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2417
        check(pattern, toSupplementaries("abcdefghijkk"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2418
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2419
        report("BackRef");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2420
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2421
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2422
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2423
     * Unicode Technical Report #18, section 2.6 End of Line
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2424
     * There is no empty line to be matched in the sequence \u000D\u000A
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2425
     * but there is an empty line in the sequence \u000A\u000D.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2426
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2427
    private static void anchorTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2428
        Pattern p = Pattern.compile("^.*$", Pattern.MULTILINE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2429
        Matcher m = p.matcher("blah1\r\nblah2");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2430
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2431
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2432
        if (!m.group().equals("blah2"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2433
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2434
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2435
        m.reset("blah1\n\rblah2");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2436
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2437
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2438
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2439
        if (!m.group().equals("blah2"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2440
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2441
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2442
        // Test behavior of $ with \r\n at end of input
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2443
        p = Pattern.compile(".+$");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2444
        m = p.matcher("blah1\r\n");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2445
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2446
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2447
       if (!m.group().equals("blah1"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2448
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2449
        if (m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2450
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2451
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2452
        // Test behavior of $ with \r\n at end of input in multiline
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2453
        p = Pattern.compile(".+$", Pattern.MULTILINE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2454
        m = p.matcher("blah1\r\n");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2455
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2456
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2457
        if (m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2458
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2459
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2460
        // Test for $ recognition of \u0085 for bug 4527731
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2461
        p = Pattern.compile(".+$", Pattern.MULTILINE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2462
        m = p.matcher("blah1\u0085");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2463
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2464
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2465
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2466
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2467
        p = Pattern.compile("^.*$", Pattern.MULTILINE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2468
        m = p.matcher(toSupplementaries("blah1\r\nblah2"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2469
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2470
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2471
        if (!m.group().equals(toSupplementaries("blah2")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2472
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2473
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2474
        m.reset(toSupplementaries("blah1\n\rblah2"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2475
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2476
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2477
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2478
        if (!m.group().equals(toSupplementaries("blah2")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2479
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2480
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2481
        // Test behavior of $ with \r\n at end of input
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2482
        p = Pattern.compile(".+$");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2483
        m = p.matcher(toSupplementaries("blah1\r\n"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2484
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2485
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2486
        if (!m.group().equals(toSupplementaries("blah1")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2487
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2488
        if (m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2489
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2490
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2491
        // Test behavior of $ with \r\n at end of input in multiline
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2492
        p = Pattern.compile(".+$", Pattern.MULTILINE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2493
        m = p.matcher(toSupplementaries("blah1\r\n"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2494
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2495
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2496
        if (m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2497
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2498
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2499
        // Test for $ recognition of \u0085 for bug 4527731
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2500
        p = Pattern.compile(".+$", Pattern.MULTILINE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2501
        m = p.matcher(toSupplementaries("blah1\u0085"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2502
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2503
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2504
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2505
        report("Anchors");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2506
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2507
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2508
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2509
     * A basic sanity test of Matcher.lookingAt().
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2510
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2511
    private static void lookingAtTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2512
        Pattern p = Pattern.compile("(ab)(c*)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2513
        Matcher m = p.matcher("abccczzzabcczzzabccc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2514
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2515
        if (!m.lookingAt())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2516
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2517
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2518
        if (!m.group().equals(m.group(0)))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2519
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2520
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2521
        m = p.matcher("zzzabccczzzabcczzzabccczzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2522
        if (m.lookingAt())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2523
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2524
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2525
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2526
        p = Pattern.compile(toSupplementaries("(ab)(c*)"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2527
        m = p.matcher(toSupplementaries("abccczzzabcczzzabccc"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2528
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2529
        if (!m.lookingAt())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2530
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2531
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2532
        if (!m.group().equals(m.group(0)))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2533
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2534
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2535
        m = p.matcher(toSupplementaries("zzzabccczzzabcczzzabccczzz"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2536
        if (m.lookingAt())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2537
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2538
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2539
        report("Looking At");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2540
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2541
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2542
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2543
     * A basic sanity test of Matcher.matches().
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2544
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2545
    private static void matchesTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2546
        // matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2547
        Pattern p = Pattern.compile("ulb(c*)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2548
        Matcher m = p.matcher("ulbcccccc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2549
        if (!m.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2550
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2551
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2552
        // find() but not matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2553
        m.reset("zzzulbcccccc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2554
        if (m.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2555
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2556
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2557
        // lookingAt() but not matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2558
        m.reset("ulbccccccdef");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2559
        if (m.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2560
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2561
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2562
        // matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2563
        p = Pattern.compile("a|ad");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2564
        m = p.matcher("ad");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2565
        if (!m.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2566
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2567
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2568
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2569
        // matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2570
        p = Pattern.compile(toSupplementaries("ulb(c*)"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2571
        m = p.matcher(toSupplementaries("ulbcccccc"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2572
        if (!m.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2573
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2574
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2575
        // find() but not matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2576
        m.reset(toSupplementaries("zzzulbcccccc"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2577
        if (m.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2578
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2579
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2580
        // lookingAt() but not matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2581
        m.reset(toSupplementaries("ulbccccccdef"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2582
        if (m.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2583
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2584
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2585
        // matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2586
        p = Pattern.compile(toSupplementaries("a|ad"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2587
        m = p.matcher(toSupplementaries("ad"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2588
        if (!m.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2589
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2590
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2591
        report("Matches");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2592
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2593
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2594
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2595
     * A basic sanity test of Pattern.matches().
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2596
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2597
    private static void patternMatchesTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2598
        // matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2599
        if (!Pattern.matches(toSupplementaries("ulb(c*)"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2600
                             toSupplementaries("ulbcccccc")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2601
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2602
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2603
        // find() but not matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2604
        if (Pattern.matches(toSupplementaries("ulb(c*)"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2605
                            toSupplementaries("zzzulbcccccc")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2606
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2607
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2608
        // lookingAt() but not matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2609
        if (Pattern.matches(toSupplementaries("ulb(c*)"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2610
                            toSupplementaries("ulbccccccdef")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2611
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2612
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2613
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2614
        // matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2615
        if (!Pattern.matches(toSupplementaries("ulb(c*)"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2616
                             toSupplementaries("ulbcccccc")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2617
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2618
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2619
        // find() but not matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2620
        if (Pattern.matches(toSupplementaries("ulb(c*)"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2621
                            toSupplementaries("zzzulbcccccc")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2622
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2623
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2624
        // lookingAt() but not matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2625
        if (Pattern.matches(toSupplementaries("ulb(c*)"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2626
                            toSupplementaries("ulbccccccdef")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2627
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2628
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2629
        report("Pattern Matches");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2630
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2631
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2632
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2633
     * Canonical equivalence testing. Tests the ability of the engine
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2634
     * to match sequences that are not explicitly specified in the
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2635
     * pattern when they are considered equivalent by the Unicode Standard.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2636
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2637
    private static void ceTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2638
        // Decomposed char outside char classes
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2639
        Pattern p = Pattern.compile("testa\u030a", Pattern.CANON_EQ);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2640
        Matcher m = p.matcher("test\u00e5");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2641
        if (!m.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2642
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2643
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2644
        m.reset("testa\u030a");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2645
        if (!m.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2646
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2647
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2648
        // Composed char outside char classes
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2649
        p = Pattern.compile("test\u00e5", Pattern.CANON_EQ);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2650
        m = p.matcher("test\u00e5");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2651
        if (!m.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2652
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2653
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2654
        m.reset("testa\u030a");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2655
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2656
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2657
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2658
        // Decomposed char inside a char class
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2659
        p = Pattern.compile("test[abca\u030a]", Pattern.CANON_EQ);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2660
        m = p.matcher("test\u00e5");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2661
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2662
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2663
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2664
        m.reset("testa\u030a");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2665
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2666
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2667
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2668
        // Composed char inside a char class
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2669
        p = Pattern.compile("test[abc\u00e5def\u00e0]", Pattern.CANON_EQ);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2670
        m = p.matcher("test\u00e5");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2671
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2672
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2673
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2674
        m.reset("testa\u0300");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2675
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2676
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2677
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2678
        m.reset("testa\u030a");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2679
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2680
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2681
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2682
        // Marks that cannot legally change order and be equivalent
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2683
        p = Pattern.compile("testa\u0308\u0300", Pattern.CANON_EQ);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2684
        check(p, "testa\u0308\u0300", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2685
        check(p, "testa\u0300\u0308", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2686
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2687
        // Marks that can legally change order and be equivalent
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2688
        p = Pattern.compile("testa\u0308\u0323", Pattern.CANON_EQ);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2689
        check(p, "testa\u0308\u0323", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2690
        check(p, "testa\u0323\u0308", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2691
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2692
        // Test all equivalences of the sequence a\u0308\u0323\u0300
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2693
        p = Pattern.compile("testa\u0308\u0323\u0300", Pattern.CANON_EQ);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2694
        check(p, "testa\u0308\u0323\u0300", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2695
        check(p, "testa\u0323\u0308\u0300", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2696
        check(p, "testa\u0308\u0300\u0323", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2697
        check(p, "test\u00e4\u0323\u0300", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2698
        check(p, "test\u00e4\u0300\u0323", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2699
37882
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2700
        Object[][] data = new Object[][] {
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2701
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2702
        // JDK-4867170
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2703
        { "[\u1f80-\u1f82]", "ab\u1f80cd",             "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2704
        { "[\u1f80-\u1f82]", "ab\u1f81cd",             "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2705
        { "[\u1f80-\u1f82]", "ab\u1f82cd",             "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2706
        { "[\u1f80-\u1f82]", "ab\u03b1\u0314\u0345cd", "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2707
        { "[\u1f80-\u1f82]", "ab\u03b1\u0345\u0314cd", "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2708
        { "[\u1f80-\u1f82]", "ab\u1f01\u0345cd",       "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2709
        { "[\u1f80-\u1f82]", "ab\u1f00\u0345cd",       "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2710
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2711
        { "\\p{IsGreek}",    "ab\u1f80cd",             "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2712
        { "\\p{IsGreek}",    "ab\u1f81cd",             "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2713
        { "\\p{IsGreek}",    "ab\u1f82cd",             "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2714
        { "\\p{IsGreek}",    "ab\u03b1\u0314\u0345cd", "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2715
        { "\\p{IsGreek}",    "ab\u1f01\u0345cd",       "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2716
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2717
        // backtracking, force to match "\u1f80", instead of \u1f82"
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2718
        { "ab\\p{IsGreek}\u0300cd", "ab\u03b1\u0313\u0345\u0300cd", "m", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2719
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2720
        { "[\\p{IsGreek}]",  "\u03b1\u0314\u0345",     "m", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2721
        { "\\p{IsGreek}",    "\u03b1\u0314\u0345",     "m", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2722
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2723
        { "[^\u1f80-\u1f82]","\u1f81",                 "m", false },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2724
        { "[^\u1f80-\u1f82]","\u03b1\u0314\u0345",     "m", false },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2725
        { "[^\u1f01\u0345]", "\u1f81",                 "f", false },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2726
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2727
        { "[^\u1f81]+",      "\u1f80\u1f82",           "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2728
        { "[\u1f80]",        "ab\u1f80cd",             "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2729
        { "\u1f80",          "ab\u1f80cd",             "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2730
        { "\u1f00\u0345\u0300",  "\u1f82", "m", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2731
        { "\u1f80",          "-\u1f00\u0345\u0300-",   "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2732
        { "\u1f82",          "\u1f00\u0345\u0300",     "m", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2733
        { "\u1f82",          "\u1f80\u0300",           "m", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2734
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2735
        // JDK-7080302       # compile failed
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2736
        { "a(\u0041\u0301\u0328)", "a\u0041\u0301\u0328", "m", true},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2737
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2738
        // JDK-6728861, same cause as above one
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2739
        { "\u00e9\u00e9n", "e\u0301e\u0301n", "m", true},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2740
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2741
        // JDK-6995635
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2742
        { "(\u00e9)", "e\u0301", "m", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2743
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2744
        // JDK-6736245
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2745
        // intereting special case, nfc(u2add+u0338) -> u2add+u0338) NOT u2adc
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2746
        { "\u2ADC", "\u2ADC", "m", true},          // NFC
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2747
        { "\u2ADC", "\u2ADD\u0338", "m", true},    // NFD
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2748
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2749
        //  4916384.
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2750
        // Decomposed hangul (jamos) works inside clazz
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2751
        { "[\u1100\u1161]", "\u1100\u1161", "m", true},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2752
        { "[\u1100\u1161]", "\uac00", "m", true},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2753
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2754
        { "[\uac00]", "\u1100\u1161", "m", true},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2755
        { "[\uac00]", "\uac00", "m", true},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2756
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2757
        // Decomposed hangul (jamos)
37882
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2758
        { "\u1100\u1161", "\u1100\u1161", "m", true},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2759
        { "\u1100\u1161", "\uac00", "m", true},
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2760
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2761
        // Composed hangul
37882
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2762
        { "\uac00",  "\u1100\u1161", "m", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2763
        { "\uac00",  "\uac00", "m", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2764
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2765
        /* Need a NFDSlice to nfd the source to solve this issue
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2766
           u+1d1c0 -> nfd: <u+1d1ba><u+1d165><u+1d16f>  -> nfc: <u+1d1ba><u+1d165><u+1d16f>
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2767
           u+1d1bc -> nfd: <u+1d1ba><u+1d165>           -> nfc: <u+1d1ba><u+1d165>
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2768
           <u+1d1bc><u+1d16f> -> nfd: <u+1d1ba><u+1d165><u+1d16f> -> nfc: <u+1d1ba><u+1d165><u+1d16f>
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2769
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2770
        // Decomposed supplementary outside char classes
37882
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2771
        // { "test\ud834\uddbc\ud834\udd6f", "test\ud834\uddc0", "m", true },
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2772
        // Composed supplementary outside char classes
37882
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2773
        // { "test\ud834\uddc0", "test\ud834\uddbc\ud834\udd6f", "m", true },
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2774
        */
37882
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2775
        { "test\ud834\uddbc\ud834\udd6f", "test\ud834\uddbc\ud834\udd6f", "m", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2776
        { "test\ud834\uddc0",             "test\ud834\uddbc\ud834\udd6f", "m", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2777
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2778
        { "test\ud834\uddc0",             "test\ud834\uddc0",             "m", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2779
        { "test\ud834\uddbc\ud834\udd6f", "test\ud834\uddc0",             "m", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2780
        };
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2781
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2782
        int failCount = 0;
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2783
        for (Object[] d : data) {
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2784
            String pn = (String)d[0];
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2785
            String tt = (String)d[1];
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2786
            boolean isFind = "f".equals(((String)d[2]));
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2787
            boolean expected = (boolean)d[3];
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2788
            boolean ret = isFind ? Pattern.compile(pn, Pattern.CANON_EQ).matcher(tt).find()
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2789
                                 : Pattern.compile(pn, Pattern.CANON_EQ).matcher(tt).matches();
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2790
            if (ret != expected) {
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2791
                failCount++;
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2792
                continue;
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2793
            }
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2794
        }
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2795
        report("Canonical Equivalence");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2796
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2797
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2798
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2799
     * A basic sanity test of Matcher.replaceAll().
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2800
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2801
    private static void globalSubstitute() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2802
        // Global substitution with a literal
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2803
        Pattern p = Pattern.compile("(ab)(c*)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2804
        Matcher m = p.matcher("abccczzzabcczzzabccc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2805
        if (!m.replaceAll("test").equals("testzzztestzzztest"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2806
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2807
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2808
        m.reset("zzzabccczzzabcczzzabccczzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2809
        if (!m.replaceAll("test").equals("zzztestzzztestzzztestzzz"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2810
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2811
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2812
        // Global substitution with groups
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2813
        m.reset("zzzabccczzzabcczzzabccczzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2814
        String result = m.replaceAll("$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2815
        if (!result.equals("zzzabzzzabzzzabzzz"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2816
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2817
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2818
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2819
        // Global substitution with a literal
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2820
        p = Pattern.compile(toSupplementaries("(ab)(c*)"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2821
        m = p.matcher(toSupplementaries("abccczzzabcczzzabccc"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2822
        if (!m.replaceAll(toSupplementaries("test")).
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2823
            equals(toSupplementaries("testzzztestzzztest")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2824
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2825
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2826
        m.reset(toSupplementaries("zzzabccczzzabcczzzabccczzz"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2827
        if (!m.replaceAll(toSupplementaries("test")).
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2828
            equals(toSupplementaries("zzztestzzztestzzztestzzz")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2829
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2830
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2831
        // Global substitution with groups
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2832
        m.reset(toSupplementaries("zzzabccczzzabcczzzabccczzz"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2833
        result = m.replaceAll("$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2834
        if (!result.equals(toSupplementaries("zzzabzzzabzzzabzzz")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2835
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2836
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2837
        report("Global Substitution");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2838
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2839
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2840
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2841
     * Tests the usage of Matcher.appendReplacement() with literal
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2842
     * and group substitutions.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2843
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2844
    private static void stringbufferSubstitute() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2845
        // SB substitution with literal
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2846
        String blah = "zzzblahzzz";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2847
        Pattern p = Pattern.compile("blah");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2848
        Matcher m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2849
        StringBuffer result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2850
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2851
            m.appendReplacement(result, "blech");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2852
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2853
        } catch (IllegalStateException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2854
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2855
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2856
        m.appendReplacement(result, "blech");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2857
        if (!result.toString().equals("zzzblech"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2858
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2859
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2860
        m.appendTail(result);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2861
        if (!result.toString().equals("zzzblechzzz"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2862
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2863
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2864
        // SB substitution with groups
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2865
        blah = "zzzabcdzzz";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2866
        p = Pattern.compile("(ab)(cd)*");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2867
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2868
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2869
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2870
            m.appendReplacement(result, "$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2871
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2872
        } catch (IllegalStateException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2873
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2874
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2875
        m.appendReplacement(result, "$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2876
        if (!result.toString().equals("zzzab"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2877
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2878
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2879
        m.appendTail(result);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2880
        if (!result.toString().equals("zzzabzzz"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2881
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2882
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2883
        // SB substitution with 3 groups
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2884
        blah = "zzzabcdcdefzzz";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2885
        p = Pattern.compile("(ab)(cd)*(ef)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2886
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2887
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2888
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2889
            m.appendReplacement(result, "$1w$2w$3");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2890
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2891
        } catch (IllegalStateException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2892
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2893
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2894
        m.appendReplacement(result, "$1w$2w$3");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2895
        if (!result.toString().equals("zzzabwcdwef"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2896
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2897
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2898
        m.appendTail(result);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2899
        if (!result.toString().equals("zzzabwcdwefzzz"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2900
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2901
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2902
        // SB substitution with groups and three matches
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2903
        // skipping middle match
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2904
        blah = "zzzabcdzzzabcddzzzabcdzzz";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2905
        p = Pattern.compile("(ab)(cd*)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2906
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2907
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2908
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2909
            m.appendReplacement(result, "$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2910
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2911
        } catch (IllegalStateException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2912
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2913
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2914
        m.appendReplacement(result, "$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2915
        if (!result.toString().equals("zzzab"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2916
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2917
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2918
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2919
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2920
        m.appendReplacement(result, "$2");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2921
        if (!result.toString().equals("zzzabzzzabcddzzzcd"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2922
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2923
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2924
        m.appendTail(result);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2925
        if (!result.toString().equals("zzzabzzzabcddzzzcdzzz"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2926
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2927
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2928
        // Check to make sure escaped $ is ignored
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2929
        blah = "zzzabcdcdefzzz";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2930
        p = Pattern.compile("(ab)(cd)*(ef)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2931
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2932
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2933
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2934
        m.appendReplacement(result, "$1w\\$2w$3");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2935
        if (!result.toString().equals("zzzabw$2wef"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2936
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2937
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2938
        m.appendTail(result);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2939
        if (!result.toString().equals("zzzabw$2wefzzz"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2940
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2941
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2942
        // Check to make sure a reference to nonexistent group causes error
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2943
        blah = "zzzabcdcdefzzz";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2944
        p = Pattern.compile("(ab)(cd)*(ef)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2945
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2946
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2947
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2948
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2949
            m.appendReplacement(result, "$1w$5w$3");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2950
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2951
        } catch (IndexOutOfBoundsException ioobe) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2952
            // Correct result
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2953
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2954
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2955
        // Check double digit group references
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2956
        blah = "zzz123456789101112zzz";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2957
        p = Pattern.compile("(1)(2)(3)(4)(5)(6)(7)(8)(9)(10)(11)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2958
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2959
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2960
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2961
        m.appendReplacement(result, "$1w$11w$3");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2962
        if (!result.toString().equals("zzz1w11w3"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2963
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2964
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2965
        // Check to make sure it backs off $15 to $1 if only three groups
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2966
        blah = "zzzabcdcdefzzz";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2967
        p = Pattern.compile("(ab)(cd)*(ef)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2968
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2969
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2970
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2971
        m.appendReplacement(result, "$1w$15w$3");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2972
        if (!result.toString().equals("zzzabwab5wef"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2973
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2974
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2975
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2976
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2977
        // SB substitution with literal
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2978
        blah = toSupplementaries("zzzblahzzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2979
        p = Pattern.compile(toSupplementaries("blah"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2980
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2981
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2982
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2983
            m.appendReplacement(result, toSupplementaries("blech"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2984
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2985
        } catch (IllegalStateException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2986
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2987
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2988
        m.appendReplacement(result, toSupplementaries("blech"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2989
        if (!result.toString().equals(toSupplementaries("zzzblech")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2990
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2991
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2992
        m.appendTail(result);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2993
        if (!result.toString().equals(toSupplementaries("zzzblechzzz")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2994
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2995
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2996
        // SB substitution with groups
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2997
        blah = toSupplementaries("zzzabcdzzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2998
        p = Pattern.compile(toSupplementaries("(ab)(cd)*"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2999
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3000
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3001
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3002
            m.appendReplacement(result, "$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3003
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3004
        } catch (IllegalStateException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3005
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3006
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3007
        m.appendReplacement(result, "$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3008
        if (!result.toString().equals(toSupplementaries("zzzab")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3009
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3010
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3011
        m.appendTail(result);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3012
        if (!result.toString().equals(toSupplementaries("zzzabzzz")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3013
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3014
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3015
        // SB substitution with 3 groups
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3016
        blah = toSupplementaries("zzzabcdcdefzzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3017
        p = Pattern.compile(toSupplementaries("(ab)(cd)*(ef)"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3018
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3019
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3020
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3021
            m.appendReplacement(result, toSupplementaries("$1w$2w$3"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3022
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3023
        } catch (IllegalStateException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3024
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3025
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3026
        m.appendReplacement(result, toSupplementaries("$1w$2w$3"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3027
        if (!result.toString().equals(toSupplementaries("zzzabwcdwef")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3028
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3029
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3030
        m.appendTail(result);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3031
        if (!result.toString().equals(toSupplementaries("zzzabwcdwefzzz")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3032
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3033
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3034
        // SB substitution with groups and three matches
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3035
        // skipping middle match
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3036
        blah = toSupplementaries("zzzabcdzzzabcddzzzabcdzzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3037
        p = Pattern.compile(toSupplementaries("(ab)(cd*)"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3038
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3039
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3040
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3041
            m.appendReplacement(result, "$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3042
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3043
        } catch (IllegalStateException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3044
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3045
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3046
        m.appendReplacement(result, "$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3047
        if (!result.toString().equals(toSupplementaries("zzzab")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3048
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3049
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3050
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3051
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3052
        m.appendReplacement(result, "$2");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3053
        if (!result.toString().equals(toSupplementaries("zzzabzzzabcddzzzcd")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3054
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3055
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3056
        m.appendTail(result);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3057
        if (!result.toString().equals(toSupplementaries("zzzabzzzabcddzzzcdzzz")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3058
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3059
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3060
        // Check to make sure escaped $ is ignored
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3061
        blah = toSupplementaries("zzzabcdcdefzzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3062
        p = Pattern.compile(toSupplementaries("(ab)(cd)*(ef)"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3063
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3064
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3065
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3066
        m.appendReplacement(result, toSupplementaries("$1w\\$2w$3"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3067
        if (!result.toString().equals(toSupplementaries("zzzabw$2wef")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3068
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3069
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3070
        m.appendTail(result);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3071
        if (!result.toString().equals(toSupplementaries("zzzabw$2wefzzz")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3072
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3073
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3074
        // Check to make sure a reference to nonexistent group causes error
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3075
        blah = toSupplementaries("zzzabcdcdefzzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3076
        p = Pattern.compile(toSupplementaries("(ab)(cd)*(ef)"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3077
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3078
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3079
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3080
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3081
            m.appendReplacement(result, toSupplementaries("$1w$5w$3"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3082
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3083
        } catch (IndexOutOfBoundsException ioobe) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3084
            // Correct result
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3085
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3086
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3087
        // Check double digit group references
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3088
        blah = toSupplementaries("zzz123456789101112zzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3089
        p = Pattern.compile("(1)(2)(3)(4)(5)(6)(7)(8)(9)(10)(11)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3090
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3091
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3092
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3093
        m.appendReplacement(result, toSupplementaries("$1w$11w$3"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3094
        if (!result.toString().equals(toSupplementaries("zzz1w11w3")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3095
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3096
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3097
        // Check to make sure it backs off $15 to $1 if only three groups
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3098
        blah = toSupplementaries("zzzabcdcdefzzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3099
        p = Pattern.compile(toSupplementaries("(ab)(cd)*(ef)"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3100
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3101
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3102
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3103
        m.appendReplacement(result, toSupplementaries("$1w$15w$3"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3104
        if (!result.toString().equals(toSupplementaries("zzzabwab5wef")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3105
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3106
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3107
        // Check nothing has been appended into the output buffer if
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3108
        // the replacement string triggers IllegalArgumentException.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3109
        p = Pattern.compile("(abc)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3110
        m = p.matcher("abcd");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3111
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3112
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3113
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3114
            m.appendReplacement(result, ("xyz$g"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3115
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3116
        } catch (IllegalArgumentException iae) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3117
            if (result.length() != 0)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3118
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3119
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3120
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3121
        report("SB Substitution");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3122
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3123
23734
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3124
    /**
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3125
     * Tests the usage of Matcher.appendReplacement() with literal
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3126
     * and group substitutions.
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3127
     */
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3128
    private static void stringbuilderSubstitute() throws Exception {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3129
        // SB substitution with literal
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3130
        String blah = "zzzblahzzz";
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3131
        Pattern p = Pattern.compile("blah");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3132
        Matcher m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3133
        StringBuilder result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3134
        try {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3135
            m.appendReplacement(result, "blech");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3136
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3137
        } catch (IllegalStateException e) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3138
        }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3139
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3140
        m.appendReplacement(result, "blech");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3141
        if (!result.toString().equals("zzzblech"))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3142
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3143
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3144
        m.appendTail(result);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3145
        if (!result.toString().equals("zzzblechzzz"))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3146
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3147
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3148
        // SB substitution with groups
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3149
        blah = "zzzabcdzzz";
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3150
        p = Pattern.compile("(ab)(cd)*");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3151
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3152
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3153
        try {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3154
            m.appendReplacement(result, "$1");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3155
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3156
        } catch (IllegalStateException e) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3157
        }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3158
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3159
        m.appendReplacement(result, "$1");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3160
        if (!result.toString().equals("zzzab"))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3161
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3162
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3163
        m.appendTail(result);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3164
        if (!result.toString().equals("zzzabzzz"))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3165
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3166
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3167
        // SB substitution with 3 groups
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3168
        blah = "zzzabcdcdefzzz";
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3169
        p = Pattern.compile("(ab)(cd)*(ef)");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3170
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3171
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3172
        try {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3173
            m.appendReplacement(result, "$1w$2w$3");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3174
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3175
        } catch (IllegalStateException e) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3176
        }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3177
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3178
        m.appendReplacement(result, "$1w$2w$3");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3179
        if (!result.toString().equals("zzzabwcdwef"))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3180
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3181
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3182
        m.appendTail(result);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3183
        if (!result.toString().equals("zzzabwcdwefzzz"))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3184
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3185
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3186
        // SB substitution with groups and three matches
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3187
        // skipping middle match
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3188
        blah = "zzzabcdzzzabcddzzzabcdzzz";
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3189
        p = Pattern.compile("(ab)(cd*)");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3190
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3191
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3192
        try {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3193
            m.appendReplacement(result, "$1");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3194
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3195
        } catch (IllegalStateException e) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3196
        }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3197
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3198
        m.appendReplacement(result, "$1");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3199
        if (!result.toString().equals("zzzab"))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3200
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3201
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3202
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3203
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3204
        m.appendReplacement(result, "$2");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3205
        if (!result.toString().equals("zzzabzzzabcddzzzcd"))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3206
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3207
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3208
        m.appendTail(result);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3209
        if (!result.toString().equals("zzzabzzzabcddzzzcdzzz"))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3210
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3211
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3212
        // Check to make sure escaped $ is ignored
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3213
        blah = "zzzabcdcdefzzz";
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3214
        p = Pattern.compile("(ab)(cd)*(ef)");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3215
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3216
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3217
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3218
        m.appendReplacement(result, "$1w\\$2w$3");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3219
        if (!result.toString().equals("zzzabw$2wef"))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3220
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3221
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3222
        m.appendTail(result);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3223
        if (!result.toString().equals("zzzabw$2wefzzz"))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3224
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3225
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3226
        // Check to make sure a reference to nonexistent group causes error
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3227
        blah = "zzzabcdcdefzzz";
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3228
        p = Pattern.compile("(ab)(cd)*(ef)");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3229
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3230
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3231
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3232
        try {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3233
            m.appendReplacement(result, "$1w$5w$3");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3234
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3235
        } catch (IndexOutOfBoundsException ioobe) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3236
            // Correct result
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3237
        }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3238
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3239
        // Check double digit group references
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3240
        blah = "zzz123456789101112zzz";
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3241
        p = Pattern.compile("(1)(2)(3)(4)(5)(6)(7)(8)(9)(10)(11)");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3242
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3243
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3244
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3245
        m.appendReplacement(result, "$1w$11w$3");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3246
        if (!result.toString().equals("zzz1w11w3"))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3247
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3248
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3249
        // Check to make sure it backs off $15 to $1 if only three groups
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3250
        blah = "zzzabcdcdefzzz";
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3251
        p = Pattern.compile("(ab)(cd)*(ef)");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3252
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3253
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3254
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3255
        m.appendReplacement(result, "$1w$15w$3");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3256
        if (!result.toString().equals("zzzabwab5wef"))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3257
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3258
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3259
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3260
        // Supplementary character test
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3261
        // SB substitution with literal
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3262
        blah = toSupplementaries("zzzblahzzz");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3263
        p = Pattern.compile(toSupplementaries("blah"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3264
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3265
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3266
        try {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3267
            m.appendReplacement(result, toSupplementaries("blech"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3268
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3269
        } catch (IllegalStateException e) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3270
        }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3271
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3272
        m.appendReplacement(result, toSupplementaries("blech"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3273
        if (!result.toString().equals(toSupplementaries("zzzblech")))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3274
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3275
        m.appendTail(result);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3276
        if (!result.toString().equals(toSupplementaries("zzzblechzzz")))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3277
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3278
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3279
        // SB substitution with groups
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3280
        blah = toSupplementaries("zzzabcdzzz");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3281
        p = Pattern.compile(toSupplementaries("(ab)(cd)*"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3282
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3283
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3284
        try {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3285
            m.appendReplacement(result, "$1");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3286
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3287
        } catch (IllegalStateException e) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3288
        }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3289
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3290
        m.appendReplacement(result, "$1");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3291
        if (!result.toString().equals(toSupplementaries("zzzab")))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3292
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3293
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3294
        m.appendTail(result);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3295
        if (!result.toString().equals(toSupplementaries("zzzabzzz")))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3296
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3297
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3298
        // SB substitution with 3 groups
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3299
        blah = toSupplementaries("zzzabcdcdefzzz");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3300
        p = Pattern.compile(toSupplementaries("(ab)(cd)*(ef)"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3301
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3302
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3303
        try {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3304
            m.appendReplacement(result, toSupplementaries("$1w$2w$3"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3305
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3306
        } catch (IllegalStateException e) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3307
        }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3308
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3309
        m.appendReplacement(result, toSupplementaries("$1w$2w$3"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3310
        if (!result.toString().equals(toSupplementaries("zzzabwcdwef")))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3311
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3312
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3313
        m.appendTail(result);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3314
        if (!result.toString().equals(toSupplementaries("zzzabwcdwefzzz")))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3315
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3316
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3317
        // SB substitution with groups and three matches
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3318
        // skipping middle match
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3319
        blah = toSupplementaries("zzzabcdzzzabcddzzzabcdzzz");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3320
        p = Pattern.compile(toSupplementaries("(ab)(cd*)"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3321
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3322
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3323
        try {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3324
            m.appendReplacement(result, "$1");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3325
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3326
        } catch (IllegalStateException e) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3327
        }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3328
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3329
        m.appendReplacement(result, "$1");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3330
        if (!result.toString().equals(toSupplementaries("zzzab")))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3331
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3332
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3333
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3334
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3335
        m.appendReplacement(result, "$2");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3336
        if (!result.toString().equals(toSupplementaries("zzzabzzzabcddzzzcd")))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3337
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3338
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3339
        m.appendTail(result);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3340
        if (!result.toString().equals(toSupplementaries("zzzabzzzabcddzzzcdzzz")))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3341
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3342
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3343
        // Check to make sure escaped $ is ignored
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3344
        blah = toSupplementaries("zzzabcdcdefzzz");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3345
        p = Pattern.compile(toSupplementaries("(ab)(cd)*(ef)"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3346
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3347
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3348
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3349
        m.appendReplacement(result, toSupplementaries("$1w\\$2w$3"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3350
        if (!result.toString().equals(toSupplementaries("zzzabw$2wef")))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3351
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3352
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3353
        m.appendTail(result);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3354
        if (!result.toString().equals(toSupplementaries("zzzabw$2wefzzz")))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3355
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3356
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3357
        // Check to make sure a reference to nonexistent group causes error
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3358
        blah = toSupplementaries("zzzabcdcdefzzz");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3359
        p = Pattern.compile(toSupplementaries("(ab)(cd)*(ef)"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3360
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3361
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3362
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3363
        try {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3364
            m.appendReplacement(result, toSupplementaries("$1w$5w$3"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3365
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3366
        } catch (IndexOutOfBoundsException ioobe) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3367
            // Correct result
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3368
        }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3369
        // Check double digit group references
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3370
        blah = toSupplementaries("zzz123456789101112zzz");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3371
        p = Pattern.compile("(1)(2)(3)(4)(5)(6)(7)(8)(9)(10)(11)");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3372
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3373
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3374
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3375
        m.appendReplacement(result, toSupplementaries("$1w$11w$3"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3376
        if (!result.toString().equals(toSupplementaries("zzz1w11w3")))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3377
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3378
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3379
        // Check to make sure it backs off $15 to $1 if only three groups
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3380
        blah = toSupplementaries("zzzabcdcdefzzz");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3381
        p = Pattern.compile(toSupplementaries("(ab)(cd)*(ef)"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3382
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3383
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3384
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3385
        m.appendReplacement(result, toSupplementaries("$1w$15w$3"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3386
        if (!result.toString().equals(toSupplementaries("zzzabwab5wef")))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3387
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3388
        // Check nothing has been appended into the output buffer if
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3389
        // the replacement string triggers IllegalArgumentException.
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3390
        p = Pattern.compile("(abc)");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3391
        m = p.matcher("abcd");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3392
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3393
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3394
        try {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3395
            m.appendReplacement(result, ("xyz$g"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3396
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3397
        } catch (IllegalArgumentException iae) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3398
            if (result.length() != 0)
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3399
                failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3400
        }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3401
        report("SB Substitution 2");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3402
    }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3403
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3404
    /*
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3405
     * 5 groups of characters are created to make a substitution string.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3406
     * A base string will be created including random lead chars, the
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3407
     * substitution string, and random trailing chars.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3408
     * A pattern containing the 5 groups is searched for and replaced with:
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3409
     * random group + random string + random group.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3410
     * The results are checked for correctness.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3411
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3412
    private static void substitutionBasher() {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3413
        for (int runs = 0; runs<1000; runs++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3414
            // Create a base string to work in
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3415
            int leadingChars = generator.nextInt(10);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3416
            StringBuffer baseBuffer = new StringBuffer(100);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3417
            String leadingString = getRandomAlphaString(leadingChars);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3418
            baseBuffer.append(leadingString);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3419
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3420
            // Create 5 groups of random number of random chars
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3421
            // Create the string to substitute
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3422
            // Create the pattern string to search for
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3423
            StringBuffer bufferToSub = new StringBuffer(25);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3424
            StringBuffer bufferToPat = new StringBuffer(50);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3425
            String[] groups = new String[5];
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3426
            for(int i=0; i<5; i++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3427
                int aGroupSize = generator.nextInt(5)+1;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3428
                groups[i] = getRandomAlphaString(aGroupSize);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3429
                bufferToSub.append(groups[i]);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3430
                bufferToPat.append('(');
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3431
                bufferToPat.append(groups[i]);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3432
                bufferToPat.append(')');
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3433
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3434
            String stringToSub = bufferToSub.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3435
            String pattern = bufferToPat.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3436
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3437
            // Place sub string into working string at random index
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3438
            baseBuffer.append(stringToSub);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3439
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3440
            // Append random chars to end
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3441
            int trailingChars = generator.nextInt(10);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3442
            String trailingString = getRandomAlphaString(trailingChars);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3443
            baseBuffer.append(trailingString);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3444
            String baseString = baseBuffer.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3445
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3446
            // Create test pattern and matcher
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3447
            Pattern p = Pattern.compile(pattern);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3448
            Matcher m = p.matcher(baseString);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3449
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3450
            // Reject candidate if pattern happens to start early
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3451
            m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3452
            if (m.start() < leadingChars)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3453
                continue;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3454
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3455
            // Reject candidate if more than one match
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3456
            if (m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3457
                continue;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3458
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3459
            // Construct a replacement string with :
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3460
            // random group + random string + random group
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3461
            StringBuffer bufferToRep = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3462
            int groupIndex1 = generator.nextInt(5);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3463
            bufferToRep.append("$" + (groupIndex1 + 1));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3464
            String randomMidString = getRandomAlphaString(5);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3465
            bufferToRep.append(randomMidString);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3466
            int groupIndex2 = generator.nextInt(5);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3467
            bufferToRep.append("$" + (groupIndex2 + 1));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3468
            String replacement = bufferToRep.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3469
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3470
            // Do the replacement
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3471
            String result = m.replaceAll(replacement);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3472
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3473
            // Construct expected result
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3474
            StringBuffer bufferToRes = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3475
            bufferToRes.append(leadingString);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3476
            bufferToRes.append(groups[groupIndex1]);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3477
            bufferToRes.append(randomMidString);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3478
            bufferToRes.append(groups[groupIndex2]);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3479
            bufferToRes.append(trailingString);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3480
            String expectedResult = bufferToRes.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3481
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3482
            // Check results
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3483
            if (!result.equals(expectedResult))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3484
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3485
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3486
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3487
        report("Substitution Basher");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3488
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3489
23734
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3490
    /*
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3491
     * 5 groups of characters are created to make a substitution string.
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3492
     * A base string will be created including random lead chars, the
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3493
     * substitution string, and random trailing chars.
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3494
     * A pattern containing the 5 groups is searched for and replaced with:
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3495
     * random group + random string + random group.
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3496
     * The results are checked for correctness.
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3497
     */
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3498
    private static void substitutionBasher2() {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3499
        for (int runs = 0; runs<1000; runs++) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3500
            // Create a base string to work in
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3501
            int leadingChars = generator.nextInt(10);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3502
            StringBuilder baseBuffer = new StringBuilder(100);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3503
            String leadingString = getRandomAlphaString(leadingChars);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3504
            baseBuffer.append(leadingString);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3505
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3506
            // Create 5 groups of random number of random chars
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3507
            // Create the string to substitute
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3508
            // Create the pattern string to search for
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3509
            StringBuilder bufferToSub = new StringBuilder(25);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3510
            StringBuilder bufferToPat = new StringBuilder(50);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3511
            String[] groups = new String[5];
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3512
            for(int i=0; i<5; i++) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3513
                int aGroupSize = generator.nextInt(5)+1;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3514
                groups[i] = getRandomAlphaString(aGroupSize);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3515
                bufferToSub.append(groups[i]);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3516
                bufferToPat.append('(');
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3517
                bufferToPat.append(groups[i]);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3518
                bufferToPat.append(')');
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3519
            }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3520
            String stringToSub = bufferToSub.toString();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3521
            String pattern = bufferToPat.toString();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3522
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3523
            // Place sub string into working string at random index
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3524
            baseBuffer.append(stringToSub);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3525
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3526
            // Append random chars to end
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3527
            int trailingChars = generator.nextInt(10);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3528
            String trailingString = getRandomAlphaString(trailingChars);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3529
            baseBuffer.append(trailingString);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3530
            String baseString = baseBuffer.toString();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3531
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3532
            // Create test pattern and matcher
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3533
            Pattern p = Pattern.compile(pattern);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3534
            Matcher m = p.matcher(baseString);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3535
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3536
            // Reject candidate if pattern happens to start early
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3537
            m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3538
            if (m.start() < leadingChars)
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3539
                continue;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3540
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3541
            // Reject candidate if more than one match
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3542
            if (m.find())
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3543
                continue;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3544
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3545
            // Construct a replacement string with :
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3546
            // random group + random string + random group
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3547
            StringBuilder bufferToRep = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3548
            int groupIndex1 = generator.nextInt(5);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3549
            bufferToRep.append("$" + (groupIndex1 + 1));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3550
            String randomMidString = getRandomAlphaString(5);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3551
            bufferToRep.append(randomMidString);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3552
            int groupIndex2 = generator.nextInt(5);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3553
            bufferToRep.append("$" + (groupIndex2 + 1));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3554
            String replacement = bufferToRep.toString();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3555
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3556
            // Do the replacement
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3557
            String result = m.replaceAll(replacement);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3558
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3559
            // Construct expected result
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3560
            StringBuilder bufferToRes = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3561
            bufferToRes.append(leadingString);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3562
            bufferToRes.append(groups[groupIndex1]);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3563
            bufferToRes.append(randomMidString);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3564
            bufferToRes.append(groups[groupIndex2]);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3565
            bufferToRes.append(trailingString);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3566
            String expectedResult = bufferToRes.toString();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3567
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3568
            // Check results
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3569
            if (!result.equals(expectedResult)) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3570
                failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3571
            }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3572
        }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3573
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3574
        report("Substitution Basher 2");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3575
    }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3576
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3577
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3578
     * Checks the handling of some escape sequences that the Pattern
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3579
     * class should process instead of the java compiler. These are
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3580
     * not in the file because the escapes should be be processed
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3581
     * by the Pattern class when the regex is compiled.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3582
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3583
    private static void escapes() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3584
        Pattern p = Pattern.compile("\\043");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3585
        Matcher m = p.matcher("#");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3586
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3587
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3588
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3589
        p = Pattern.compile("\\x23");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3590
        m = p.matcher("#");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3591
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3592
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3593
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3594
        p = Pattern.compile("\\u0023");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3595
        m = p.matcher("#");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3596
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3597
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3598
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3599
        report("Escape sequences");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3600
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3601
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3602
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3603
     * Checks the handling of blank input situations. These
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3604
     * tests are incompatible with my test file format.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3605
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3606
    private static void blankInput() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3607
        Pattern p = Pattern.compile("abc", Pattern.CASE_INSENSITIVE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3608
        Matcher m = p.matcher("");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3609
        if (m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3610
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3611
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3612
        p = Pattern.compile("a*", Pattern.CASE_INSENSITIVE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3613
        m = p.matcher("");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3614
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3615
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3616
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3617
        p = Pattern.compile("abc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3618
        m = p.matcher("");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3619
        if (m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3620
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3621
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3622
        p = Pattern.compile("a*");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3623
        m = p.matcher("");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3624
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3625
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3626
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3627
        report("Blank input");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3628
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3629
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3630
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3631
     * Tests the Boyer-Moore pattern matching of a character sequence
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3632
     * on randomly generated patterns.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3633
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3634
    private static void bm() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3635
        doBnM('a');
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3636
        report("Boyer Moore (ASCII)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3637
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3638
        doBnM(Character.MIN_SUPPLEMENTARY_CODE_POINT - 10);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3639
        report("Boyer Moore (Supplementary)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3640
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3641
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3642
    private static void doBnM(int baseCharacter) throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3643
        int achar=0;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3644
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3645
        for (int i=0; i<100; i++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3646
            // Create a short pattern to search for
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3647
            int patternLength = generator.nextInt(7) + 4;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3648
            StringBuffer patternBuffer = new StringBuffer(patternLength);
31645
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3649
            String pattern;
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3650
            retry: for (;;) {
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3651
                for (int x=0; x<patternLength; x++) {
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3652
                    int ch = baseCharacter + generator.nextInt(26);
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3653
                    if (Character.isSupplementaryCodePoint(ch)) {
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3654
                        patternBuffer.append(Character.toChars(ch));
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3655
                    } else {
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3656
                        patternBuffer.append((char)ch);
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3657
                    }
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3658
                }
31645
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3659
                pattern = patternBuffer.toString();
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3660
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3661
                // Avoid patterns that start and end with the same substring
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3662
                // See JDK-6854417
34436
33c20335507c 8143854: java/util/regex/RegExTest.java.RegExTest failed
sherman
parents: 31645
diff changeset
  3663
                for (int x=1; x < pattern.length(); x++) {
31645
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3664
                    if (pattern.startsWith(pattern.substring(x)))
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3665
                        continue retry;
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3666
                }
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3667
                break;
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3668
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3669
            Pattern p = Pattern.compile(pattern);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3670
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3671
            // Create a buffer with random ASCII chars that does
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3672
            // not match the sample
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3673
            String toSearch = null;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3674
            StringBuffer s = null;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3675
            Matcher m = p.matcher("");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3676
            do {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3677
                s = new StringBuffer(100);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3678
                for (int x=0; x<100; x++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3679
                    int ch = baseCharacter + generator.nextInt(26);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3680
                    if (Character.isSupplementaryCodePoint(ch)) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3681
                        s.append(Character.toChars(ch));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3682
                    } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3683
                        s.append((char)ch);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3684
                    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3685
                }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3686
                toSearch = s.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3687
                m.reset(toSearch);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3688
            } while (m.find());
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3689
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3690
            // Insert the pattern at a random spot
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3691
            int insertIndex = generator.nextInt(99);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3692
            if (Character.isLowSurrogate(s.charAt(insertIndex)))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3693
                insertIndex++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3694
            s = s.insert(insertIndex, pattern);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3695
            toSearch = s.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3696
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3697
            // Make sure that the pattern is found
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3698
            m.reset(toSearch);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3699
            if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3700
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3701
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3702
            // Make sure that the match text is the pattern
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3703
            if (!m.group().equals(pattern))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3704
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3705
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3706
            // Make sure match occured at insertion point
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3707
            if (m.start() != insertIndex)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3708
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3709
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3710
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3711
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3712
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3713
     * Tests the matching of slices on randomly generated patterns.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3714
     * The Boyer-Moore optimization is not done on these patterns
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3715
     * because it uses unicode case folding.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3716
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3717
    private static void slice() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3718
        doSlice(Character.MAX_VALUE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3719
        report("Slice");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3720
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3721
        doSlice(Character.MAX_CODE_POINT);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3722
        report("Slice (Supplementary)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3723
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3724
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3725
    private static void doSlice(int maxCharacter) throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3726
        Random generator = new Random();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3727
        int achar=0;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3728
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3729
        for (int i=0; i<100; i++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3730
            // Create a short pattern to search for
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3731
            int patternLength = generator.nextInt(7) + 4;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3732
            StringBuffer patternBuffer = new StringBuffer(patternLength);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3733
            for (int x=0; x<patternLength; x++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3734
                int randomChar = 0;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3735
                while (!Character.isLetterOrDigit(randomChar))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3736
                    randomChar = generator.nextInt(maxCharacter);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3737
                if (Character.isSupplementaryCodePoint(randomChar)) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3738
                    patternBuffer.append(Character.toChars(randomChar));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3739
                } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3740
                    patternBuffer.append((char) randomChar);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3741
                }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3742
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3743
            String pattern =  patternBuffer.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3744
            Pattern p = Pattern.compile(pattern, Pattern.UNICODE_CASE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3745
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3746
            // Create a buffer with random chars that does not match the sample
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3747
            String toSearch = null;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3748
            StringBuffer s = null;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3749
            Matcher m = p.matcher("");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3750
            do {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3751
                s = new StringBuffer(100);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3752
                for (int x=0; x<100; x++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3753
                    int randomChar = 0;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3754
                    while (!Character.isLetterOrDigit(randomChar))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3755
                        randomChar = generator.nextInt(maxCharacter);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3756
                    if (Character.isSupplementaryCodePoint(randomChar)) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3757
                        s.append(Character.toChars(randomChar));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3758
                    } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3759
                        s.append((char) randomChar);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3760
                    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3761
                }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3762
                toSearch = s.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3763
                m.reset(toSearch);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3764
            } while (m.find());
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3765
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3766
            // Insert the pattern at a random spot
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3767
            int insertIndex = generator.nextInt(99);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3768
            if (Character.isLowSurrogate(s.charAt(insertIndex)))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3769
                insertIndex++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3770
            s = s.insert(insertIndex, pattern);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3771
            toSearch = s.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3772
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3773
            // Make sure that the pattern is found
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3774
            m.reset(toSearch);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3775
            if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3776
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3777
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3778
            // Make sure that the match text is the pattern
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3779
            if (!m.group().equals(pattern))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3780
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3781
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3782
            // Make sure match occured at insertion point
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3783
            if (m.start() != insertIndex)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3784
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3785
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3786
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3787
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3788
    private static void explainFailure(String pattern, String data,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3789
                                       String expected, String actual) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3790
        System.err.println("----------------------------------------");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3791
        System.err.println("Pattern = "+pattern);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3792
        System.err.println("Data = "+data);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3793
        System.err.println("Expected = " + expected);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3794
        System.err.println("Actual   = " + actual);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3795
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3796
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3797
    private static void explainFailure(String pattern, String data,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3798
                                       Throwable t) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3799
        System.err.println("----------------------------------------");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3800
        System.err.println("Pattern = "+pattern);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3801
        System.err.println("Data = "+data);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3802
        t.printStackTrace(System.err);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3803
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3804
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3805
    // Testing examples from a file
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3806
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3807
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3808
     * Goes through the file "TestCases.txt" and creates many patterns
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3809
     * described in the file, matching the patterns against input lines in
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3810
     * the file, and comparing the results against the correct results
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3811
     * also found in the file. The file format is described in comments
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3812
     * at the head of the file.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3813
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3814
    private static void processFile(String fileName) throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3815
        File testCases = new File(System.getProperty("test.src", "."),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3816
                                  fileName);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3817
        FileInputStream in = new FileInputStream(testCases);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3818
        BufferedReader r = new BufferedReader(new InputStreamReader(in));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3819
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3820
        // Process next test case.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3821
        String aLine;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3822
        while((aLine = r.readLine()) != null) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3823
            // Read a line for pattern
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3824
            String patternString = grabLine(r);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3825
            Pattern p = null;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3826
            try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3827
                p = compileTestPattern(patternString);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3828
            } catch (PatternSyntaxException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3829
                String dataString = grabLine(r);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3830
                String expectedResult = grabLine(r);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3831
                if (expectedResult.startsWith("error"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3832
                    continue;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3833
                explainFailure(patternString, dataString, e);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3834
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3835
                continue;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3836
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3837
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3838
            // Read a line for input string
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3839
            String dataString = grabLine(r);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3840
            Matcher m = p.matcher(dataString);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3841
            StringBuffer result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3842
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3843
            // Check for IllegalStateExceptions before a match
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3844
            failCount += preMatchInvariants(m);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3845
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3846
            boolean found = m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3847
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3848
            if (found)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3849
                failCount += postTrueMatchInvariants(m);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3850
            else
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3851
                failCount += postFalseMatchInvariants(m);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3852
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3853
            if (found) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3854
                result.append("true ");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3855
                result.append(m.group(0) + " ");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3856
            } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3857
                result.append("false ");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3858
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3859
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3860
            result.append(m.groupCount());
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3861
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3862
            if (found) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3863
                for (int i=1; i<m.groupCount()+1; i++)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3864
                    if (m.group(i) != null)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3865
                        result.append(" " +m.group(i));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3866
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3867
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3868
            // Read a line for the expected result
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3869
            String expectedResult = grabLine(r);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3870
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3871
            if (!result.toString().equals(expectedResult)) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3872
                explainFailure(patternString, dataString, expectedResult, result.toString());
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3873
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3874
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3875
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3876
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3877
        report(fileName);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3878
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3879
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3880
    private static int preMatchInvariants(Matcher m) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3881
        int failCount = 0;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3882
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3883
            m.start();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3884
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3885
        } catch (IllegalStateException ise) {}
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3886
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3887
            m.end();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3888
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3889
        } catch (IllegalStateException ise) {}
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3890
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3891
            m.group();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3892
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3893
        } catch (IllegalStateException ise) {}
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3894
        return failCount;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3895
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3896
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3897
    private static int postFalseMatchInvariants(Matcher m) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3898
        int failCount = 0;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3899
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3900
            m.group();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3901
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3902
        } catch (IllegalStateException ise) {}
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3903
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3904
            m.start();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3905
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3906
        } catch (IllegalStateException ise) {}
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3907
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3908
            m.end();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3909
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3910
        } catch (IllegalStateException ise) {}
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3911
        return failCount;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3912
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3913
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3914
    private static int postTrueMatchInvariants(Matcher m) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3915
        int failCount = 0;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3916
        //assert(m.start() = m.start(0);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3917
        if (m.start() != m.start(0))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3918
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3919
        //assert(m.end() = m.end(0);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3920
        if (m.start() != m.start(0))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3921
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3922
        //assert(m.group() = m.group(0);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3923
        if (!m.group().equals(m.group(0)))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3924
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3925
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3926
            m.group(50);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3927
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3928
        } catch (IndexOutOfBoundsException ise) {}
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3929
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3930
        return failCount;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3931
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3932
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3933
    private static Pattern compileTestPattern(String patternString) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3934
        if (!patternString.startsWith("'")) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3935
            return Pattern.compile(patternString);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3936
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3937
        int break1 = patternString.lastIndexOf("'");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3938
        String flagString = patternString.substring(
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3939
                                          break1+1, patternString.length());
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3940
        patternString = patternString.substring(1, break1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3941
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3942
        if (flagString.equals("i"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3943
            return Pattern.compile(patternString, Pattern.CASE_INSENSITIVE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3944
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3945
        if (flagString.equals("m"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3946
            return Pattern.compile(patternString, Pattern.MULTILINE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3947
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3948
        return Pattern.compile(patternString);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3949
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3950
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3951
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3952
     * Reads a line from the input file. Keeps reading lines until a non
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3953
     * empty non comment line is read. If the line contains a \n then
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3954
     * these two characters are replaced by a newline char. If a \\uxxxx
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3955
     * sequence is read then the sequence is replaced by the unicode char.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3956
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3957
    private static String grabLine(BufferedReader r) throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3958
        int index = 0;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3959
        String line = r.readLine();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3960
        while (line.startsWith("//") || line.length() < 1)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3961
            line = r.readLine();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3962
        while ((index = line.indexOf("\\n")) != -1) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3963
            StringBuffer temp = new StringBuffer(line);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3964
            temp.replace(index, index+2, "\n");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3965
            line = temp.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3966
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3967
        while ((index = line.indexOf("\\u")) != -1) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3968
            StringBuffer temp = new StringBuffer(line);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3969
            String value = temp.substring(index+2, index+6);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3970
            char aChar = (char)Integer.parseInt(value, 16);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3971
            String unicodeChar = "" + aChar;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3972
            temp.replace(index, index+6, unicodeChar);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3973
            line = temp.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3974
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3975
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3976
        return line;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3977
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3978
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3979
    private static void check(Pattern p, String s, String g, String expected) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3980
        Matcher m = p.matcher(s);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3981
        m.find();
17434
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  3982
        if (!m.group(g).equals(expected) ||
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  3983
            s.charAt(m.start(g)) != expected.charAt(0) ||
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  3984
            s.charAt(m.end(g) - 1) != expected.charAt(expected.length() - 1))
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3985
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3986
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3987
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3988
    private static void checkReplaceFirst(String p, String s, String r, String expected)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3989
    {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3990
        if (!expected.equals(Pattern.compile(p)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3991
                                    .matcher(s)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3992
                                    .replaceFirst(r)))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3993
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3994
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3995
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3996
    private static void checkReplaceAll(String p, String s, String r, String expected)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3997
    {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3998
        if (!expected.equals(Pattern.compile(p)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3999
                                    .matcher(s)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4000
                                    .replaceAll(r)))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4001
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4002
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4003
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4004
    private static void checkExpectedFail(String p) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4005
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4006
            Pattern.compile(p);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4007
        } catch (PatternSyntaxException pse) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4008
            //pse.printStackTrace();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4009
            return;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4010
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4011
        failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4012
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4013
17434
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4014
    private static void checkExpectedIAE(Matcher m, String g) {
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4015
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4016
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4017
            m.group(g);
17434
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4018
        } catch (IllegalArgumentException x) {
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4019
            //iae.printStackTrace();
17434
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4020
            try {
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4021
                m.start(g);
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4022
            } catch (IllegalArgumentException xx) {
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4023
                try {
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4024
                    m.start(g);
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4025
                } catch (IllegalArgumentException xxx) {
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4026
                    return;
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4027
                }
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4028
            }
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4029
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4030
        failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4031
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4032
17434
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4033
    private static void checkExpectedNPE(Matcher m) {
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4034
        m.find();
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4035
        try {
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4036
            m.group(null);
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4037
        } catch (NullPointerException x) {
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4038
            try {
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4039
                m.start(null);
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4040
            } catch (NullPointerException xx) {
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4041
                try {
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4042
                    m.end(null);
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4043
                } catch (NullPointerException xxx) {
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4044
                    return;
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4045
                }
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4046
            }
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4047
        }
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4048
        failCount++;
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4049
    }
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4050
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4051
    private static void namedGroupCaptureTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4052
        check(Pattern.compile("x+(?<gname>y+)z+"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4053
              "xxxyyyzzz",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4054
              "gname",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4055
              "yyy");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4056
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4057
        check(Pattern.compile("x+(?<gname8>y+)z+"),
2290
3a3bde061968 6817475: named-capturing group name started with digit causes PSE exception
sherman
parents: 2070
diff changeset
  4058
              "xxxyyyzzz",
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4059
              "gname8",
2290
3a3bde061968 6817475: named-capturing group name started with digit causes PSE exception
sherman
parents: 2070
diff changeset
  4060
              "yyy");
3a3bde061968 6817475: named-capturing group name started with digit causes PSE exception
sherman
parents: 2070
diff changeset
  4061
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4062
        //backref
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4063
        Pattern pattern = Pattern.compile("(a*)bc\\1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4064
        check(pattern, "zzzaabcazzz", true);  // found "abca"
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4065
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4066
        check(Pattern.compile("(?<gname>a*)bc\\k<gname>"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4067
              "zzzaabcaazzz", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4068
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4069
        check(Pattern.compile("(?<gname>abc)(def)\\k<gname>"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4070
              "abcdefabc", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4071
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4072
        check(Pattern.compile("(a)(b)(c)(d)(e)(f)(g)(h)(i)(j)(?<gname>k)\\k<gname>"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4073
              "abcdefghijkk", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4074
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4075
        // Supplementary character tests
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4076
        check(Pattern.compile("(?<gname>" + toSupplementaries("a*)bc") + "\\k<gname>"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4077
              toSupplementaries("zzzaabcazzz"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4078
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4079
        check(Pattern.compile("(?<gname>" + toSupplementaries("a*)bc") + "\\k<gname>"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4080
              toSupplementaries("zzzaabcaazzz"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4081
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4082
        check(Pattern.compile("(?<gname>" + toSupplementaries("abc)(def)") + "\\k<gname>"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4083
              toSupplementaries("abcdefabc"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4084
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4085
        check(Pattern.compile(toSupplementaries("(a)(b)(c)(d)(e)(f)(g)(h)(i)(j)") +
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4086
                              "(?<gname>" +
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4087
                              toSupplementaries("k)") + "\\k<gname>"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4088
              toSupplementaries("abcdefghijkk"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4089
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4090
        check(Pattern.compile("x+(?<gname>y+)z+\\k<gname>"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4091
              "xxxyyyzzzyyy",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4092
              "gname",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4093
              "yyy");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4094
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4095
        //replaceFirst/All
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4096
        checkReplaceFirst("(?<gn>ab)(c*)",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4097
                          "abccczzzabcczzzabccc",
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4098
                          "${gn}",
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4099
                          "abzzzabcczzzabccc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4100
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4101
        checkReplaceAll("(?<gn>ab)(c*)",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4102
                        "abccczzzabcczzzabccc",
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4103
                        "${gn}",
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4104
                        "abzzzabzzzab");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4105
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4106
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4107
        checkReplaceFirst("(?<gn>ab)(c*)",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4108
                          "zzzabccczzzabcczzzabccczzz",
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4109
                          "${gn}",
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4110
                          "zzzabzzzabcczzzabccczzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4111
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4112
        checkReplaceAll("(?<gn>ab)(c*)",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4113
                        "zzzabccczzzabcczzzabccczzz",
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4114
                        "${gn}",
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4115
                        "zzzabzzzabzzzabzzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4116
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4117
        checkReplaceFirst("(?<gn1>ab)(?<gn2>c*)",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4118
                          "zzzabccczzzabcczzzabccczzz",
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4119
                          "${gn2}",
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4120
                          "zzzccczzzabcczzzabccczzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4121
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4122
        checkReplaceAll("(?<gn1>ab)(?<gn2>c*)",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4123
                        "zzzabccczzzabcczzzabccczzz",
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4124
                        "${gn2}",
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4125
                        "zzzccczzzcczzzccczzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4126
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4127
        //toSupplementaries("(ab)(c*)"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4128
        checkReplaceFirst("(?<gn1>" + toSupplementaries("ab") +
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4129
                           ")(?<gn2>" + toSupplementaries("c") + "*)",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4130
                          toSupplementaries("abccczzzabcczzzabccc"),
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4131
                          "${gn1}",
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4132
                          toSupplementaries("abzzzabcczzzabccc"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4133
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4134
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4135
        checkReplaceAll("(?<gn1>" + toSupplementaries("ab") +
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4136
                        ")(?<gn2>" + toSupplementaries("c") + "*)",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4137
                        toSupplementaries("abccczzzabcczzzabccc"),
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4138
                        "${gn1}",
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4139
                        toSupplementaries("abzzzabzzzab"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4140
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4141
        checkReplaceFirst("(?<gn1>" + toSupplementaries("ab") +
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4142
                           ")(?<gn2>" + toSupplementaries("c") + "*)",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4143
                          toSupplementaries("abccczzzabcczzzabccc"),
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4144
                          "${gn2}",
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4145
                          toSupplementaries("ccczzzabcczzzabccc"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4146
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4147
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4148
        checkReplaceAll("(?<gn1>" + toSupplementaries("ab") +
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4149
                        ")(?<gn2>" + toSupplementaries("c") + "*)",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4150
                        toSupplementaries("abccczzzabcczzzabccc"),
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4151
                        "${gn2}",
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4152
                        toSupplementaries("ccczzzcczzzccc"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4153
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4154
        checkReplaceFirst("(?<dog>Dog)AndCat",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4155
                          "zzzDogAndCatzzzDogAndCatzzz",
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4156
                          "${dog}",
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4157
                          "zzzDogzzzDogAndCatzzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4158
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4159
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4160
        checkReplaceAll("(?<dog>Dog)AndCat",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4161
                          "zzzDogAndCatzzzDogAndCatzzz",
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4162
                          "${dog}",
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4163
                          "zzzDogzzzDogzzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4164
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4165
        // backref in Matcher & String
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4166
        if (!"abcdefghij".replaceFirst("cd(?<gn>ef)gh", "${gn}").equals("abefij") ||
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4167
            !"abbbcbdbefgh".replaceAll("(?<gn>[a-e])b", "${gn}").equals("abcdefgh"))
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4168
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4169
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4170
        // negative
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4171
        checkExpectedFail("(?<groupnamehasnoascii.in>abc)(def)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4172
        checkExpectedFail("(?<groupnamehasnoascii_in>abc)(def)");
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4173
        checkExpectedFail("(?<6groupnamestartswithdigit>abc)(def)");
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4174
        checkExpectedFail("(?<gname>abc)(def)\\k<gnameX>");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4175
        checkExpectedFail("(?<gname>abc)(?<gname>def)\\k<gnameX>");
17434
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4176
        checkExpectedIAE(Pattern.compile("(?<gname>abc)(def)").matcher("abcdef"),
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4177
                         "gnameX");
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4178
        checkExpectedNPE(Pattern.compile("(?<gname>abc)(def)").matcher("abcdef"));
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4179
        report("NamedGroupCapture");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4180
    }
4820
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4181
37882
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4182
    // This is for bug 6919132
4820
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4183
    private static void nonBmpClassComplementTest() throws Exception {
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4184
        Pattern p = Pattern.compile("\\P{Lu}");
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4185
        Matcher m = p.matcher(new String(new int[] {0x1d400}, 0, 1));
37882
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4186
4820
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4187
        if (m.find() && m.start() == 1)
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4188
            failCount++;
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4189
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4190
        // from a unicode category
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4191
        p = Pattern.compile("\\P{Lu}");
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4192
        m = p.matcher(new String(new int[] {0x1d400}, 0, 1));
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4193
        if (m.find())
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4194
            failCount++;
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4195
        if (!m.hitEnd())
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4196
            failCount++;
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4197
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4198
        // block
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4199
        p = Pattern.compile("\\P{InMathematicalAlphanumericSymbols}");
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4200
        m = p.matcher(new String(new int[] {0x1d400}, 0, 1));
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4201
        if (m.find() && m.start() == 1)
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4202
            failCount++;
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4203
37882
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4204
        p = Pattern.compile("\\P{sc=GRANTHA}");
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4205
        m = p.matcher(new String(new int[] {0x11350}, 0, 1));
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4206
        if (m.find() && m.start() == 1)
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4207
            failCount++;
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4208
4820
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4209
        report("NonBmpClassComplement");
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4210
    }
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4211
5610
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4212
    private static void unicodePropertiesTest() throws Exception {
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4213
        // different forms
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4214
        if (!Pattern.compile("\\p{IsLu}").matcher("A").matches() ||
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4215
            !Pattern.compile("\\p{Lu}").matcher("A").matches() ||
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4216
            !Pattern.compile("\\p{gc=Lu}").matcher("A").matches() ||
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4217
            !Pattern.compile("\\p{general_category=Lu}").matcher("A").matches() ||
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4218
            !Pattern.compile("\\p{IsLatin}").matcher("B").matches() ||
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4219
            !Pattern.compile("\\p{sc=Latin}").matcher("B").matches() ||
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4220
            !Pattern.compile("\\p{script=Latin}").matcher("B").matches() ||
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4221
            !Pattern.compile("\\p{InBasicLatin}").matcher("c").matches() ||
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4222
            !Pattern.compile("\\p{blk=BasicLatin}").matcher("c").matches() ||
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4223
            !Pattern.compile("\\p{block=BasicLatin}").matcher("c").matches())
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4224
            failCount++;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4225
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4226
        Matcher common  = Pattern.compile("\\p{script=Common}").matcher("");
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4227
        Matcher unknown = Pattern.compile("\\p{IsUnknown}").matcher("");
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4228
        Matcher lastSM  = common;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4229
        Character.UnicodeScript lastScript = Character.UnicodeScript.of(0);
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4230
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4231
        Matcher latin  = Pattern.compile("\\p{block=basic_latin}").matcher("");
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4232
        Matcher greek  = Pattern.compile("\\p{InGreek}").matcher("");
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4233
        Matcher lastBM = latin;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4234
        Character.UnicodeBlock lastBlock = Character.UnicodeBlock.of(0);
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4235
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4236
        for (int cp = 1; cp < Character.MAX_CODE_POINT; cp++) {
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4237
            if (cp >= 0x30000 && (cp & 0x70) == 0){
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4238
                continue;  // only pick couple code points, they are the same
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4239
            }
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4240
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4241
            // Unicode Script
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4242
            Character.UnicodeScript script = Character.UnicodeScript.of(cp);
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4243
            Matcher m;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4244
            String str = new String(Character.toChars(cp));
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4245
            if (script == lastScript) {
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4246
                 m = lastSM;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4247
                 m.reset(str);
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4248
            } else {
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4249
                 m  = Pattern.compile("\\p{Is" + script.name() + "}").matcher(str);
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4250
            }
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4251
            if (!m.matches()) {
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4252
                failCount++;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4253
            }
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4254
            Matcher other = (script == Character.UnicodeScript.COMMON)? unknown : common;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4255
            other.reset(str);
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4256
            if (other.matches()) {
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4257
                failCount++;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4258
            }
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4259
            lastSM = m;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4260
            lastScript = script;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4261
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4262
            // Unicode Block
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4263
            Character.UnicodeBlock block = Character.UnicodeBlock.of(cp);
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4264
            if (block == null) {
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4265
                //System.out.printf("Not a Block: cp=%x%n", cp);
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4266
                continue;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4267
            }
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4268
            if (block == lastBlock) {
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4269
                 m = lastBM;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4270
                 m.reset(str);
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4271
            } else {
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4272
                 m  = Pattern.compile("\\p{block=" + block.toString() + "}").matcher(str);
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4273
            }
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4274
            if (!m.matches()) {
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4275
                failCount++;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4276
            }
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4277
            other = (block == Character.UnicodeBlock.BASIC_LATIN)? greek : latin;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4278
            other.reset(str);
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4279
            if (other.matches()) {
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4280
                failCount++;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4281
            }
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4282
            lastBM = m;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4283
            lastBlock = block;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4284
        }
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4285
        report("unicodeProperties");
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4286
    }
8173
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4287
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4288
    private static void unicodeHexNotationTest() throws Exception {
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4289
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4290
        // negative
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4291
        checkExpectedFail("\\x{-23}");
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4292
        checkExpectedFail("\\x{110000}");
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4293
        checkExpectedFail("\\x{}");
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4294
        checkExpectedFail("\\x{AB[ef]");
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4295
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4296
        // codepoint
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4297
        check("^\\x{1033c}$",              "\uD800\uDF3C", true);
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4298
        check("^\\xF0\\x90\\x8C\\xBC$",    "\uD800\uDF3C", false);
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4299
        check("^\\x{D800}\\x{DF3c}+$",     "\uD800\uDF3C", false);
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4300
        check("^\\xF0\\x90\\x8C\\xBC$",    "\uD800\uDF3C", false);
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4301
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4302
        // in class
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4303
        check("^[\\x{D800}\\x{DF3c}]+$",   "\uD800\uDF3C", false);
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4304
        check("^[\\xF0\\x90\\x8C\\xBC]+$", "\uD800\uDF3C", false);
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4305
        check("^[\\x{D800}\\x{DF3C}]+$",   "\uD800\uDF3C", false);
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4306
        check("^[\\x{DF3C}\\x{D800}]+$",   "\uD800\uDF3C", false);
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4307
        check("^[\\x{D800}\\x{DF3C}]+$",   "\uDF3C\uD800", true);
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4308
        check("^[\\x{DF3C}\\x{D800}]+$",   "\uDF3C\uD800", true);
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4309
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4310
        for (int cp = 0; cp <= 0x10FFFF; cp++) {
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4311
             String s = "A" + new String(Character.toChars(cp)) + "B";
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4312
             String hexUTF16 = (cp <= 0xFFFF)? String.format("\\u%04x", cp)
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4313
                                             : String.format("\\u%04x\\u%04x",
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4314
                                               (int) Character.toChars(cp)[0],
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4315
                                               (int) Character.toChars(cp)[1]);
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4316
             String hexCodePoint = "\\x{" + Integer.toHexString(cp) + "}";
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4317
             if (!Pattern.matches("A" + hexUTF16 + "B", s))
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4318
                 failCount++;
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4319
             if (!Pattern.matches("A[" + hexUTF16 + "]B", s))
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4320
                 failCount++;
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4321
             if (!Pattern.matches("A" + hexCodePoint + "B", s))
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4322
                 failCount++;
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4323
             if (!Pattern.matches("A[" + hexCodePoint + "]B", s))
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4324
                 failCount++;
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4325
         }
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4326
         report("unicodeHexNotation");
9536
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4327
    }
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4328
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4329
    private static void unicodeClassesTest() throws Exception {
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4330
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4331
        Matcher lower  = Pattern.compile("\\p{Lower}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4332
        Matcher upper  = Pattern.compile("\\p{Upper}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4333
        Matcher ASCII  = Pattern.compile("\\p{ASCII}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4334
        Matcher alpha  = Pattern.compile("\\p{Alpha}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4335
        Matcher digit  = Pattern.compile("\\p{Digit}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4336
        Matcher alnum  = Pattern.compile("\\p{Alnum}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4337
        Matcher punct  = Pattern.compile("\\p{Punct}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4338
        Matcher graph  = Pattern.compile("\\p{Graph}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4339
        Matcher print  = Pattern.compile("\\p{Print}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4340
        Matcher blank  = Pattern.compile("\\p{Blank}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4341
        Matcher cntrl  = Pattern.compile("\\p{Cntrl}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4342
        Matcher xdigit = Pattern.compile("\\p{XDigit}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4343
        Matcher space  = Pattern.compile("\\p{Space}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4344
        Matcher bound  = Pattern.compile("\\b").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4345
        Matcher word   = Pattern.compile("\\w++").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4346
        // UNICODE_CHARACTER_CLASS
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4347
        Matcher lowerU  = Pattern.compile("\\p{Lower}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4348
        Matcher upperU  = Pattern.compile("\\p{Upper}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4349
        Matcher ASCIIU  = Pattern.compile("\\p{ASCII}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4350
        Matcher alphaU  = Pattern.compile("\\p{Alpha}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4351
        Matcher digitU  = Pattern.compile("\\p{Digit}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4352
        Matcher alnumU  = Pattern.compile("\\p{Alnum}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4353
        Matcher punctU  = Pattern.compile("\\p{Punct}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4354
        Matcher graphU  = Pattern.compile("\\p{Graph}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4355
        Matcher printU  = Pattern.compile("\\p{Print}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4356
        Matcher blankU  = Pattern.compile("\\p{Blank}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4357
        Matcher cntrlU  = Pattern.compile("\\p{Cntrl}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4358
        Matcher xdigitU = Pattern.compile("\\p{XDigit}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4359
        Matcher spaceU  = Pattern.compile("\\p{Space}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4360
        Matcher boundU  = Pattern.compile("\\b", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4361
        Matcher wordU   = Pattern.compile("\\w", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4362
        // embedded flag (?U)
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4363
        Matcher lowerEU  = Pattern.compile("(?U)\\p{Lower}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4364
        Matcher graphEU  = Pattern.compile("(?U)\\p{Graph}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4365
        Matcher wordEU   = Pattern.compile("(?U)\\w", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4366
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4367
        Matcher bwb    = Pattern.compile("\\b\\w\\b").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4368
        Matcher bwbU   = Pattern.compile("\\b\\w++\\b", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4369
        Matcher bwbEU  = Pattern.compile("(?U)\\b\\w++\\b", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4370
        // properties
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4371
        Matcher lowerP  = Pattern.compile("\\p{IsLowerCase}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4372
        Matcher upperP  = Pattern.compile("\\p{IsUpperCase}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4373
        Matcher titleP  = Pattern.compile("\\p{IsTitleCase}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4374
        Matcher letterP = Pattern.compile("\\p{IsLetter}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4375
        Matcher alphaP  = Pattern.compile("\\p{IsAlphabetic}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4376
        Matcher ideogP  = Pattern.compile("\\p{IsIdeographic}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4377
        Matcher cntrlP  = Pattern.compile("\\p{IsControl}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4378
        Matcher spaceP  = Pattern.compile("\\p{IsWhiteSpace}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4379
        Matcher definedP = Pattern.compile("\\p{IsAssigned}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4380
        Matcher nonCCPP = Pattern.compile("\\p{IsNoncharacterCodePoint}").matcher("");
17434
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4381
        Matcher joinCrtl = Pattern.compile("\\p{IsJoinControl}").matcher("");
9536
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4382
        // javaMethod
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4383
        Matcher lowerJ  = Pattern.compile("\\p{javaLowerCase}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4384
        Matcher upperJ  = Pattern.compile("\\p{javaUpperCase}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4385
        Matcher alphaJ  = Pattern.compile("\\p{javaAlphabetic}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4386
        Matcher ideogJ  = Pattern.compile("\\p{javaIdeographic}").matcher("");
38450
516990ff3a4c 8143282: \p{Cn} unassigned code points should be included in \p{C}
sherman
parents: 37882
diff changeset
  4387
        // GC/C
516990ff3a4c 8143282: \p{Cn} unassigned code points should be included in \p{C}
sherman
parents: 37882
diff changeset
  4388
        Matcher gcC  = Pattern.compile("\\p{C}").matcher("");
9536
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4389
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4390
        for (int cp = 1; cp < 0x30000; cp++) {
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4391
            String str = new String(Character.toChars(cp));
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4392
            int type = Character.getType(cp);
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4393
            if (// lower
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4394
                POSIX_ASCII.isLower(cp)   != lower.reset(str).matches()  ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4395
                Character.isLowerCase(cp) != lowerU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4396
                Character.isLowerCase(cp) != lowerP.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4397
                Character.isLowerCase(cp) != lowerEU.reset(str).matches()||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4398
                Character.isLowerCase(cp) != lowerJ.reset(str).matches()||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4399
                // upper
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4400
                POSIX_ASCII.isUpper(cp)   != upper.reset(str).matches()  ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4401
                POSIX_Unicode.isUpper(cp) != upperU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4402
                Character.isUpperCase(cp) != upperP.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4403
                Character.isUpperCase(cp) != upperJ.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4404
                // alpha
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4405
                POSIX_ASCII.isAlpha(cp)   != alpha.reset(str).matches()  ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4406
                POSIX_Unicode.isAlpha(cp) != alphaU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4407
                Character.isAlphabetic(cp)!= alphaP.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4408
                Character.isAlphabetic(cp)!= alphaJ.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4409
                // digit
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4410
                POSIX_ASCII.isDigit(cp)   != digit.reset(str).matches()  ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4411
                Character.isDigit(cp)     != digitU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4412
                // alnum
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4413
                POSIX_ASCII.isAlnum(cp)   != alnum.reset(str).matches()  ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4414
                POSIX_Unicode.isAlnum(cp) != alnumU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4415
                // punct
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4416
                POSIX_ASCII.isPunct(cp)   != punct.reset(str).matches()  ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4417
                POSIX_Unicode.isPunct(cp) != punctU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4418
                // graph
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4419
                POSIX_ASCII.isGraph(cp)   != graph.reset(str).matches()  ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4420
                POSIX_Unicode.isGraph(cp) != graphU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4421
                POSIX_Unicode.isGraph(cp) != graphEU.reset(str).matches()||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4422
                // blank
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4423
                POSIX_ASCII.isType(cp, POSIX_ASCII.BLANK)
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4424
                                          != blank.reset(str).matches()  ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4425
                POSIX_Unicode.isBlank(cp) != blankU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4426
                // print
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4427
                POSIX_ASCII.isPrint(cp)   != print.reset(str).matches()  ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4428
                POSIX_Unicode.isPrint(cp) != printU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4429
                // cntrl
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4430
                POSIX_ASCII.isCntrl(cp)   != cntrl.reset(str).matches()  ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4431
                POSIX_Unicode.isCntrl(cp) != cntrlU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4432
                (Character.CONTROL == type) != cntrlP.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4433
                // hexdigit
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4434
                POSIX_ASCII.isHexDigit(cp)   != xdigit.reset(str).matches()  ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4435
                POSIX_Unicode.isHexDigit(cp) != xdigitU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4436
                // space
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4437
                POSIX_ASCII.isSpace(cp)   != space.reset(str).matches()  ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4438
                POSIX_Unicode.isSpace(cp) != spaceU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4439
                POSIX_Unicode.isSpace(cp) != spaceP.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4440
                // word
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4441
                POSIX_ASCII.isWord(cp)   != word.reset(str).matches()  ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4442
                POSIX_Unicode.isWord(cp) != wordU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4443
                POSIX_Unicode.isWord(cp) != wordEU.reset(str).matches()||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4444
                // bwordb
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4445
                POSIX_ASCII.isWord(cp) != bwb.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4446
                POSIX_Unicode.isWord(cp) != bwbU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4447
                // properties
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4448
                Character.isTitleCase(cp) != titleP.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4449
                Character.isLetter(cp)    != letterP.reset(str).matches()||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4450
                Character.isIdeographic(cp) != ideogP.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4451
                Character.isIdeographic(cp) != ideogJ.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4452
                (Character.UNASSIGNED == type) == definedP.reset(str).matches() ||
17434
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4453
                POSIX_Unicode.isNoncharacterCodePoint(cp) != nonCCPP.reset(str).matches() ||
38450
516990ff3a4c 8143282: \p{Cn} unassigned code points should be included in \p{C}
sherman
parents: 37882
diff changeset
  4454
                POSIX_Unicode.isJoinControl(cp) != joinCrtl.reset(str).matches() ||
516990ff3a4c 8143282: \p{Cn} unassigned code points should be included in \p{C}
sherman
parents: 37882
diff changeset
  4455
                // gc_C
516990ff3a4c 8143282: \p{Cn} unassigned code points should be included in \p{C}
sherman
parents: 37882
diff changeset
  4456
                (Character.CONTROL == type || Character.FORMAT == type ||
516990ff3a4c 8143282: \p{Cn} unassigned code points should be included in \p{C}
sherman
parents: 37882
diff changeset
  4457
                 Character.PRIVATE_USE == type || Character.SURROGATE == type ||
516990ff3a4c 8143282: \p{Cn} unassigned code points should be included in \p{C}
sherman
parents: 37882
diff changeset
  4458
                 Character.UNASSIGNED == type)
516990ff3a4c 8143282: \p{Cn} unassigned code points should be included in \p{C}
sherman
parents: 37882
diff changeset
  4459
                != gcC.reset(str).matches()) {
9536
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4460
                failCount++;
38450
516990ff3a4c 8143282: \p{Cn} unassigned code points should be included in \p{C}
sherman
parents: 37882
diff changeset
  4461
            }
9536
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4462
        }
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4463
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4464
        // bounds/word align
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4465
        twoFindIndexes(" \u0180sherman\u0400 ", bound, 1, 10);
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4466
        if (!bwbU.reset("\u0180sherman\u0400").matches())
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4467
            failCount++;
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4468
        twoFindIndexes(" \u0180sh\u0345erman\u0400 ", bound, 1, 11);
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4469
        if (!bwbU.reset("\u0180sh\u0345erman\u0400").matches())
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4470
            failCount++;
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4471
        twoFindIndexes(" \u0724\u0739\u0724 ", bound, 1, 4);
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4472
        if (!bwbU.reset("\u0724\u0739\u0724").matches())
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4473
            failCount++;
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4474
        if (!bwbEU.reset("\u0724\u0739\u0724").matches())
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4475
            failCount++;
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4476
        report("unicodePredefinedClasses");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4477
    }
12675
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4478
35783
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4479
    private static void unicodeCharacterNameTest() throws Exception {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4480
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4481
        for (int cp = 0; cp < Character.MAX_CODE_POINT; cp++) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4482
            if (!Character.isValidCodePoint(cp) ||
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4483
                Character.getType(cp) == Character.UNASSIGNED)
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4484
                continue;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4485
            String str = new String(Character.toChars(cp));
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4486
            // single
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4487
            String p = "\\N{" + Character.getName(cp) + "}";
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4488
            if (!Pattern.compile(p).matcher(str).matches()) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4489
                failCount++;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4490
            }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4491
            // class[c]
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4492
            p = "[\\N{" + Character.getName(cp) + "}]";
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4493
            if (!Pattern.compile(p).matcher(str).matches()) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4494
                failCount++;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4495
            }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4496
        }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4497
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4498
        // range
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4499
        for (int i = 0; i < 10; i++) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4500
            int start = generator.nextInt(20);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4501
            int end = start + generator.nextInt(200);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4502
            String p = "[\\N{" + Character.getName(start) + "}-\\N{" + Character.getName(end) + "}]";
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4503
            String str;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4504
            for (int cp = start; cp < end; cp++) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4505
                str = new String(Character.toChars(cp));
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4506
                if (!Pattern.compile(p).matcher(str).matches()) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4507
                    failCount++;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4508
                }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4509
            }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4510
            str = new String(Character.toChars(end + 10));
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4511
            if (Pattern.compile(p).matcher(str).matches()) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4512
                failCount++;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4513
            }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4514
        }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4515
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4516
        // slice
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4517
        for (int i = 0; i < 10; i++) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4518
            int n = generator.nextInt(256);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4519
            int[] buf = new int[n];
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4520
            StringBuffer sb = new StringBuffer(1024);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4521
            for (int j = 0; j < n; j++) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4522
                int cp = generator.nextInt(1000);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4523
                if (!Character.isValidCodePoint(cp) ||
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4524
                    Character.getType(cp) == Character.UNASSIGNED)
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4525
                    cp = 0x4e00;    // just use 4e00
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4526
                sb.append("\\N{" + Character.getName(cp) + "}");
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4527
                buf[j] = cp;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4528
            }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4529
            String p = sb.toString();
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4530
            String str = new String(buf, 0, buf.length);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4531
            if (!Pattern.compile(p).matcher(str).matches()) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4532
                failCount++;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4533
            }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4534
        }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4535
        report("unicodeCharacterName");
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4536
    }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4537
12675
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4538
    private static void horizontalAndVerticalWSTest() throws Exception {
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4539
        String hws = new String (new char[] {
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4540
                                     0x09, 0x20, 0xa0, 0x1680, 0x180e,
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4541
                                     0x2000, 0x2001, 0x2002, 0x2003, 0x2004, 0x2005,
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4542
                                     0x2006, 0x2007, 0x2008, 0x2009, 0x200a,
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4543
                                     0x202f, 0x205f, 0x3000 });
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4544
        String vws = new String (new char[] {
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4545
                                     0x0a, 0x0b, 0x0c, 0x0d, 0x85, 0x2028, 0x2029 });
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4546
        if (!Pattern.compile("\\h+").matcher(hws).matches() ||
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4547
            !Pattern.compile("[\\h]+").matcher(hws).matches())
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4548
            failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4549
        if (Pattern.compile("\\H").matcher(hws).find() ||
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4550
            Pattern.compile("[\\H]").matcher(hws).find())
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4551
            failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4552
        if (!Pattern.compile("\\v+").matcher(vws).matches() ||
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4553
            !Pattern.compile("[\\v]+").matcher(vws).matches())
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4554
            failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4555
        if (Pattern.compile("\\V").matcher(vws).find() ||
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4556
            Pattern.compile("[\\V]").matcher(vws).find())
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4557
            failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4558
        String prefix = "abcd";
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4559
        String suffix = "efgh";
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4560
        String ng = "A";
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4561
        for (int i = 0; i < hws.length(); i++) {
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4562
            String c = String.valueOf(hws.charAt(i));
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4563
            Matcher m = Pattern.compile("\\h").matcher(prefix + c + suffix);
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4564
            if (!m.find() || !c.equals(m.group()))
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4565
                failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4566
            m = Pattern.compile("[\\h]").matcher(prefix + c + suffix);
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4567
            if (!m.find() || !c.equals(m.group()))
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4568
                failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4569
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4570
            m = Pattern.compile("\\H").matcher(hws.substring(0, i) + ng + hws.substring(i));
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4571
            if (!m.find() || !ng.equals(m.group()))
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4572
                failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4573
            m = Pattern.compile("[\\H]").matcher(hws.substring(0, i) + ng + hws.substring(i));
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4574
            if (!m.find() || !ng.equals(m.group()))
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4575
                failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4576
        }
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4577
        for (int i = 0; i < vws.length(); i++) {
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4578
            String c = String.valueOf(vws.charAt(i));
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4579
            Matcher m = Pattern.compile("\\v").matcher(prefix + c + suffix);
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4580
            if (!m.find() || !c.equals(m.group()))
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4581
                failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4582
            m = Pattern.compile("[\\v]").matcher(prefix + c + suffix);
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4583
            if (!m.find() || !c.equals(m.group()))
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4584
                failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4585
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4586
            m = Pattern.compile("\\V").matcher(vws.substring(0, i) + ng + vws.substring(i));
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4587
            if (!m.find() || !ng.equals(m.group()))
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4588
                failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4589
            m = Pattern.compile("[\\V]").matcher(vws.substring(0, i) + ng + vws.substring(i));
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4590
            if (!m.find() || !ng.equals(m.group()))
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4591
                failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4592
        }
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4593
        // \v in range is interpreted as 0x0B. This is the undocumented behavior
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4594
        if (!Pattern.compile("[\\v-\\v]").matcher(String.valueOf((char)0x0B)).matches())
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4595
            failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4596
        report("horizontalAndVerticalWSTest");
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4597
    }
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4598
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4599
    private static void linebreakTest() throws Exception {
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4600
        String linebreaks = new String (new char[] {
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4601
            0x0A, 0x0B, 0x0C, 0x0D, 0x85, 0x2028, 0x2029 });
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4602
        String crnl = "\r\n";
44122
65a14579a2ae 8176029: Linebreak matcher is not equivalent to the pattern as stated in javadoc
sherman
parents: 38777
diff changeset
  4603
        if (!(Pattern.compile("\\R+").matcher(linebreaks).matches() &&
65a14579a2ae 8176029: Linebreak matcher is not equivalent to the pattern as stated in javadoc
sherman
parents: 38777
diff changeset
  4604
              Pattern.compile("\\R").matcher(crnl).matches() &&
65a14579a2ae 8176029: Linebreak matcher is not equivalent to the pattern as stated in javadoc
sherman
parents: 38777
diff changeset
  4605
              Pattern.compile("\\Rabc").matcher(crnl + "abc").matches() &&
65a14579a2ae 8176029: Linebreak matcher is not equivalent to the pattern as stated in javadoc
sherman
parents: 38777
diff changeset
  4606
              Pattern.compile("\\Rabc").matcher("\rabc").matches() &&
65a14579a2ae 8176029: Linebreak matcher is not equivalent to the pattern as stated in javadoc
sherman
parents: 38777
diff changeset
  4607
              Pattern.compile("\\R\\R").matcher(crnl).matches() &&  // backtracking
65a14579a2ae 8176029: Linebreak matcher is not equivalent to the pattern as stated in javadoc
sherman
parents: 38777
diff changeset
  4608
              Pattern.compile("\\R\\n").matcher(crnl).matches()) && // backtracking
65a14579a2ae 8176029: Linebreak matcher is not equivalent to the pattern as stated in javadoc
sherman
parents: 38777
diff changeset
  4609
              !Pattern.compile("((?<!\\R)\\s)*").matcher(crnl).matches()) { // #8176029
65a14579a2ae 8176029: Linebreak matcher is not equivalent to the pattern as stated in javadoc
sherman
parents: 38777
diff changeset
  4610
            failCount++;
65a14579a2ae 8176029: Linebreak matcher is not equivalent to the pattern as stated in javadoc
sherman
parents: 38777
diff changeset
  4611
        }
12675
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4612
        report("linebreakTest");
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4613
    }
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4614
13554
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4615
    // #7189363
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4616
    private static void branchTest() throws Exception {
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4617
        if (!Pattern.compile("(a)?bc|d").matcher("d").find() ||     // greedy
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4618
            !Pattern.compile("(a)+bc|d").matcher("d").find() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4619
            !Pattern.compile("(a)*bc|d").matcher("d").find() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4620
            !Pattern.compile("(a)??bc|d").matcher("d").find() ||    // reluctant
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4621
            !Pattern.compile("(a)+?bc|d").matcher("d").find() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4622
            !Pattern.compile("(a)*?bc|d").matcher("d").find() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4623
            !Pattern.compile("(a)?+bc|d").matcher("d").find() ||    // possessive
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4624
            !Pattern.compile("(a)++bc|d").matcher("d").find() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4625
            !Pattern.compile("(a)*+bc|d").matcher("d").find() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4626
            !Pattern.compile("(a)?bc|d").matcher("d").matches() ||  // greedy
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4627
            !Pattern.compile("(a)+bc|d").matcher("d").matches() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4628
            !Pattern.compile("(a)*bc|d").matcher("d").matches() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4629
            !Pattern.compile("(a)??bc|d").matcher("d").matches() || // reluctant
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4630
            !Pattern.compile("(a)+?bc|d").matcher("d").matches() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4631
            !Pattern.compile("(a)*?bc|d").matcher("d").matches() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4632
            !Pattern.compile("(a)?+bc|d").matcher("d").matches() || // possessive
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4633
            !Pattern.compile("(a)++bc|d").matcher("d").matches() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4634
            !Pattern.compile("(a)*+bc|d").matcher("d").matches() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4635
            !Pattern.compile("(a)?bc|de").matcher("de").find() ||   // others
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4636
            !Pattern.compile("(a)??bc|de").matcher("de").find() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4637
            !Pattern.compile("(a)?bc|de").matcher("de").matches() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4638
            !Pattern.compile("(a)??bc|de").matcher("de").matches())
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4639
            failCount++;
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4640
        report("branchTest");
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4641
    }
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4642
17183
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4643
    // This test is for 8007395
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4644
    private static void groupCurlyNotFoundSuppTest() throws Exception {
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4645
        String input = "test this as \ud83d\ude0d";
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4646
        for (String pStr : new String[] { "test(.)+(@[a-zA-Z.]+)",
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4647
                                          "test(.)*(@[a-zA-Z.]+)",
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4648
                                          "test([^B])+(@[a-zA-Z.]+)",
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4649
                                          "test([^B])*(@[a-zA-Z.]+)",
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4650
                                          "test(\\P{IsControl})+(@[a-zA-Z.]+)",
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4651
                                          "test(\\P{IsControl})*(@[a-zA-Z.]+)",
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4652
                                        }) {
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4653
            Matcher m = Pattern.compile(pStr, Pattern.CASE_INSENSITIVE)
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4654
                               .matcher(input);
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4655
            try {
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4656
                if (m.find()) {
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4657
                    failCount++;
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4658
                }
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4659
            } catch (Exception x) {
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4660
                failCount++;
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4661
            }
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4662
        }
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4663
        report("GroupCurly NotFoundSupp");
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4664
    }
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4665
19604
f96e3aef2081 8023647: "abc1c".matches("(\\w)+1\\1")) returns false
sherman
parents: 17447
diff changeset
  4666
    // This test is for 8023647
f96e3aef2081 8023647: "abc1c".matches("(\\w)+1\\1")) returns false
sherman
parents: 17447
diff changeset
  4667
    private static void groupCurlyBackoffTest() throws Exception {
f96e3aef2081 8023647: "abc1c".matches("(\\w)+1\\1")) returns false
sherman
parents: 17447
diff changeset
  4668
        if (!"abc1c".matches("(\\w)+1\\1") ||
f96e3aef2081 8023647: "abc1c".matches("(\\w)+1\\1")) returns false
sherman
parents: 17447
diff changeset
  4669
            "abc11".matches("(\\w)+1\\1")) {
f96e3aef2081 8023647: "abc1c".matches("(\\w)+1\\1")) returns false
sherman
parents: 17447
diff changeset
  4670
            failCount++;
f96e3aef2081 8023647: "abc1c".matches("(\\w)+1\\1")) returns false
sherman
parents: 17447
diff changeset
  4671
        }
f96e3aef2081 8023647: "abc1c".matches("(\\w)+1\\1")) returns false
sherman
parents: 17447
diff changeset
  4672
        report("GroupCurly backoff");
f96e3aef2081 8023647: "abc1c".matches("(\\w)+1\\1")) returns false
sherman
parents: 17447
diff changeset
  4673
    }
f96e3aef2081 8023647: "abc1c".matches("(\\w)+1\\1")) returns false
sherman
parents: 17447
diff changeset
  4674
17447
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4675
    // This test is for 8012646
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4676
    private static void patternAsPredicate() throws Exception {
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4677
        Predicate<String> p = Pattern.compile("[a-z]+").asPredicate();
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4678
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4679
        if (p.test("")) {
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4680
            failCount++;
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4681
        }
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4682
        if (!p.test("word")) {
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4683
            failCount++;
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4684
        }
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4685
        if (p.test("1234")) {
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4686
            failCount++;
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4687
        }
49554
f088ec60bed5 8164781: Pattern.asPredicate specification is incomplete
vtheeyarath
parents: 48853
diff changeset
  4688
        if (!p.test("word1234")) {
f088ec60bed5 8164781: Pattern.asPredicate specification is incomplete
vtheeyarath
parents: 48853
diff changeset
  4689
            failCount++;
f088ec60bed5 8164781: Pattern.asPredicate specification is incomplete
vtheeyarath
parents: 48853
diff changeset
  4690
        }
17447
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4691
        report("Pattern.asPredicate");
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4692
    }
25523
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4693
49763
1ccf5fae9664 8184692: add Pattern.asMatchPredicate
vtheeyarath
parents: 49554
diff changeset
  4694
    // This test is for 8184692
1ccf5fae9664 8184692: add Pattern.asMatchPredicate
vtheeyarath
parents: 49554
diff changeset
  4695
    private static void patternAsMatchPredicate() throws Exception {
1ccf5fae9664 8184692: add Pattern.asMatchPredicate
vtheeyarath
parents: 49554
diff changeset
  4696
        Predicate<String> p = Pattern.compile("[a-z]+").asMatchPredicate();
1ccf5fae9664 8184692: add Pattern.asMatchPredicate
vtheeyarath
parents: 49554
diff changeset
  4697
1ccf5fae9664 8184692: add Pattern.asMatchPredicate
vtheeyarath
parents: 49554
diff changeset
  4698
        if (p.test("")) {
1ccf5fae9664 8184692: add Pattern.asMatchPredicate
vtheeyarath
parents: 49554
diff changeset
  4699
            failCount++;
1ccf5fae9664 8184692: add Pattern.asMatchPredicate
vtheeyarath
parents: 49554
diff changeset
  4700
        }
1ccf5fae9664 8184692: add Pattern.asMatchPredicate
vtheeyarath
parents: 49554
diff changeset
  4701
        if (!p.test("word")) {
1ccf5fae9664 8184692: add Pattern.asMatchPredicate
vtheeyarath
parents: 49554
diff changeset
  4702
            failCount++;
1ccf5fae9664 8184692: add Pattern.asMatchPredicate
vtheeyarath
parents: 49554
diff changeset
  4703
        }
1ccf5fae9664 8184692: add Pattern.asMatchPredicate
vtheeyarath
parents: 49554
diff changeset
  4704
        if (p.test("1234word")) {
1ccf5fae9664 8184692: add Pattern.asMatchPredicate
vtheeyarath
parents: 49554
diff changeset
  4705
            failCount++;
1ccf5fae9664 8184692: add Pattern.asMatchPredicate
vtheeyarath
parents: 49554
diff changeset
  4706
        }
1ccf5fae9664 8184692: add Pattern.asMatchPredicate
vtheeyarath
parents: 49554
diff changeset
  4707
        if (p.test("1234")) {
1ccf5fae9664 8184692: add Pattern.asMatchPredicate
vtheeyarath
parents: 49554
diff changeset
  4708
            failCount++;
1ccf5fae9664 8184692: add Pattern.asMatchPredicate
vtheeyarath
parents: 49554
diff changeset
  4709
        }
1ccf5fae9664 8184692: add Pattern.asMatchPredicate
vtheeyarath
parents: 49554
diff changeset
  4710
        report("Pattern.asMatchPredicate");
1ccf5fae9664 8184692: add Pattern.asMatchPredicate
vtheeyarath
parents: 49554
diff changeset
  4711
    }
1ccf5fae9664 8184692: add Pattern.asMatchPredicate
vtheeyarath
parents: 49554
diff changeset
  4712
1ccf5fae9664 8184692: add Pattern.asMatchPredicate
vtheeyarath
parents: 49554
diff changeset
  4713
25523
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4714
    // This test is for 8035975
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4715
    private static void invalidFlags() throws Exception {
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4716
        for (int flag = 1; flag != 0; flag <<= 1) {
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4717
            switch (flag) {
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4718
            case Pattern.CASE_INSENSITIVE:
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4719
            case Pattern.MULTILINE:
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4720
            case Pattern.DOTALL:
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4721
            case Pattern.UNICODE_CASE:
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4722
            case Pattern.CANON_EQ:
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4723
            case Pattern.UNIX_LINES:
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4724
            case Pattern.LITERAL:
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4725
            case Pattern.UNICODE_CHARACTER_CLASS:
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4726
            case Pattern.COMMENTS:
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4727
                // valid flag, continue
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4728
                break;
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4729
            default:
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4730
                try {
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4731
                    Pattern.compile(".", flag);
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4732
                    failCount++;
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4733
                } catch (IllegalArgumentException expected) {
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4734
                }
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4735
            }
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4736
        }
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4737
        report("Invalid compile flags");
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4738
    }
35783
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4739
38777
826eb7091523 8158482: regex UNICODE_CHARACTER_CLASS flag cannot be disabled with an embedded flag expression
sherman
parents: 38450
diff changeset
  4740
    // This test is for 8158482
826eb7091523 8158482: regex UNICODE_CHARACTER_CLASS flag cannot be disabled with an embedded flag expression
sherman
parents: 38450
diff changeset
  4741
    private static void embeddedFlags() throws Exception {
826eb7091523 8158482: regex UNICODE_CHARACTER_CLASS flag cannot be disabled with an embedded flag expression
sherman
parents: 38450
diff changeset
  4742
        try {
826eb7091523 8158482: regex UNICODE_CHARACTER_CLASS flag cannot be disabled with an embedded flag expression
sherman
parents: 38450
diff changeset
  4743
            Pattern.compile("(?i).(?-i).");
826eb7091523 8158482: regex UNICODE_CHARACTER_CLASS flag cannot be disabled with an embedded flag expression
sherman
parents: 38450
diff changeset
  4744
            Pattern.compile("(?m).(?-m).");
826eb7091523 8158482: regex UNICODE_CHARACTER_CLASS flag cannot be disabled with an embedded flag expression
sherman
parents: 38450
diff changeset
  4745
            Pattern.compile("(?s).(?-s).");
826eb7091523 8158482: regex UNICODE_CHARACTER_CLASS flag cannot be disabled with an embedded flag expression
sherman
parents: 38450
diff changeset
  4746
            Pattern.compile("(?d).(?-d).");
826eb7091523 8158482: regex UNICODE_CHARACTER_CLASS flag cannot be disabled with an embedded flag expression
sherman
parents: 38450
diff changeset
  4747
            Pattern.compile("(?u).(?-u).");
826eb7091523 8158482: regex UNICODE_CHARACTER_CLASS flag cannot be disabled with an embedded flag expression
sherman
parents: 38450
diff changeset
  4748
            Pattern.compile("(?c).(?-c).");
826eb7091523 8158482: regex UNICODE_CHARACTER_CLASS flag cannot be disabled with an embedded flag expression
sherman
parents: 38450
diff changeset
  4749
            Pattern.compile("(?x).(?-x).");
826eb7091523 8158482: regex UNICODE_CHARACTER_CLASS flag cannot be disabled with an embedded flag expression
sherman
parents: 38450
diff changeset
  4750
            Pattern.compile("(?U).(?-U).");
826eb7091523 8158482: regex UNICODE_CHARACTER_CLASS flag cannot be disabled with an embedded flag expression
sherman
parents: 38450
diff changeset
  4751
            Pattern.compile("(?imsducxU).(?-imsducxU).");
826eb7091523 8158482: regex UNICODE_CHARACTER_CLASS flag cannot be disabled with an embedded flag expression
sherman
parents: 38450
diff changeset
  4752
        } catch (PatternSyntaxException x) {
826eb7091523 8158482: regex UNICODE_CHARACTER_CLASS flag cannot be disabled with an embedded flag expression
sherman
parents: 38450
diff changeset
  4753
            failCount++;
826eb7091523 8158482: regex UNICODE_CHARACTER_CLASS flag cannot be disabled with an embedded flag expression
sherman
parents: 38450
diff changeset
  4754
        }
826eb7091523 8158482: regex UNICODE_CHARACTER_CLASS flag cannot be disabled with an embedded flag expression
sherman
parents: 38450
diff changeset
  4755
        report("Embedded flags");
826eb7091523 8158482: regex UNICODE_CHARACTER_CLASS flag cannot be disabled with an embedded flag expression
sherman
parents: 38450
diff changeset
  4756
    }
826eb7091523 8158482: regex UNICODE_CHARACTER_CLASS flag cannot be disabled with an embedded flag expression
sherman
parents: 38450
diff changeset
  4757
35783
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4758
    private static void grapheme() throws Exception {
55013
8dae495a59e7 8221431: Support for Unicode 12.1
naoto
parents: 49763
diff changeset
  4759
        Files.lines(UCDFiles.GRAPHEME_BREAK_TEST)
35783
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4760
            .filter( ln -> ln.length() != 0 && !ln.startsWith("#") )
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4761
            .forEach( ln -> {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4762
                    ln = ln.replaceAll("\\s+|\\([a-zA-Z]+\\)|\\[[a-zA-Z]]+\\]|#.*", "");
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4763
                    // System.out.println(str);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4764
                    String[] strs = ln.split("\u00f7|\u00d7");
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4765
                    StringBuilder src = new StringBuilder();
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4766
                    ArrayList<String> graphemes = new ArrayList<>();
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4767
                    StringBuilder buf = new StringBuilder();
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4768
                    int offBk = 0;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4769
                    for (String str : strs) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4770
                        if (str.length() == 0)  // first empty str
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4771
                            continue;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4772
                        int cp = Integer.parseInt(str, 16);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4773
                        src.appendCodePoint(cp);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4774
                        buf.appendCodePoint(cp);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4775
                        offBk += (str.length() + 1);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4776
                        if (ln.charAt(offBk) == '\u00f7') {    // DIV
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4777
                            graphemes.add(buf.toString());
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4778
                            buf = new StringBuilder();
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4779
                        }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4780
                    }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4781
                    Pattern p = Pattern.compile("\\X");
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4782
                    Matcher m = p.matcher(src.toString());
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4783
                    Scanner s = new Scanner(src.toString()).useDelimiter("\\b{g}");
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4784
                    for (String g : graphemes) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4785
                        // System.out.printf("     grapheme:=[%s]%n", g);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4786
                        // (1) test \\X directly
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4787
                        if (!m.find() || !m.group().equals(g)) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4788
                            System.out.println("Failed \\X [" + ln + "] : " + g);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4789
                            failCount++;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4790
                        }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4791
                        // (2) test \\b{g} + \\X  via Scanner
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4792
                        boolean hasNext = s.hasNext(p);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4793
                        // if (!s.hasNext() || !s.next().equals(next)) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4794
                        if (!s.hasNext(p) || !s.next(p).equals(g)) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4795
                            System.out.println("Failed b{g} [" + ln + "] : " + g);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4796
                            failCount++;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4797
                        }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4798
                    }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4799
                });
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4800
        // some sanity checks
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4801
        if (!Pattern.compile("\\X{10}").matcher("abcdefghij").matches() ||
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4802
            !Pattern.compile("\\b{g}(?:\\X\\b{g}){5}\\b{g}").matcher("abcde").matches() ||
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4803
            !Pattern.compile("(?:\\X\\b{g}){2}").matcher("\ud800\udc00\ud801\udc02").matches())
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4804
            failCount++;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4805
        // make sure "\b{n}" still works
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4806
        if (!Pattern.compile("\\b{1}hello\\b{1} \\b{1}world\\b{1}").matcher("hello world").matches())
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4807
            failCount++;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4808
        report("Unicode extended grapheme cluster");
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4809
    }
37882
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4810
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4811
    // hangup/timeout if go into exponential backtracking
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4812
    private static void expoBacktracking() throws Exception {
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4813
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4814
        Object[][] patternMatchers = {
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4815
            // 6328855
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4816
            { "(.*\n*)*",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4817
              "this little fine string lets\r\njava.lang.String.matches\r\ncrash\r\n(We don't know why but adding \r* to the regex makes it work again)",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4818
              false },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4819
            // 6192895
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4820
            { " *([a-zA-Z0-9/\\-\\?:\\(\\)\\.,'\\+\\{\\}]+ *)+",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4821
              "Hello World this is a test this is a test this is a test A",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4822
              true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4823
            { " *([a-zA-Z0-9/\\-\\?:\\(\\)\\.,'\\+\\{\\}]+ *)+",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4824
              "Hello World this is a test this is a test this is a test \u4e00 ",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4825
              false },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4826
            { " *([a-z0-9]+ *)+",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4827
              "hello world this is a test this is a test this is a test A",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4828
              false },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4829
            // 4771934 [FIXED] #5013651?
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4830
            { "^(\\w+([\\.-]?\\w+)*@\\w+([\\.-]?\\w+)*(\\.\\w{2,4})+[,;]?)+$",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4831
              "abc@efg.abc,efg@abc.abc,abc@xyz.mno;abc@sdfsd.com",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4832
              true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4833
            // 4866249 [FIXED]
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4834
            { "<\\s*" + "(meta|META)" + "(\\s|[^>])+" + "(CHARSET|charset)=" + "(\\s|[^>])+>",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4835
              "<META http-equiv=\"Content-Type\" content=\"text/html; charset=ISO-8859-5\">",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4836
              true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4837
            { "^(\\w+([\\.-]?\\w+)*@\\w+([\\.-]?\\w+)*(\\.\\w{2,4})+[,;]?)+$",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4838
              "abc@efg.abc,efg@abc.abc,abc@xyz.mno;sdfsd.com",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4839
              false },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4840
            // 6345469
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4841
            { "((<[^>]+>)?(((\\s)?)*(\\&nbsp;)?)*((\\s)?)*)+",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4842
              "&nbsp;&nbsp; < br/> &nbsp; < / p> <p> <html> <adfasfdasdf>&nbsp; </p>",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4843
              true }, // --> matched
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4844
            { "((<[^>]+>)?(((\\s)?)*(\\&nbsp;)?)*((\\s)?)*)+",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4845
              "&nbsp;&nbsp; < br/> &nbsp; < / p> <p> <html> <adfasfdasdf>&nbsp; p </p>",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4846
              false },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4847
            // 5026912
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4848
            { "^\\s*" + "(\\w|\\d|[\\xC0-\\xFF]|/)+" + "\\s+|$",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4849
              "156580451111112225588087755221111111566969655555555",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4850
              false},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4851
            // 6988218
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4852
            { "^([+-]?((0[xX](\\p{XDigit}+))|(((\\p{Digit}+)(\\.)?((\\p{Digit}+)?)([eE][+-]?(\\p{Digit}+))?)|(\\.((\\p{Digit}+))([eE][+-]?(\\p{Digit}+))?)))|[n|N]?'([^']*(?:'')*[^']*)*')",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4853
              "'%)) order by ANGEBOT.ID",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4854
              false},    // find
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4855
            // 6693451
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4856
            { "^(\\s*foo\\s*)*$",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4857
              "foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4858
              true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4859
            { "^(\\s*foo\\s*)*$",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4860
              "foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo fo",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4861
              false
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4862
            },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4863
            // 7006761
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4864
            { "(([0-9A-Z]+)([_]?+)*)*", "FOOOOO_BAAAR_FOOOOOOOOO_BA_", true},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4865
            { "(([0-9A-Z]+)([_]?+)*)*", "FOOOOO_BAAAR_FOOOOOOOOO_BA_ ", false},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4866
            // 8140212
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4867
            { "(?<before>.*)\\{(?<reflection>\\w+):(?<innerMethod>\\w+(\\.?\\w+(\\(((?<args>(('[^']*')|((/|\\w)+))(,(('[^']*')|((/|\\w)+)))*))?\\))?)*)\\}(?<after>.*)",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4868
              "{CeGlobal:getSodCutoff.getGui.getAmqp.getSimpleModeEnabled()",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4869
              false
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4870
            },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4871
            { "^(a+)+$", "aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa", true},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4872
            { "^(a+)+$", "aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa!", false},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4873
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4874
            { "(x+)*y",  "xxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxy", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4875
            { "(x+)*y",  "xxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxz", false},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4876
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4877
            { "(x+x+)+y", "xxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxy", true},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4878
            { "(x+x+)+y", "xxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxz", false},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4879
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4880
            { "(([0-9A-Z]+)([_]?+)*)*", "--------------------------------------", false},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4881
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4882
            /* not fixed
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4883
            //8132141   --->    second level exponential backtracking
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4884
            { "(h|h|ih(((i|a|c|c|a|i|i|j|b|a|i|b|a|a|j))+h)ahbfhba|c|i)*",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4885
              "hchcchicihcchciiicichhcichcihcchiihichiciiiihhcchicchhcihchcihiihciichhccciccichcichiihcchcihhicchcciicchcccihiiihhihihihichicihhcciccchihhhcchichchciihiicihciihcccciciccicciiiiiiiiicihhhiiiihchccchchhhhiiihchihcccchhhiiiiiiiicicichicihcciciihichhhhchihciiihhiccccccciciihhichiccchhicchicihihccichicciihcichccihhiciccccccccichhhhihihhcchchihihiihhihihihicichihiiiihhhhihhhchhichiicihhiiiiihchccccchichci" },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4886
            */
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4887
        };
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4888
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4889
        for (Object[] pm : patternMatchers) {
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4890
            String p = (String)pm[0];
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4891
            String s = (String)pm[1];
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4892
            boolean r = (Boolean)pm[2];
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4893
            if (r != Pattern.compile(p).matcher(s).matches()) {
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4894
                failCount++;
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4895
            }
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4896
        }
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4897
    }
48853
84b4ffbba8b0 8197462: Inconsistent exception messages for invalid capturing group names
igerasim
parents: 48491
diff changeset
  4898
84b4ffbba8b0 8197462: Inconsistent exception messages for invalid capturing group names
igerasim
parents: 48491
diff changeset
  4899
    private static void invalidGroupName() {
84b4ffbba8b0 8197462: Inconsistent exception messages for invalid capturing group names
igerasim
parents: 48491
diff changeset
  4900
        // Invalid start of a group name
84b4ffbba8b0 8197462: Inconsistent exception messages for invalid capturing group names
igerasim
parents: 48491
diff changeset
  4901
        for (String groupName : List.of("", ".", "0", "\u0040", "\u005b",
84b4ffbba8b0 8197462: Inconsistent exception messages for invalid capturing group names
igerasim
parents: 48491
diff changeset
  4902
                "\u0060", "\u007b", "\u0416")) {
84b4ffbba8b0 8197462: Inconsistent exception messages for invalid capturing group names
igerasim
parents: 48491
diff changeset
  4903
            for (String pat : List.of("(?<" + groupName + ">)",
84b4ffbba8b0 8197462: Inconsistent exception messages for invalid capturing group names
igerasim
parents: 48491
diff changeset
  4904
                    "\\k<" + groupName + ">")) {
84b4ffbba8b0 8197462: Inconsistent exception messages for invalid capturing group names
igerasim
parents: 48491
diff changeset
  4905
                try {
84b4ffbba8b0 8197462: Inconsistent exception messages for invalid capturing group names
igerasim
parents: 48491
diff changeset
  4906
                    Pattern.compile(pat);
84b4ffbba8b0 8197462: Inconsistent exception messages for invalid capturing group names
igerasim
parents: 48491
diff changeset
  4907
                    failCount++;
84b4ffbba8b0 8197462: Inconsistent exception messages for invalid capturing group names
igerasim
parents: 48491
diff changeset
  4908
                } catch (PatternSyntaxException e) {
84b4ffbba8b0 8197462: Inconsistent exception messages for invalid capturing group names
igerasim
parents: 48491
diff changeset
  4909
                    if (!e.getMessage().startsWith(
84b4ffbba8b0 8197462: Inconsistent exception messages for invalid capturing group names
igerasim
parents: 48491
diff changeset
  4910
                            "capturing group name does not start with a"
84b4ffbba8b0 8197462: Inconsistent exception messages for invalid capturing group names
igerasim
parents: 48491
diff changeset
  4911
                            + " Latin letter")) {
84b4ffbba8b0 8197462: Inconsistent exception messages for invalid capturing group names
igerasim
parents: 48491
diff changeset
  4912
                        failCount++;
84b4ffbba8b0 8197462: Inconsistent exception messages for invalid capturing group names
igerasim
parents: 48491
diff changeset
  4913
                    }
84b4ffbba8b0 8197462: Inconsistent exception messages for invalid capturing group names
igerasim
parents: 48491
diff changeset
  4914
                }
84b4ffbba8b0 8197462: Inconsistent exception messages for invalid capturing group names
igerasim
parents: 48491
diff changeset
  4915
            }
84b4ffbba8b0 8197462: Inconsistent exception messages for invalid capturing group names
igerasim
parents: 48491
diff changeset
  4916
        }
84b4ffbba8b0 8197462: Inconsistent exception messages for invalid capturing group names
igerasim
parents: 48491
diff changeset
  4917
        // Invalid char in a group name
84b4ffbba8b0 8197462: Inconsistent exception messages for invalid capturing group names
igerasim
parents: 48491
diff changeset
  4918
        for (String groupName : List.of("a.", "b\u0040", "c\u005b",
84b4ffbba8b0 8197462: Inconsistent exception messages for invalid capturing group names
igerasim
parents: 48491
diff changeset
  4919
                "d\u0060", "e\u007b", "f\u0416")) {
84b4ffbba8b0 8197462: Inconsistent exception messages for invalid capturing group names
igerasim
parents: 48491
diff changeset
  4920
            for (String pat : List.of("(?<" + groupName + ">)",
84b4ffbba8b0 8197462: Inconsistent exception messages for invalid capturing group names
igerasim
parents: 48491
diff changeset
  4921
                    "\\k<" + groupName + ">")) {
84b4ffbba8b0 8197462: Inconsistent exception messages for invalid capturing group names
igerasim
parents: 48491
diff changeset
  4922
                try {
84b4ffbba8b0 8197462: Inconsistent exception messages for invalid capturing group names
igerasim
parents: 48491
diff changeset
  4923
                    Pattern.compile(pat);
84b4ffbba8b0 8197462: Inconsistent exception messages for invalid capturing group names
igerasim
parents: 48491
diff changeset
  4924
                    failCount++;
84b4ffbba8b0 8197462: Inconsistent exception messages for invalid capturing group names
igerasim
parents: 48491
diff changeset
  4925
                } catch (PatternSyntaxException e) {
84b4ffbba8b0 8197462: Inconsistent exception messages for invalid capturing group names
igerasim
parents: 48491
diff changeset
  4926
                    if (!e.getMessage().startsWith(
84b4ffbba8b0 8197462: Inconsistent exception messages for invalid capturing group names
igerasim
parents: 48491
diff changeset
  4927
                            "named capturing group is missing trailing '>'")) {
84b4ffbba8b0 8197462: Inconsistent exception messages for invalid capturing group names
igerasim
parents: 48491
diff changeset
  4928
                        failCount++;
84b4ffbba8b0 8197462: Inconsistent exception messages for invalid capturing group names
igerasim
parents: 48491
diff changeset
  4929
                    }
84b4ffbba8b0 8197462: Inconsistent exception messages for invalid capturing group names
igerasim
parents: 48491
diff changeset
  4930
                }
84b4ffbba8b0 8197462: Inconsistent exception messages for invalid capturing group names
igerasim
parents: 48491
diff changeset
  4931
            }
84b4ffbba8b0 8197462: Inconsistent exception messages for invalid capturing group names
igerasim
parents: 48491
diff changeset
  4932
        }
84b4ffbba8b0 8197462: Inconsistent exception messages for invalid capturing group names
igerasim
parents: 48491
diff changeset
  4933
        report("Invalid capturing group names");
84b4ffbba8b0 8197462: Inconsistent exception messages for invalid capturing group names
igerasim
parents: 48491
diff changeset
  4934
    }
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4935
}