jdk/test/java/util/regex/RegExTest.java
author sherman
Fri, 20 May 2016 12:47:41 -0700
changeset 38450 516990ff3a4c
parent 37882 e7f3cf12e739
child 38777 826eb7091523
permissions -rw-r--r--
8143282: \p{Cn} unassigned code points should be included in \p{C} Summary: to add unassigned cp support into \p{C} Reviewed-by: martin
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
     1
/*
31645
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
     2
 * Copyright (c) 1999, 2015, Oracle and/or its affiliates. All rights reserved.
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
     3
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
     4
 *
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
     5
 * This code is free software; you can redistribute it and/or modify it
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
     6
 * under the terms of the GNU General Public License version 2 only, as
21596
0e3a39f29dbc 8027696: Incorrect copyright header in the tests
serb
parents: 19604
diff changeset
     7
 * published by the Free Software Foundation.
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
     8
 *
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
     9
 * This code is distributed in the hope that it will be useful, but WITHOUT
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    10
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    11
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    12
 * version 2 for more details (a copy is included in the LICENSE file that
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    13
 * accompanied this code).
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    14
 *
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    15
 * You should have received a copy of the GNU General Public License version
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    16
 * 2 along with this work; if not, write to the Free Software Foundation,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    17
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    18
 *
5506
202f599c92aa 6943119: Rebrand source copyright notices
ohair
parents: 5295
diff changeset
    19
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
202f599c92aa 6943119: Rebrand source copyright notices
ohair
parents: 5295
diff changeset
    20
 * or visit www.oracle.com if you need additional information or have any
202f599c92aa 6943119: Rebrand source copyright notices
ohair
parents: 5295
diff changeset
    21
 * questions.
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    22
 */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    23
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    24
/**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    25
 * @test
30370
984bf40cdc67 8079419: Update to RegEx test to use random number library
darcy
parents: 30046
diff changeset
    26
 * @summary tests RegExp framework (use -Dseed=X to set PRNG seed)
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    27
 * @author Mike McCloskey
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    28
 * @bug 4481568 4482696 4495089 4504687 4527731 4599621 4631553 4619345
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    29
 * 4630911 4672616 4711773 4727935 4750573 4792284 4803197 4757029 4808962
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    30
 * 4872664 4803179 4892980 4900747 4945394 4938995 4979006 4994840 4997476
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    31
 * 5013885 5003322 4988891 5098443 5110268 6173522 4829857 5027748 6376940
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    32
 * 6358731 6178785 6284152 6231989 6497148 6486934 6233084 6504326 6635133
11287
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
    33
 * 6350801 6676425 6878475 6919132 6931676 6948903 6990617 7014645 7039066
21668
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
    34
 * 7067045 7014640 7189363 8007395 8013252 8013254 8012646 8023647 6559590
35783
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
    35
 * 8027645 8035076 8039124 8035975 8074678 6854417 8143854 8147531 7071819
37882
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
    36
 * 8151481 4867170 7080302 6728861 6995635 6736245 4916384
38450
516990ff3a4c 8143282: \p{Cn} unassigned code points should be included in \p{C}
sherman
parents: 37882
diff changeset
    37
 * 6328855 6192895 6345469 6988218 6693451 7006761 8140212 8143282
37882
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
    38
 *
30370
984bf40cdc67 8079419: Update to RegEx test to use random number library
darcy
parents: 30046
diff changeset
    39
 * @library /lib/testlibrary
984bf40cdc67 8079419: Update to RegEx test to use random number library
darcy
parents: 30046
diff changeset
    40
 * @build jdk.testlibrary.*
984bf40cdc67 8079419: Update to RegEx test to use random number library
darcy
parents: 30046
diff changeset
    41
 * @run main RegExTest
31645
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
    42
 * @key randomness
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    43
 */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    44
29243
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
    45
import java.util.function.Function;
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    46
import java.util.regex.*;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    47
import java.util.Random;
35783
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
    48
import java.util.Scanner;
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    49
import java.io.*;
35783
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
    50
import java.nio.file.*;
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    51
import java.util.*;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    52
import java.nio.CharBuffer;
17447
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
    53
import java.util.function.Predicate;
30436
17827057ef5a 8079782: RandomFactory should be in the jdk.testlibrary package
chegar
parents: 30375
diff changeset
    54
import jdk.testlibrary.RandomFactory;
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    55
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    56
/**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    57
 * This is a test class created to check the operation of
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    58
 * the Pattern and Matcher classes.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    59
 */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    60
public class RegExTest {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    61
30370
984bf40cdc67 8079419: Update to RegEx test to use random number library
darcy
parents: 30046
diff changeset
    62
    private static Random generator = RandomFactory.getRandom();
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    63
    private static boolean failure = false;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    64
    private static int failCount = 0;
11287
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
    65
    private static String firstFailure = null;
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    66
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    67
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    68
     * Main to interpret arguments and run several tests.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    69
     *
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    70
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    71
    public static void main(String[] args) throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    72
        // Most of the tests are in a file
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    73
        processFile("TestCases.txt");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    74
        //processFile("PerlCases.txt");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    75
        processFile("BMPTestCases.txt");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    76
        processFile("SupplementaryTestCases.txt");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    77
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    78
        // These test many randomly generated char patterns
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    79
        bm();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    80
        slice();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    81
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    82
        // These are hard to put into the file
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    83
        escapes();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    84
        blankInput();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    85
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    86
        // Substitition tests on randomly generated sequences
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    87
        globalSubstitute();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    88
        stringbufferSubstitute();
23734
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
    89
        stringbuilderSubstitute();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
    90
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    91
        substitutionBasher();
23734
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
    92
        substitutionBasher2();
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    93
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    94
        // Canonical Equivalence
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    95
        ceTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    96
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    97
        // Anchors
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    98
        anchorTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    99
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   100
        // boolean match calls
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   101
        matchesTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   102
        lookingAtTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   103
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   104
        // Pattern API
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   105
        patternMatchesTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   106
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   107
        // Misc
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   108
        lookbehindTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   109
        nullArgumentTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   110
        backRefTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   111
        groupCaptureTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   112
        caretTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   113
        charClassTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   114
        emptyPatternTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   115
        findIntTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   116
        group0Test();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   117
        longPatternTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   118
        octalTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   119
        ampersandTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   120
        negationTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   121
        splitTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   122
        appendTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   123
        caseFoldingTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   124
        commentsTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   125
        unixLinesTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   126
        replaceFirstTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   127
        gTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   128
        zTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   129
        serializeTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   130
        reluctantRepetitionTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   131
        multilineDollarTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   132
        dollarAtEndTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   133
        caretBetweenTerminatorsTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   134
        // This RFE rejected in Tiger numOccurrencesTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   135
        javaCharClassTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   136
        nonCaptureRepetitionTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   137
        notCapturedGroupCurlyMatchTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   138
        escapedSegmentTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   139
        literalPatternTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   140
        literalReplacementTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   141
        regionTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   142
        toStringTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   143
        negatedCharClassTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   144
        findFromTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   145
        boundsTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   146
        unicodeWordBoundsTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   147
        caretAtEndTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   148
        wordSearchTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   149
        hitEndTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   150
        toMatchResultTest();
29503
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   151
        toMatchResultTest2();
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   152
        surrogatesInClassTest();
11287
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   153
        removeQEQuotingTest();
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   154
        namedGroupCaptureTest();
4820
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
   155
        nonBmpClassComplementTest();
5610
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
   156
        unicodePropertiesTest();
8173
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
   157
        unicodeHexNotationTest();
9536
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
   158
        unicodeClassesTest();
35783
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
   159
        unicodeCharacterNameTest();
12675
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
   160
        horizontalAndVerticalWSTest();
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
   161
        linebreakTest();
13554
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
   162
        branchTest();
17183
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
   163
        groupCurlyNotFoundSuppTest();
19604
f96e3aef2081 8023647: "abc1c".matches("(\\w)+1\\1")) returns false
sherman
parents: 17447
diff changeset
   164
        groupCurlyBackoffTest();
17447
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
   165
        patternAsPredicate();
25523
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
   166
        invalidFlags();
35783
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
   167
        grapheme();
37882
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
   168
        expoBacktracking();
21668
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
   169
11287
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   170
        if (failure) {
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   171
            throw new
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   172
                RuntimeException("RegExTest failed, 1st failure: " +
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   173
                                 firstFailure);
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   174
        } else {
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   175
            System.err.println("OKAY: All tests passed.");
11287
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   176
        }
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   177
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   178
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   179
    // Utility functions
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   180
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   181
    private static String getRandomAlphaString(int length) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   182
        StringBuffer buf = new StringBuffer(length);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   183
        for (int i=0; i<length; i++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   184
            char randChar = (char)(97 + generator.nextInt(26));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   185
            buf.append(randChar);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   186
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   187
        return buf.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   188
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   189
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   190
    private static void check(Matcher m, String expected) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   191
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   192
        if (!m.group().equals(expected))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   193
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   194
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   195
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   196
    private static void check(Matcher m, String result, boolean expected) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   197
        m.find();
8173
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
   198
        if (m.group().equals(result) != expected)
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
   199
            failCount++;
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   200
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   201
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   202
    private static void check(Pattern p, String s, boolean expected) {
8173
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
   203
        if (p.matcher(s).find() != expected)
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
   204
            failCount++;
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
   205
    }
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
   206
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
   207
    private static void check(String p, String s, boolean expected) {
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
   208
        Matcher matcher = Pattern.compile(p).matcher(s);
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
   209
        if (matcher.find() != expected)
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
   210
            failCount++;
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   211
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   212
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   213
    private static void check(String p, char c, boolean expected) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   214
        String propertyPattern = expected ? "\\p" + p : "\\P" + p;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   215
        Pattern pattern = Pattern.compile(propertyPattern);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   216
        char[] ca = new char[1]; ca[0] = c;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   217
        Matcher matcher = pattern.matcher(new String(ca));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   218
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   219
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   220
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   221
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   222
    private static void check(String p, int codePoint, boolean expected) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   223
        String propertyPattern = expected ? "\\p" + p : "\\P" + p;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   224
        Pattern pattern = Pattern.compile(propertyPattern);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   225
        char[] ca = Character.toChars(codePoint);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   226
        Matcher matcher = pattern.matcher(new String(ca));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   227
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   228
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   229
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   230
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   231
    private static void check(String p, int flag, String input, String s,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   232
                              boolean expected)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   233
    {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   234
        Pattern pattern = Pattern.compile(p, flag);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   235
        Matcher matcher = pattern.matcher(input);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   236
        if (expected)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   237
            check(matcher, s, expected);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   238
        else
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   239
            check(pattern, input, false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   240
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   241
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   242
    private static void report(String testName) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   243
        int spacesToAdd = 30 - testName.length();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   244
        StringBuffer paddedNameBuffer = new StringBuffer(testName);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   245
        for (int i=0; i<spacesToAdd; i++)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   246
            paddedNameBuffer.append(" ");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   247
        String paddedName = paddedNameBuffer.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   248
        System.err.println(paddedName + ": " +
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   249
                           (failCount==0 ? "Passed":"Failed("+failCount+")"));
11287
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   250
        if (failCount > 0) {
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   251
            failure = true;
11287
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   252
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   253
            if (firstFailure == null) {
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   254
                firstFailure = testName;
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   255
            }
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   256
        }
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   257
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   258
        failCount = 0;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   259
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   260
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   261
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   262
     * Converts ASCII alphabet characters [A-Za-z] in the given 's' to
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   263
     * supplementary characters. This method does NOT fully take care
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   264
     * of the regex syntax.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   265
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   266
    private static String toSupplementaries(String s) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   267
        int length = s.length();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   268
        StringBuffer sb = new StringBuffer(length * 2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   269
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   270
        for (int i = 0; i < length; ) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   271
            char c = s.charAt(i++);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   272
            if (c == '\\') {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   273
                sb.append(c);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   274
                if (i < length) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   275
                    c = s.charAt(i++);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   276
                    sb.append(c);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   277
                    if (c == 'u') {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   278
                        // assume no syntax error
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   279
                        sb.append(s.charAt(i++));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   280
                        sb.append(s.charAt(i++));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   281
                        sb.append(s.charAt(i++));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   282
                        sb.append(s.charAt(i++));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   283
                    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   284
                }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   285
            } else if ((c >= 'A' && c <= 'Z') || (c >= 'a' && c <= 'z')) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   286
                sb.append('\ud800').append((char)('\udc00'+c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   287
            } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   288
                sb.append(c);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   289
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   290
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   291
        return sb.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   292
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   293
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   294
    // Regular expression tests
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   295
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   296
    // This is for bug 6178785
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   297
    // Test if an expected NPE gets thrown when passing in a null argument
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   298
    private static boolean check(Runnable test) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   299
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   300
            test.run();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   301
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   302
            return false;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   303
        } catch (NullPointerException npe) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   304
            return true;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   305
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   306
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   307
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   308
    private static void nullArgumentTest() {
29243
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   309
        check(() -> Pattern.compile(null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   310
        check(() -> Pattern.matches(null, null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   311
        check(() -> Pattern.matches("xyz", null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   312
        check(() -> Pattern.quote(null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   313
        check(() -> Pattern.compile("xyz").split(null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   314
        check(() -> Pattern.compile("xyz").matcher(null));
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   315
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   316
        final Matcher m = Pattern.compile("xyz").matcher("xyz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   317
        m.matches();
29243
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   318
        check(() -> m.appendTail((StringBuffer) null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   319
        check(() -> m.appendTail((StringBuilder)null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   320
        check(() -> m.replaceAll((String) null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   321
        check(() -> m.replaceAll((Function<MatchResult, String>)null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   322
        check(() -> m.replaceFirst((String)null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   323
        check(() -> m.replaceFirst((Function<MatchResult, String>) null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   324
        check(() -> m.appendReplacement((StringBuffer)null, null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   325
        check(() -> m.appendReplacement((StringBuilder)null, null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   326
        check(() -> m.reset(null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   327
        check(() -> Matcher.quoteReplacement(null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   328
        //check(() -> m.usePattern(null));
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   329
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   330
        report("Null Argument");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   331
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   332
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   333
    // This is for bug6635133
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   334
    // Test if surrogate pair in Unicode escapes can be handled correctly.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   335
    private static void surrogatesInClassTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   336
        Pattern pattern = Pattern.compile("[\\ud834\\udd21-\\ud834\\udd24]");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   337
        Matcher matcher = pattern.matcher("\ud834\udd22");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   338
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   339
            failCount++;
11287
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   340
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   341
        report("Surrogate pair in Unicode escape");
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   342
    }
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   343
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   344
    // This is for bug6990617
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   345
    // Test if Pattern.RemoveQEQuoting works correctly if the octal unicode
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   346
    // char encoding is only 2 or 3 digits instead of 4 and the first quoted
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   347
    // char is an octal digit.
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   348
    private static void removeQEQuotingTest() throws Exception {
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   349
        Pattern pattern =
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   350
            Pattern.compile("\\011\\Q1sometext\\E\\011\\Q2sometext\\E");
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   351
        Matcher matcher = pattern.matcher("\t1sometext\t2sometext");
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   352
        if (!matcher.find())
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   353
            failCount++;
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   354
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   355
        report("Remove Q/E Quoting");
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   356
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   357
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   358
    // This is for bug 4988891
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   359
    // Test toMatchResult to see that it is a copy of the Matcher
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   360
    // that is not affected by subsequent operations on the original
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   361
    private static void toMatchResultTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   362
        Pattern pattern = Pattern.compile("squid");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   363
        Matcher matcher = pattern.matcher(
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   364
            "agiantsquidofdestinyasmallsquidoffate");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   365
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   366
        int matcherStart1 = matcher.start();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   367
        MatchResult mr = matcher.toMatchResult();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   368
        if (mr == matcher)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   369
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   370
        int resultStart1 = mr.start();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   371
        if (matcherStart1 != resultStart1)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   372
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   373
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   374
        int matcherStart2 = matcher.start();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   375
        int resultStart2 = mr.start();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   376
        if (matcherStart2 == resultStart2)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   377
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   378
        if (resultStart1 != resultStart2)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   379
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   380
        MatchResult mr2 = matcher.toMatchResult();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   381
        if (mr == mr2)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   382
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   383
        if (mr2.start() != matcherStart2)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   384
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   385
        report("toMatchResult is a copy");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   386
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   387
29503
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   388
    private static void checkExpectedISE(Runnable test) {
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   389
        try {
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   390
            test.run();
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   391
            failCount++;
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   392
        } catch (IllegalStateException x) {
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   393
        } catch (IndexOutOfBoundsException xx) {
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   394
            failCount++;
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   395
        }
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   396
    }
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   397
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   398
    private static void checkExpectedIOOE(Runnable test) {
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   399
        try {
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   400
            test.run();
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   401
            failCount++;
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   402
        } catch (IndexOutOfBoundsException x) {}
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   403
    }
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   404
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   405
    // This is for bug 8074678
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   406
    // Test the result of toMatchResult throws ISE if no match is availble
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   407
    private static void toMatchResultTest2() throws Exception {
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   408
        Matcher matcher = Pattern.compile("nomatch").matcher("hello world");
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   409
        matcher.find();
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   410
        MatchResult mr = matcher.toMatchResult();
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   411
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   412
        checkExpectedISE(() -> mr.start());
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   413
        checkExpectedISE(() -> mr.start(2));
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   414
        checkExpectedISE(() -> mr.end());
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   415
        checkExpectedISE(() -> mr.end(2));
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   416
        checkExpectedISE(() -> mr.group());
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   417
        checkExpectedISE(() -> mr.group(2));
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   418
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   419
        matcher = Pattern.compile("(match)").matcher("there is a match");
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   420
        matcher.find();
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   421
        MatchResult mr2 = matcher.toMatchResult();
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   422
        checkExpectedIOOE(() -> mr2.start(2));
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   423
        checkExpectedIOOE(() -> mr2.end(2));
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   424
        checkExpectedIOOE(() -> mr2.group(2));
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   425
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   426
        report("toMatchResult2 appropriate exceptions");
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   427
    }
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   428
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   429
    // This is for bug 5013885
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   430
    // Must test a slice to see if it reports hitEnd correctly
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   431
    private static void hitEndTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   432
        // Basic test of Slice node
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   433
        Pattern p = Pattern.compile("^squidattack");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   434
        Matcher m = p.matcher("squack");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   435
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   436
        if (m.hitEnd())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   437
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   438
        m.reset("squid");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   439
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   440
        if (!m.hitEnd())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   441
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   442
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   443
        // Test Slice, SliceA and SliceU nodes
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   444
        for (int i=0; i<3; i++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   445
            int flags = 0;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   446
            if (i==1) flags = Pattern.CASE_INSENSITIVE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   447
            if (i==2) flags = Pattern.UNICODE_CASE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   448
            p = Pattern.compile("^abc", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   449
            m = p.matcher("ad");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   450
            m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   451
            if (m.hitEnd())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   452
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   453
            m.reset("ab");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   454
            m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   455
            if (!m.hitEnd())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   456
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   457
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   458
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   459
        // Test Boyer-Moore node
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   460
        p = Pattern.compile("catattack");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   461
        m = p.matcher("attack");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   462
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   463
        if (!m.hitEnd())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   464
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   465
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   466
        p = Pattern.compile("catattack");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   467
        m = p.matcher("attackattackattackcatatta");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   468
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   469
        if (!m.hitEnd())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   470
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   471
        report("hitEnd from a Slice");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   472
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   473
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   474
    // This is for bug 4997476
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   475
    // It is weird code submitted by customer demonstrating a regression
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   476
    private static void wordSearchTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   477
        String testString = new String("word1 word2 word3");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   478
        Pattern p = Pattern.compile("\\b");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   479
        Matcher m = p.matcher(testString);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   480
        int position = 0;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   481
        int start = 0;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   482
        while (m.find(position)) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   483
            start = m.start();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   484
            if (start == testString.length())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   485
                break;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   486
            if (m.find(start+1)) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   487
                position = m.start();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   488
            } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   489
                position = testString.length();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   490
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   491
            if (testString.substring(start, position).equals(" "))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   492
                continue;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   493
            if (!testString.substring(start, position-1).startsWith("word"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   494
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   495
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   496
        report("Customer word search");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   497
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   498
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   499
    // This is for bug 4994840
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   500
    private static void caretAtEndTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   501
        // Problem only occurs with multiline patterns
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   502
        // containing a beginning-of-line caret "^" followed
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   503
        // by an expression that also matches the empty string.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   504
        Pattern pattern = Pattern.compile("^x?", Pattern.MULTILINE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   505
        Matcher matcher = pattern.matcher("\r");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   506
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   507
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   508
        report("Caret at end");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   509
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   510
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   511
    // This test is for 4979006
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   512
    // Check to see if word boundary construct properly handles unicode
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   513
    // non spacing marks
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   514
    private static void unicodeWordBoundsTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   515
        String spaces = "  ";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   516
        String wordChar = "a";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   517
        String nsm = "\u030a";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   518
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   519
        assert (Character.getType('\u030a') == Character.NON_SPACING_MARK);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   520
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   521
        Pattern pattern = Pattern.compile("\\b");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   522
        Matcher matcher = pattern.matcher("");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   523
        // S=other B=word character N=non spacing mark .=word boundary
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   524
        // SS.BB.SS
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   525
        String input = spaces + wordChar + wordChar + spaces;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   526
        twoFindIndexes(input, matcher, 2, 4);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   527
        // SS.BBN.SS
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   528
        input = spaces + wordChar +wordChar + nsm + spaces;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   529
        twoFindIndexes(input, matcher, 2, 5);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   530
        // SS.BN.SS
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   531
        input = spaces + wordChar + nsm + spaces;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   532
        twoFindIndexes(input, matcher, 2, 4);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   533
        // SS.BNN.SS
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   534
        input = spaces + wordChar + nsm + nsm + spaces;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   535
        twoFindIndexes(input, matcher, 2, 5);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   536
        // SSN.BB.SS
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   537
        input = spaces + nsm + wordChar + wordChar + spaces;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   538
        twoFindIndexes(input, matcher, 3, 5);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   539
        // SS.BNB.SS
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   540
        input = spaces + wordChar + nsm + wordChar + spaces;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   541
        twoFindIndexes(input, matcher, 2, 5);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   542
        // SSNNSS
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   543
        input = spaces + nsm + nsm + spaces;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   544
        matcher.reset(input);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   545
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   546
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   547
        // SSN.BBN.SS
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   548
        input = spaces + nsm + wordChar + wordChar + nsm + spaces;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   549
        twoFindIndexes(input, matcher, 3, 6);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   550
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   551
        report("Unicode word boundary");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   552
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   553
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   554
    private static void twoFindIndexes(String input, Matcher matcher, int a,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   555
                                       int b) throws Exception
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   556
    {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   557
        matcher.reset(input);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   558
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   559
        if (matcher.start() != a)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   560
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   561
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   562
        if (matcher.start() != b)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   563
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   564
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   565
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   566
    // This test is for 6284152
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   567
    static void check(String regex, String input, String[] expected) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   568
        List<String> result = new ArrayList<String>();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   569
        Pattern p = Pattern.compile(regex);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   570
        Matcher m = p.matcher(input);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   571
        while (m.find()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   572
            result.add(m.group());
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   573
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   574
        if (!Arrays.asList(expected).equals(result))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   575
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   576
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   577
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   578
    private static void lookbehindTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   579
        //Positive
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   580
        check("(?<=%.{0,5})foo\\d",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   581
              "%foo1\n%bar foo2\n%bar  foo3\n%blahblah foo4\nfoo5",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   582
              new String[]{"foo1", "foo2", "foo3"});
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   583
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   584
        //boundary at end of the lookbehind sub-regex should work consistently
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   585
        //with the boundary just after the lookbehind sub-regex
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   586
        check("(?<=.*\\b)foo", "abcd foo", new String[]{"foo"});
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   587
        check("(?<=.*)\\bfoo", "abcd foo", new String[]{"foo"});
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   588
        check("(?<!abc )\\bfoo", "abc foo", new String[0]);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   589
        check("(?<!abc \\b)foo", "abc foo", new String[0]);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   590
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   591
        //Negative
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   592
        check("(?<!%.{0,5})foo\\d",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   593
              "%foo1\n%bar foo2\n%bar  foo3\n%blahblah foo4\nfoo5",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   594
              new String[] {"foo4", "foo5"});
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   595
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   596
        //Positive greedy
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   597
        check("(?<=%b{1,4})foo", "%bbbbfoo", new String[] {"foo"});
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   598
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   599
        //Positive reluctant
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   600
        check("(?<=%b{1,4}?)foo", "%bbbbfoo", new String[] {"foo"});
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   601
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   602
        //supplementary
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   603
        check("(?<=%b{1,4})fo\ud800\udc00o", "%bbbbfo\ud800\udc00o",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   604
              new String[] {"fo\ud800\udc00o"});
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   605
        check("(?<=%b{1,4}?)fo\ud800\udc00o", "%bbbbfo\ud800\udc00o",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   606
              new String[] {"fo\ud800\udc00o"});
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   607
        check("(?<!%b{1,4})fo\ud800\udc00o", "%afo\ud800\udc00o",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   608
              new String[] {"fo\ud800\udc00o"});
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   609
        check("(?<!%b{1,4}?)fo\ud800\udc00o", "%afo\ud800\udc00o",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   610
              new String[] {"fo\ud800\udc00o"});
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   611
        report("Lookbehind");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   612
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   613
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   614
    // This test is for 4938995
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   615
    // Check to see if weak region boundaries are transparent to
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   616
    // lookahead and lookbehind constructs
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   617
    private static void boundsTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   618
        String fullMessage = "catdogcat";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   619
        Pattern pattern = Pattern.compile("(?<=cat)dog(?=cat)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   620
        Matcher matcher = pattern.matcher("catdogca");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   621
        matcher.useTransparentBounds(true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   622
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   623
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   624
        matcher.reset("atdogcat");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   625
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   626
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   627
        matcher.reset(fullMessage);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   628
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   629
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   630
        matcher.reset(fullMessage);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   631
        matcher.region(0,9);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   632
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   633
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   634
        matcher.reset(fullMessage);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   635
        matcher.region(0,6);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   636
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   637
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   638
        matcher.reset(fullMessage);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   639
        matcher.region(3,6);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   640
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   641
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   642
        matcher.useTransparentBounds(false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   643
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   644
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   645
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   646
        // Negative lookahead/lookbehind
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   647
        pattern = Pattern.compile("(?<!cat)dog(?!cat)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   648
        matcher = pattern.matcher("dogcat");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   649
        matcher.useTransparentBounds(true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   650
        matcher.region(0,3);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   651
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   652
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   653
        matcher.reset("catdog");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   654
        matcher.region(3,6);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   655
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   656
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   657
        matcher.useTransparentBounds(false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   658
        matcher.reset("dogcat");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   659
        matcher.region(0,3);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   660
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   661
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   662
        matcher.reset("catdog");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   663
        matcher.region(3,6);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   664
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   665
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   666
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   667
        report("Region bounds transparency");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   668
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   669
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   670
    // This test is for 4945394
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   671
    private static void findFromTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   672
        String message = "This is 40 $0 message.";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   673
        Pattern pat = Pattern.compile("\\$0");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   674
        Matcher match = pat.matcher(message);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   675
        if (!match.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   676
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   677
        if (match.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   678
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   679
        if (match.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   680
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   681
        report("Check for alternating find");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   682
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   683
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   684
    // This test is for 4872664 and 4892980
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   685
    private static void negatedCharClassTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   686
        Pattern pattern = Pattern.compile("[^>]");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   687
        Matcher matcher = pattern.matcher("\u203A");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   688
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   689
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   690
        pattern = Pattern.compile("[^fr]");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   691
        matcher = pattern.matcher("a");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   692
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   693
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   694
        matcher.reset("\u203A");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   695
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   696
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   697
        String s = "for";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   698
        String result[] = s.split("[^fr]");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   699
        if (!result[0].equals("f"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   700
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   701
        if (!result[1].equals("r"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   702
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   703
        s = "f\u203Ar";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   704
        result = s.split("[^fr]");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   705
        if (!result[0].equals("f"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   706
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   707
        if (!result[1].equals("r"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   708
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   709
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   710
        // Test adding to bits, subtracting a node, then adding to bits again
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   711
        pattern = Pattern.compile("[^f\u203Ar]");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   712
        matcher = pattern.matcher("a");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   713
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   714
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   715
        matcher.reset("f");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   716
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   717
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   718
        matcher.reset("\u203A");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   719
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   720
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   721
        matcher.reset("r");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   722
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   723
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   724
        matcher.reset("\u203B");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   725
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   726
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   727
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   728
        // Test subtracting a node, adding to bits, subtracting again
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   729
        pattern = Pattern.compile("[^\u203Ar\u203B]");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   730
        matcher = pattern.matcher("a");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   731
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   732
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   733
        matcher.reset("\u203A");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   734
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   735
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   736
        matcher.reset("r");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   737
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   738
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   739
        matcher.reset("\u203B");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   740
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   741
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   742
        matcher.reset("\u203C");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   743
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   744
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   745
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   746
        report("Negated Character Class");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   747
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   748
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   749
    // This test is for 4628291
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   750
    private static void toStringTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   751
        Pattern pattern = Pattern.compile("b+");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   752
        if (pattern.toString() != "b+")
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   753
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   754
        Matcher matcher = pattern.matcher("aaabbbccc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   755
        String matcherString = matcher.toString(); // unspecified
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   756
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   757
        matcherString = matcher.toString(); // unspecified
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   758
        matcher.region(0,3);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   759
        matcherString = matcher.toString(); // unspecified
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   760
        matcher.reset();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   761
        matcherString = matcher.toString(); // unspecified
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   762
        report("toString");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   763
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   764
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   765
    // This test is for 4808962
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   766
    private static void literalPatternTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   767
        int flags = Pattern.LITERAL;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   768
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   769
        Pattern pattern = Pattern.compile("abc\\t$^", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   770
        check(pattern, "abc\\t$^", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   771
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   772
        pattern = Pattern.compile(Pattern.quote("abc\\t$^"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   773
        check(pattern, "abc\\t$^", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   774
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   775
        pattern = Pattern.compile("\\Qa^$bcabc\\E", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   776
        check(pattern, "\\Qa^$bcabc\\E", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   777
        check(pattern, "a^$bcabc", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   778
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   779
        pattern = Pattern.compile("\\\\Q\\\\E");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   780
        check(pattern, "\\Q\\E", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   781
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   782
        pattern = Pattern.compile("\\Qabc\\Eefg\\\\Q\\\\Ehij");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   783
        check(pattern, "abcefg\\Q\\Ehij", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   784
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   785
        pattern = Pattern.compile("\\\\\\Q\\\\E");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   786
        check(pattern, "\\\\\\\\", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   787
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   788
        pattern = Pattern.compile(Pattern.quote("\\Qa^$bcabc\\E"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   789
        check(pattern, "\\Qa^$bcabc\\E", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   790
        check(pattern, "a^$bcabc", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   791
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   792
        pattern = Pattern.compile(Pattern.quote("\\Qabc\\Edef"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   793
        check(pattern, "\\Qabc\\Edef", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   794
        check(pattern, "abcdef", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   795
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   796
        pattern = Pattern.compile(Pattern.quote("abc\\Edef"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   797
        check(pattern, "abc\\Edef", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   798
        check(pattern, "abcdef", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   799
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   800
        pattern = Pattern.compile(Pattern.quote("\\E"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   801
        check(pattern, "\\E", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   802
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   803
        pattern = Pattern.compile("((((abc.+?:)", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   804
        check(pattern, "((((abc.+?:)", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   805
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   806
        flags |= Pattern.MULTILINE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   807
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   808
        pattern = Pattern.compile("^cat$", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   809
        check(pattern, "abc^cat$def", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   810
        check(pattern, "cat", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   811
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   812
        flags |= Pattern.CASE_INSENSITIVE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   813
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   814
        pattern = Pattern.compile("abcdef", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   815
        check(pattern, "ABCDEF", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   816
        check(pattern, "AbCdEf", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   817
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   818
        flags |= Pattern.DOTALL;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   819
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   820
        pattern = Pattern.compile("a...b", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   821
        check(pattern, "A...b", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   822
        check(pattern, "Axxxb", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   823
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   824
        flags |= Pattern.CANON_EQ;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   825
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   826
        Pattern p = Pattern.compile("testa\u030a", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   827
        check(pattern, "testa\u030a", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   828
        check(pattern, "test\u00e5", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   829
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   830
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   831
        flags = Pattern.LITERAL;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   832
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   833
        pattern = Pattern.compile(toSupplementaries("abc\\t$^"), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   834
        check(pattern, toSupplementaries("abc\\t$^"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   835
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   836
        pattern = Pattern.compile(Pattern.quote(toSupplementaries("abc\\t$^")));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   837
        check(pattern, toSupplementaries("abc\\t$^"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   838
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   839
        pattern = Pattern.compile(toSupplementaries("\\Qa^$bcabc\\E"), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   840
        check(pattern, toSupplementaries("\\Qa^$bcabc\\E"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   841
        check(pattern, toSupplementaries("a^$bcabc"), false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   842
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   843
        pattern = Pattern.compile(Pattern.quote(toSupplementaries("\\Qa^$bcabc\\E")));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   844
        check(pattern, toSupplementaries("\\Qa^$bcabc\\E"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   845
        check(pattern, toSupplementaries("a^$bcabc"), false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   846
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   847
        pattern = Pattern.compile(Pattern.quote(toSupplementaries("\\Qabc\\Edef")));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   848
        check(pattern, toSupplementaries("\\Qabc\\Edef"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   849
        check(pattern, toSupplementaries("abcdef"), false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   850
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   851
        pattern = Pattern.compile(Pattern.quote(toSupplementaries("abc\\Edef")));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   852
        check(pattern, toSupplementaries("abc\\Edef"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   853
        check(pattern, toSupplementaries("abcdef"), false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   854
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   855
        pattern = Pattern.compile(toSupplementaries("((((abc.+?:)"), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   856
        check(pattern, toSupplementaries("((((abc.+?:)"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   857
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   858
        flags |= Pattern.MULTILINE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   859
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   860
        pattern = Pattern.compile(toSupplementaries("^cat$"), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   861
        check(pattern, toSupplementaries("abc^cat$def"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   862
        check(pattern, toSupplementaries("cat"), false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   863
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   864
        flags |= Pattern.DOTALL;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   865
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   866
        // note: this is case-sensitive.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   867
        pattern = Pattern.compile(toSupplementaries("a...b"), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   868
        check(pattern, toSupplementaries("a...b"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   869
        check(pattern, toSupplementaries("axxxb"), false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   870
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   871
        flags |= Pattern.CANON_EQ;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   872
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   873
        String t = toSupplementaries("test");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   874
        p = Pattern.compile(t + "a\u030a", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   875
        check(pattern, t + "a\u030a", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   876
        check(pattern, t + "\u00e5", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   877
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   878
        report("Literal pattern");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   879
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   880
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   881
    // This test is for 4803179
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   882
    // This test is also for 4808962, replacement parts
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   883
    private static void literalReplacementTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   884
        int flags = Pattern.LITERAL;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   885
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   886
        Pattern pattern = Pattern.compile("abc", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   887
        Matcher matcher = pattern.matcher("zzzabczzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   888
        String replaceTest = "$0";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   889
        String result = matcher.replaceAll(replaceTest);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   890
        if (!result.equals("zzzabczzz"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   891
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   892
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   893
        matcher.reset();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   894
        String literalReplacement = matcher.quoteReplacement(replaceTest);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   895
        result = matcher.replaceAll(literalReplacement);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   896
        if (!result.equals("zzz$0zzz"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   897
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   898
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   899
        matcher.reset();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   900
        replaceTest = "\\t$\\$";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   901
        literalReplacement = matcher.quoteReplacement(replaceTest);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   902
        result = matcher.replaceAll(literalReplacement);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   903
        if (!result.equals("zzz\\t$\\$zzz"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   904
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   905
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   906
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   907
        pattern = Pattern.compile(toSupplementaries("abc"), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   908
        matcher = pattern.matcher(toSupplementaries("zzzabczzz"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   909
        replaceTest = "$0";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   910
        result = matcher.replaceAll(replaceTest);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   911
        if (!result.equals(toSupplementaries("zzzabczzz")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   912
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   913
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   914
        matcher.reset();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   915
        literalReplacement = matcher.quoteReplacement(replaceTest);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   916
        result = matcher.replaceAll(literalReplacement);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   917
        if (!result.equals(toSupplementaries("zzz$0zzz")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   918
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   919
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   920
        matcher.reset();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   921
        replaceTest = "\\t$\\$";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   922
        literalReplacement = matcher.quoteReplacement(replaceTest);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   923
        result = matcher.replaceAll(literalReplacement);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   924
        if (!result.equals(toSupplementaries("zzz\\t$\\$zzz")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   925
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   926
12432
748fcaa0e0c1 7067045: replaceAll("\u20ac", "$"); causses java.lang.StringIndexOutOfBoundsExceptio
sherman
parents: 11287
diff changeset
   927
        // IAE should be thrown if backslash or '$' is the last character
748fcaa0e0c1 7067045: replaceAll("\u20ac", "$"); causses java.lang.StringIndexOutOfBoundsExceptio
sherman
parents: 11287
diff changeset
   928
        // in replacement string
748fcaa0e0c1 7067045: replaceAll("\u20ac", "$"); causses java.lang.StringIndexOutOfBoundsExceptio
sherman
parents: 11287
diff changeset
   929
        try {
748fcaa0e0c1 7067045: replaceAll("\u20ac", "$"); causses java.lang.StringIndexOutOfBoundsExceptio
sherman
parents: 11287
diff changeset
   930
            "\uac00".replaceAll("\uac00", "$");
12675
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
   931
            failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
   932
        } catch (IllegalArgumentException iie) {
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
   933
        } catch (Exception e) {
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
   934
            failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
   935
        }
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
   936
        try {
12432
748fcaa0e0c1 7067045: replaceAll("\u20ac", "$"); causses java.lang.StringIndexOutOfBoundsExceptio
sherman
parents: 11287
diff changeset
   937
            "\uac00".replaceAll("\uac00", "\\");
748fcaa0e0c1 7067045: replaceAll("\u20ac", "$"); causses java.lang.StringIndexOutOfBoundsExceptio
sherman
parents: 11287
diff changeset
   938
            failCount++;
748fcaa0e0c1 7067045: replaceAll("\u20ac", "$"); causses java.lang.StringIndexOutOfBoundsExceptio
sherman
parents: 11287
diff changeset
   939
        } catch (IllegalArgumentException iie) {
748fcaa0e0c1 7067045: replaceAll("\u20ac", "$"); causses java.lang.StringIndexOutOfBoundsExceptio
sherman
parents: 11287
diff changeset
   940
        } catch (Exception e) {
748fcaa0e0c1 7067045: replaceAll("\u20ac", "$"); causses java.lang.StringIndexOutOfBoundsExceptio
sherman
parents: 11287
diff changeset
   941
            failCount++;
748fcaa0e0c1 7067045: replaceAll("\u20ac", "$"); causses java.lang.StringIndexOutOfBoundsExceptio
sherman
parents: 11287
diff changeset
   942
        }
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   943
        report("Literal replacement");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   944
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   945
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   946
    // This test is for 4757029
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   947
    private static void regionTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   948
        Pattern pattern = Pattern.compile("abc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   949
        Matcher matcher = pattern.matcher("abcdefabc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   950
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   951
        matcher.region(0,9);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   952
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   953
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   954
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   955
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   956
        matcher.region(0,3);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   957
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   958
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   959
        matcher.region(3,6);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   960
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   961
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   962
        matcher.region(0,2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   963
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   964
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   965
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   966
        expectRegionFail(matcher, 1, -1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   967
        expectRegionFail(matcher, -1, -1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   968
        expectRegionFail(matcher, -1, 1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   969
        expectRegionFail(matcher, 5, 3);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   970
        expectRegionFail(matcher, 5, 12);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   971
        expectRegionFail(matcher, 12, 12);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   972
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   973
        pattern = Pattern.compile("^abc$");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   974
        matcher = pattern.matcher("zzzabczzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   975
        matcher.region(0,9);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   976
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   977
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   978
        matcher.region(3,6);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   979
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   980
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   981
        matcher.region(3,6);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   982
        matcher.useAnchoringBounds(false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   983
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   984
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   985
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   986
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   987
        pattern = Pattern.compile(toSupplementaries("abc"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   988
        matcher = pattern.matcher(toSupplementaries("abcdefabc"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   989
        matcher.region(0,9*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   990
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   991
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   992
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   993
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   994
        matcher.region(0,3*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   995
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   996
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   997
        matcher.region(1,3*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   998
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   999
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1000
        matcher.region(3*2,6*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1001
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1002
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1003
        matcher.region(0,2*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1004
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1005
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1006
        matcher.region(0,2*2+1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1007
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1008
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1009
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1010
        expectRegionFail(matcher, 1*2, -1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1011
        expectRegionFail(matcher, -1, -1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1012
        expectRegionFail(matcher, -1, 1*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1013
        expectRegionFail(matcher, 5*2, 3*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1014
        expectRegionFail(matcher, 5*2, 12*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1015
        expectRegionFail(matcher, 12*2, 12*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1016
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1017
        pattern = Pattern.compile(toSupplementaries("^abc$"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1018
        matcher = pattern.matcher(toSupplementaries("zzzabczzz"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1019
        matcher.region(0,9*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1020
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1021
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1022
        matcher.region(3*2,6*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1023
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1024
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1025
        matcher.region(3*2+1,6*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1026
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1027
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1028
        matcher.region(3*2,6*2-1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1029
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1030
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1031
        matcher.region(3*2,6*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1032
        matcher.useAnchoringBounds(false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1033
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1034
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1035
        report("Regions");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1036
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1037
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1038
    private static void expectRegionFail(Matcher matcher, int index1,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1039
                                         int index2)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1040
    {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1041
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1042
            matcher.region(index1, index2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1043
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1044
        } catch (IndexOutOfBoundsException ioobe) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1045
            // Correct result
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1046
        } catch (IllegalStateException ise) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1047
            // Correct result
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1048
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1049
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1050
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1051
    // This test is for 4803197
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1052
    private static void escapedSegmentTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1053
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1054
        Pattern pattern = Pattern.compile("\\Qdir1\\dir2\\E");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1055
        check(pattern, "dir1\\dir2", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1056
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1057
        pattern = Pattern.compile("\\Qdir1\\dir2\\\\E");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1058
        check(pattern, "dir1\\dir2\\", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1059
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1060
        pattern = Pattern.compile("(\\Qdir1\\dir2\\\\E)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1061
        check(pattern, "dir1\\dir2\\", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1062
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1063
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1064
        pattern = Pattern.compile(toSupplementaries("\\Qdir1\\dir2\\E"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1065
        check(pattern, toSupplementaries("dir1\\dir2"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1066
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1067
        pattern = Pattern.compile(toSupplementaries("\\Qdir1\\dir2")+"\\\\E");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1068
        check(pattern, toSupplementaries("dir1\\dir2\\"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1069
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1070
        pattern = Pattern.compile(toSupplementaries("(\\Qdir1\\dir2")+"\\\\E)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1071
        check(pattern, toSupplementaries("dir1\\dir2\\"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1072
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1073
        report("Escaped segment");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1074
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1075
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1076
    // This test is for 4792284
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1077
    private static void nonCaptureRepetitionTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1078
        String input = "abcdefgh;";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1079
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1080
        String[] patterns = new String[] {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1081
            "(?:\\w{4})+;",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1082
            "(?:\\w{8})*;",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1083
            "(?:\\w{2}){2,4};",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1084
            "(?:\\w{4}){2,};",   // only matches the
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1085
            ".*?(?:\\w{5})+;",   //     specified minimum
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1086
            ".*?(?:\\w{9})*;",   //     number of reps - OK
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1087
            "(?:\\w{4})+?;",     // lazy repetition - OK
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1088
            "(?:\\w{4})++;",     // possessive repetition - OK
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1089
            "(?:\\w{2,}?)+;",    // non-deterministic - OK
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1090
            "(\\w{4})+;",        // capturing group - OK
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1091
        };
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1092
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1093
        for (int i = 0; i < patterns.length; i++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1094
            // Check find()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1095
            check(patterns[i], 0, input, input, true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1096
            // Check matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1097
            Pattern p = Pattern.compile(patterns[i]);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1098
            Matcher m = p.matcher(input);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1099
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1100
            if (m.matches()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1101
                if (!m.group(0).equals(input))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1102
                    failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1103
            } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1104
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1105
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1106
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1107
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1108
        report("Non capturing repetition");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1109
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1110
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1111
    // This test is for 6358731
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1112
    private static void notCapturedGroupCurlyMatchTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1113
        Pattern pattern = Pattern.compile("(abc)+|(abcd)+");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1114
        Matcher matcher = pattern.matcher("abcd");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1115
        if (!matcher.matches() ||
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1116
             matcher.group(1) != null ||
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1117
             !matcher.group(2).equals("abcd")) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1118
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1119
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1120
        report("Not captured GroupCurly");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1121
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1122
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1123
    // This test is for 4706545
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1124
    private static void javaCharClassTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1125
        for (int i=0; i<1000; i++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1126
            char c = (char)generator.nextInt();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1127
            check("{javaLowerCase}", c, Character.isLowerCase(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1128
            check("{javaUpperCase}", c, Character.isUpperCase(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1129
            check("{javaUpperCase}+", c, Character.isUpperCase(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1130
            check("{javaTitleCase}", c, Character.isTitleCase(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1131
            check("{javaDigit}", c, Character.isDigit(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1132
            check("{javaDefined}", c, Character.isDefined(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1133
            check("{javaLetter}", c, Character.isLetter(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1134
            check("{javaLetterOrDigit}", c, Character.isLetterOrDigit(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1135
            check("{javaJavaIdentifierStart}", c,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1136
                  Character.isJavaIdentifierStart(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1137
            check("{javaJavaIdentifierPart}", c,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1138
                  Character.isJavaIdentifierPart(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1139
            check("{javaUnicodeIdentifierStart}", c,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1140
                  Character.isUnicodeIdentifierStart(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1141
            check("{javaUnicodeIdentifierPart}", c,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1142
                  Character.isUnicodeIdentifierPart(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1143
            check("{javaIdentifierIgnorable}", c,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1144
                  Character.isIdentifierIgnorable(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1145
            check("{javaSpaceChar}", c, Character.isSpaceChar(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1146
            check("{javaWhitespace}", c, Character.isWhitespace(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1147
            check("{javaISOControl}", c, Character.isISOControl(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1148
            check("{javaMirrored}", c, Character.isMirrored(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1149
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1150
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1151
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1152
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1153
        for (int i=0; i<1000; i++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1154
            int c = generator.nextInt(Character.MAX_CODE_POINT
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1155
                                      - Character.MIN_SUPPLEMENTARY_CODE_POINT)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1156
                        + Character.MIN_SUPPLEMENTARY_CODE_POINT;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1157
            check("{javaLowerCase}", c, Character.isLowerCase(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1158
            check("{javaUpperCase}", c, Character.isUpperCase(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1159
            check("{javaUpperCase}+", c, Character.isUpperCase(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1160
            check("{javaTitleCase}", c, Character.isTitleCase(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1161
            check("{javaDigit}", c, Character.isDigit(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1162
            check("{javaDefined}", c, Character.isDefined(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1163
            check("{javaLetter}", c, Character.isLetter(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1164
            check("{javaLetterOrDigit}", c, Character.isLetterOrDigit(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1165
            check("{javaJavaIdentifierStart}", c,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1166
                  Character.isJavaIdentifierStart(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1167
            check("{javaJavaIdentifierPart}", c,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1168
                  Character.isJavaIdentifierPart(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1169
            check("{javaUnicodeIdentifierStart}", c,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1170
                  Character.isUnicodeIdentifierStart(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1171
            check("{javaUnicodeIdentifierPart}", c,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1172
                  Character.isUnicodeIdentifierPart(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1173
            check("{javaIdentifierIgnorable}", c,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1174
                  Character.isIdentifierIgnorable(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1175
            check("{javaSpaceChar}", c, Character.isSpaceChar(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1176
            check("{javaWhitespace}", c, Character.isWhitespace(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1177
            check("{javaISOControl}", c, Character.isISOControl(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1178
            check("{javaMirrored}", c, Character.isMirrored(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1179
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1180
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1181
        report("Java character classes");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1182
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1183
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1184
    // This test is for 4523620
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1185
    /*
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1186
    private static void numOccurrencesTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1187
        Pattern pattern = Pattern.compile("aaa");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1188
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1189
        if (pattern.numOccurrences("aaaaaa", false) != 2)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1190
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1191
        if (pattern.numOccurrences("aaaaaa", true) != 4)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1192
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1193
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1194
        pattern = Pattern.compile("^");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1195
        if (pattern.numOccurrences("aaaaaa", false) != 1)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1196
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1197
        if (pattern.numOccurrences("aaaaaa", true) != 1)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1198
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1199
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1200
        report("Number of Occurrences");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1201
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1202
    */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1203
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1204
    // This test is for 4776374
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1205
    private static void caretBetweenTerminatorsTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1206
        int flags1 = Pattern.DOTALL;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1207
        int flags2 = Pattern.DOTALL | Pattern.UNIX_LINES;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1208
        int flags3 = Pattern.DOTALL | Pattern.UNIX_LINES | Pattern.MULTILINE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1209
        int flags4 = Pattern.DOTALL | Pattern.MULTILINE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1210
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1211
        check("^....", flags1, "test\ntest", "test", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1212
        check(".....^", flags1, "test\ntest", "test", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1213
        check(".....^", flags1, "test\n", "test", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1214
        check("....^", flags1, "test\r\n", "test", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1215
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1216
        check("^....", flags2, "test\ntest", "test", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1217
        check("....^", flags2, "test\ntest", "test", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1218
        check(".....^", flags2, "test\n", "test", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1219
        check("....^", flags2, "test\r\n", "test", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1220
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1221
        check("^....", flags3, "test\ntest", "test", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1222
        check(".....^", flags3, "test\ntest", "test\n", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1223
        check(".....^", flags3, "test\u0085test", "test\u0085", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1224
        check(".....^", flags3, "test\n", "test", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1225
        check(".....^", flags3, "test\r\n", "test", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1226
        check("......^", flags3, "test\r\ntest", "test\r\n", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1227
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1228
        check("^....", flags4, "test\ntest", "test", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1229
        check(".....^", flags3, "test\ntest", "test\n", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1230
        check(".....^", flags4, "test\u0085test", "test\u0085", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1231
        check(".....^", flags4, "test\n", "test\n", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1232
        check(".....^", flags4, "test\r\n", "test\r", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1233
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1234
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1235
        String t = toSupplementaries("test");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1236
        check("^....", flags1, t+"\n"+t, t, true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1237
        check(".....^", flags1, t+"\n"+t, t, false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1238
        check(".....^", flags1, t+"\n", t, false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1239
        check("....^", flags1, t+"\r\n", t, false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1240
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1241
        check("^....", flags2, t+"\n"+t, t, true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1242
        check("....^", flags2, t+"\n"+t, t, false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1243
        check(".....^", flags2, t+"\n", t, false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1244
        check("....^", flags2, t+"\r\n", t, false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1245
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1246
        check("^....", flags3, t+"\n"+t, t, true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1247
        check(".....^", flags3, t+"\n"+t, t+"\n", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1248
        check(".....^", flags3, t+"\u0085"+t, t+"\u0085", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1249
        check(".....^", flags3, t+"\n", t, false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1250
        check(".....^", flags3, t+"\r\n", t, false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1251
        check("......^", flags3, t+"\r\n"+t, t+"\r\n", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1252
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1253
        check("^....", flags4, t+"\n"+t, t, true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1254
        check(".....^", flags3, t+"\n"+t, t+"\n", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1255
        check(".....^", flags4, t+"\u0085"+t, t+"\u0085", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1256
        check(".....^", flags4, t+"\n", t+"\n", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1257
        check(".....^", flags4, t+"\r\n", t+"\r", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1258
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1259
        report("Caret between terminators");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1260
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1261
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1262
    // This test is for 4727935
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1263
    private static void dollarAtEndTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1264
        int flags1 = Pattern.DOTALL;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1265
        int flags2 = Pattern.DOTALL | Pattern.UNIX_LINES;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1266
        int flags3 = Pattern.DOTALL | Pattern.MULTILINE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1267
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1268
        check("....$", flags1, "test\n", "test", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1269
        check("....$", flags1, "test\r\n", "test", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1270
        check(".....$", flags1, "test\n", "test\n", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1271
        check(".....$", flags1, "test\u0085", "test\u0085", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1272
        check("....$", flags1, "test\u0085", "test", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1273
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1274
        check("....$", flags2, "test\n", "test", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1275
        check(".....$", flags2, "test\n", "test\n", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1276
        check(".....$", flags2, "test\u0085", "test\u0085", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1277
        check("....$", flags2, "test\u0085", "est\u0085", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1278
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1279
        check("....$.blah", flags3, "test\nblah", "test\nblah", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1280
        check(".....$.blah", flags3, "test\n\nblah", "test\n\nblah", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1281
        check("....$blah", flags3, "test\nblah", "!!!!", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1282
        check(".....$blah", flags3, "test\nblah", "!!!!", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1283
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1284
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1285
        String t = toSupplementaries("test");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1286
        String b = toSupplementaries("blah");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1287
        check("....$", flags1, t+"\n", t, true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1288
        check("....$", flags1, t+"\r\n", t, true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1289
        check(".....$", flags1, t+"\n", t+"\n", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1290
        check(".....$", flags1, t+"\u0085", t+"\u0085", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1291
        check("....$", flags1, t+"\u0085", t, true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1292
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1293
        check("....$", flags2, t+"\n", t, true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1294
        check(".....$", flags2, t+"\n", t+"\n", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1295
        check(".....$", flags2, t+"\u0085", t+"\u0085", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1296
        check("....$", flags2, t+"\u0085", toSupplementaries("est\u0085"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1297
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1298
        check("....$."+b, flags3, t+"\n"+b, t+"\n"+b, true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1299
        check(".....$."+b, flags3, t+"\n\n"+b, t+"\n\n"+b, true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1300
        check("....$"+b, flags3, t+"\n"+b, "!!!!", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1301
        check(".....$"+b, flags3, t+"\n"+b, "!!!!", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1302
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1303
        report("Dollar at End");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1304
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1305
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1306
    // This test is for 4711773
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1307
    private static void multilineDollarTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1308
        Pattern findCR = Pattern.compile("$", Pattern.MULTILINE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1309
        Matcher matcher = findCR.matcher("first bit\nsecond bit");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1310
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1311
        if (matcher.start(0) != 9)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1312
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1313
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1314
        if (matcher.start(0) != 20)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1315
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1316
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1317
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1318
        matcher = findCR.matcher(toSupplementaries("first  bit\n second  bit")); // double BMP chars
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1319
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1320
        if (matcher.start(0) != 9*2)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1321
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1322
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1323
        if (matcher.start(0) != 20*2)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1324
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1325
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1326
        report("Multiline Dollar");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1327
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1328
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1329
    private static void reluctantRepetitionTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1330
        Pattern p = Pattern.compile("1(\\s\\S+?){1,3}?[\\s,]2");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1331
        check(p, "1 word word word 2", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1332
        check(p, "1 wor wo w 2", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1333
        check(p, "1 word word 2", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1334
        check(p, "1 word 2", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1335
        check(p, "1 wo w w 2", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1336
        check(p, "1 wo w 2", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1337
        check(p, "1 wor w 2", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1338
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1339
        p = Pattern.compile("([a-z])+?c");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1340
        Matcher m = p.matcher("ababcdefdec");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1341
        check(m, "ababc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1342
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1343
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1344
        p = Pattern.compile(toSupplementaries("([a-z])+?c"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1345
        m = p.matcher(toSupplementaries("ababcdefdec"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1346
        check(m, toSupplementaries("ababc"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1347
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1348
        report("Reluctant Repetition");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1349
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1350
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1351
    private static void serializeTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1352
        String patternStr = "(b)";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1353
        String matchStr = "b";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1354
        Pattern pattern = Pattern.compile(patternStr);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1355
        ByteArrayOutputStream baos = new ByteArrayOutputStream();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1356
        ObjectOutputStream oos = new ObjectOutputStream(baos);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1357
        oos.writeObject(pattern);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1358
        oos.close();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1359
        ObjectInputStream ois = new ObjectInputStream(
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1360
            new ByteArrayInputStream(baos.toByteArray()));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1361
        Pattern serializedPattern = (Pattern)ois.readObject();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1362
        ois.close();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1363
        Matcher matcher = serializedPattern.matcher(matchStr);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1364
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1365
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1366
        if (matcher.groupCount() != 1)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1367
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1368
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1369
        report("Serialization");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1370
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1371
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1372
    private static void gTest() {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1373
        Pattern pattern = Pattern.compile("\\G\\w");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1374
        Matcher matcher = pattern.matcher("abc#x#x");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1375
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1376
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1377
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1378
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1379
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1380
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1381
        pattern = Pattern.compile("\\GA*");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1382
        matcher = pattern.matcher("1A2AA3");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1383
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1384
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1385
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1386
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1387
        pattern = Pattern.compile("\\GA*");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1388
        matcher = pattern.matcher("1A2AA3");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1389
        if (!matcher.find(1))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1390
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1391
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1392
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1393
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1394
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1395
        report("\\G");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1396
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1397
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1398
    private static void zTest() {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1399
        Pattern pattern = Pattern.compile("foo\\Z");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1400
        // Positives
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1401
        check(pattern, "foo\u0085", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1402
        check(pattern, "foo\u2028", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1403
        check(pattern, "foo\u2029", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1404
        check(pattern, "foo\n", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1405
        check(pattern, "foo\r", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1406
        check(pattern, "foo\r\n", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1407
        // Negatives
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1408
        check(pattern, "fooo", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1409
        check(pattern, "foo\n\r", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1410
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1411
        pattern = Pattern.compile("foo\\Z", Pattern.UNIX_LINES);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1412
        // Positives
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1413
        check(pattern, "foo", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1414
        check(pattern, "foo\n", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1415
        // Negatives
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1416
        check(pattern, "foo\r", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1417
        check(pattern, "foo\u0085", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1418
        check(pattern, "foo\u2028", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1419
        check(pattern, "foo\u2029", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1420
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1421
        report("\\Z");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1422
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1423
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1424
    private static void replaceFirstTest() {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1425
        Pattern pattern = Pattern.compile("(ab)(c*)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1426
        Matcher matcher = pattern.matcher("abccczzzabcczzzabccc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1427
        if (!matcher.replaceFirst("test").equals("testzzzabcczzzabccc"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1428
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1429
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1430
        matcher.reset("zzzabccczzzabcczzzabccczzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1431
        if (!matcher.replaceFirst("test").equals("zzztestzzzabcczzzabccczzz"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1432
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1433
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1434
        matcher.reset("zzzabccczzzabcczzzabccczzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1435
        String result = matcher.replaceFirst("$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1436
        if (!result.equals("zzzabzzzabcczzzabccczzz"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1437
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1438
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1439
        matcher.reset("zzzabccczzzabcczzzabccczzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1440
        result = matcher.replaceFirst("$2");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1441
        if (!result.equals("zzzccczzzabcczzzabccczzz"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1442
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1443
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1444
        pattern = Pattern.compile("a*");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1445
        matcher = pattern.matcher("aaaaaaaaaa");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1446
        if (!matcher.replaceFirst("test").equals("test"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1447
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1448
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1449
        pattern = Pattern.compile("a+");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1450
        matcher = pattern.matcher("zzzaaaaaaaaaa");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1451
        if (!matcher.replaceFirst("test").equals("zzztest"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1452
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1453
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1454
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1455
        pattern = Pattern.compile(toSupplementaries("(ab)(c*)"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1456
        matcher = pattern.matcher(toSupplementaries("abccczzzabcczzzabccc"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1457
        if (!matcher.replaceFirst(toSupplementaries("test"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1458
                .equals(toSupplementaries("testzzzabcczzzabccc")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1459
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1460
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1461
        matcher.reset(toSupplementaries("zzzabccczzzabcczzzabccczzz"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1462
        if (!matcher.replaceFirst(toSupplementaries("test")).
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1463
            equals(toSupplementaries("zzztestzzzabcczzzabccczzz")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1464
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1465
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1466
        matcher.reset(toSupplementaries("zzzabccczzzabcczzzabccczzz"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1467
        result = matcher.replaceFirst("$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1468
        if (!result.equals(toSupplementaries("zzzabzzzabcczzzabccczzz")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1469
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1470
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1471
        matcher.reset(toSupplementaries("zzzabccczzzabcczzzabccczzz"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1472
        result = matcher.replaceFirst("$2");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1473
        if (!result.equals(toSupplementaries("zzzccczzzabcczzzabccczzz")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1474
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1475
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1476
        pattern = Pattern.compile(toSupplementaries("a*"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1477
        matcher = pattern.matcher(toSupplementaries("aaaaaaaaaa"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1478
        if (!matcher.replaceFirst(toSupplementaries("test")).equals(toSupplementaries("test")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1479
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1480
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1481
        pattern = Pattern.compile(toSupplementaries("a+"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1482
        matcher = pattern.matcher(toSupplementaries("zzzaaaaaaaaaa"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1483
        if (!matcher.replaceFirst(toSupplementaries("test")).equals(toSupplementaries("zzztest")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1484
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1485
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1486
        report("Replace First");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1487
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1488
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1489
    private static void unixLinesTest() {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1490
        Pattern pattern = Pattern.compile(".*");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1491
        Matcher matcher = pattern.matcher("aa\u2028blah");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1492
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1493
        if (!matcher.group(0).equals("aa"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1494
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1495
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1496
        pattern = Pattern.compile(".*", Pattern.UNIX_LINES);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1497
        matcher = pattern.matcher("aa\u2028blah");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1498
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1499
        if (!matcher.group(0).equals("aa\u2028blah"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1500
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1501
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1502
        pattern = Pattern.compile("[az]$",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1503
                                  Pattern.MULTILINE | Pattern.UNIX_LINES);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1504
        matcher = pattern.matcher("aa\u2028zz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1505
        check(matcher, "a\u2028", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1506
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1507
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1508
        pattern = Pattern.compile(".*");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1509
        matcher = pattern.matcher(toSupplementaries("aa\u2028blah"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1510
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1511
        if (!matcher.group(0).equals(toSupplementaries("aa")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1512
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1513
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1514
        pattern = Pattern.compile(".*", Pattern.UNIX_LINES);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1515
        matcher = pattern.matcher(toSupplementaries("aa\u2028blah"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1516
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1517
        if (!matcher.group(0).equals(toSupplementaries("aa\u2028blah")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1518
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1519
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1520
        pattern = Pattern.compile(toSupplementaries("[az]$"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1521
                                  Pattern.MULTILINE | Pattern.UNIX_LINES);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1522
        matcher = pattern.matcher(toSupplementaries("aa\u2028zz"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1523
        check(matcher, toSupplementaries("a\u2028"), false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1524
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1525
        report("Unix Lines");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1526
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1527
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1528
    private static void commentsTest() {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1529
        int flags = Pattern.COMMENTS;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1530
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1531
        Pattern pattern = Pattern.compile("aa \\# aa", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1532
        Matcher matcher = pattern.matcher("aa#aa");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1533
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1534
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1535
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1536
        pattern = Pattern.compile("aa  # blah", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1537
        matcher = pattern.matcher("aa");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1538
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1539
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1540
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1541
        pattern = Pattern.compile("aa blah", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1542
        matcher = pattern.matcher("aablah");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1543
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1544
             failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1545
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1546
        pattern = Pattern.compile("aa  # blah blech  ", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1547
        matcher = pattern.matcher("aa");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1548
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1549
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1550
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1551
        pattern = Pattern.compile("aa  # blah\n  ", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1552
        matcher = pattern.matcher("aa");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1553
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1554
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1555
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1556
        pattern = Pattern.compile("aa  # blah\nbc # blech", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1557
        matcher = pattern.matcher("aabc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1558
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1559
             failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1560
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1561
        pattern = Pattern.compile("aa  # blah\nbc# blech", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1562
        matcher = pattern.matcher("aabc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1563
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1564
             failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1565
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1566
        pattern = Pattern.compile("aa  # blah\nbc\\# blech", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1567
        matcher = pattern.matcher("aabc#blech");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1568
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1569
             failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1570
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1571
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1572
        pattern = Pattern.compile(toSupplementaries("aa \\# aa"), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1573
        matcher = pattern.matcher(toSupplementaries("aa#aa"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1574
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1575
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1576
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1577
        pattern = Pattern.compile(toSupplementaries("aa  # blah"), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1578
        matcher = pattern.matcher(toSupplementaries("aa"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1579
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1580
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1581
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1582
        pattern = Pattern.compile(toSupplementaries("aa blah"), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1583
        matcher = pattern.matcher(toSupplementaries("aablah"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1584
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1585
             failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1586
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1587
        pattern = Pattern.compile(toSupplementaries("aa  # blah blech  "), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1588
        matcher = pattern.matcher(toSupplementaries("aa"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1589
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1590
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1591
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1592
        pattern = Pattern.compile(toSupplementaries("aa  # blah\n  "), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1593
        matcher = pattern.matcher(toSupplementaries("aa"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1594
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1595
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1596
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1597
        pattern = Pattern.compile(toSupplementaries("aa  # blah\nbc # blech"), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1598
        matcher = pattern.matcher(toSupplementaries("aabc"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1599
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1600
             failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1601
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1602
        pattern = Pattern.compile(toSupplementaries("aa  # blah\nbc# blech"), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1603
        matcher = pattern.matcher(toSupplementaries("aabc"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1604
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1605
             failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1606
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1607
        pattern = Pattern.compile(toSupplementaries("aa  # blah\nbc\\# blech"), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1608
        matcher = pattern.matcher(toSupplementaries("aabc#blech"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1609
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1610
             failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1611
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1612
        report("Comments");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1613
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1614
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1615
    private static void caseFoldingTest() { // bug 4504687
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1616
        int flags = Pattern.CASE_INSENSITIVE | Pattern.UNICODE_CASE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1617
        Pattern pattern = Pattern.compile("aa", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1618
        Matcher matcher = pattern.matcher("ab");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1619
        if (matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1620
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1621
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1622
        pattern = Pattern.compile("aA", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1623
        matcher = pattern.matcher("ab");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1624
        if (matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1625
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1626
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1627
        pattern = Pattern.compile("aa", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1628
        matcher = pattern.matcher("aB");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1629
        if (matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1630
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1631
        matcher = pattern.matcher("Ab");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1632
        if (matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1633
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1634
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1635
        // ASCII               "a"
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1636
        // Latin-1 Supplement  "a" + grave
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1637
        // Cyrillic            "a"
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1638
        String[] patterns = new String[] {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1639
            //single
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1640
            "a", "\u00e0", "\u0430",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1641
            //slice
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1642
            "ab", "\u00e0\u00e1", "\u0430\u0431",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1643
            //class single
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1644
            "[a]", "[\u00e0]", "[\u0430]",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1645
            //class range
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1646
            "[a-b]", "[\u00e0-\u00e5]", "[\u0430-\u0431]",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1647
            //back reference
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1648
            "(a)\\1", "(\u00e0)\\1", "(\u0430)\\1"
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1649
        };
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1650
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1651
        String[] texts = new String[] {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1652
            "A", "\u00c0", "\u0410",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1653
            "AB", "\u00c0\u00c1", "\u0410\u0411",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1654
            "A", "\u00c0", "\u0410",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1655
            "B", "\u00c2", "\u0411",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1656
            "aA", "\u00e0\u00c0", "\u0430\u0410"
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1657
        };
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1658
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1659
        boolean[] expected = new boolean[] {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1660
            true, false, false,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1661
            true, false, false,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1662
            true, false, false,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1663
            true, false, false,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1664
            true, false, false
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1665
        };
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1666
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1667
        flags = Pattern.CASE_INSENSITIVE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1668
        for (int i = 0; i < patterns.length; i++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1669
            pattern = Pattern.compile(patterns[i], flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1670
            matcher = pattern.matcher(texts[i]);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1671
            if (matcher.matches() != expected[i]) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1672
                System.out.println("<1> Failed at " + i);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1673
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1674
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1675
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1676
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1677
        flags = Pattern.CASE_INSENSITIVE | Pattern.UNICODE_CASE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1678
        for (int i = 0; i < patterns.length; i++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1679
            pattern = Pattern.compile(patterns[i], flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1680
            matcher = pattern.matcher(texts[i]);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1681
            if (!matcher.matches()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1682
                System.out.println("<2> Failed at " + i);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1683
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1684
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1685
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1686
        // flag unicode_case alone should do nothing
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1687
        flags = Pattern.UNICODE_CASE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1688
        for (int i = 0; i < patterns.length; i++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1689
            pattern = Pattern.compile(patterns[i], flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1690
            matcher = pattern.matcher(texts[i]);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1691
            if (matcher.matches()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1692
                System.out.println("<3> Failed at " + i);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1693
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1694
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1695
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1696
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1697
        // Special cases: i, I, u+0131 and u+0130
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1698
        flags = Pattern.UNICODE_CASE | Pattern.CASE_INSENSITIVE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1699
        pattern = Pattern.compile("[h-j]+", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1700
        if (!pattern.matcher("\u0131\u0130").matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1701
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1702
        report("Case Folding");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1703
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1704
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1705
    private static void appendTest() {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1706
        Pattern pattern = Pattern.compile("(ab)(cd)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1707
        Matcher matcher = pattern.matcher("abcd");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1708
        String result = matcher.replaceAll("$2$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1709
        if (!result.equals("cdab"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1710
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1711
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1712
        String  s1 = "Swap all: first = 123, second = 456";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1713
        String  s2 = "Swap one: first = 123, second = 456";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1714
        String  r  = "$3$2$1";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1715
        pattern = Pattern.compile("([a-z]+)( *= *)([0-9]+)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1716
        matcher = pattern.matcher(s1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1717
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1718
        result = matcher.replaceAll(r);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1719
        if (!result.equals("Swap all: 123 = first, 456 = second"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1720
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1721
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1722
        matcher = pattern.matcher(s2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1723
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1724
        if (matcher.find()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1725
            StringBuffer sb = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1726
            matcher.appendReplacement(sb, r);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1727
            matcher.appendTail(sb);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1728
            result = sb.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1729
            if (!result.equals("Swap one: 123 = first, second = 456"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1730
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1731
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1732
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1733
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1734
        pattern = Pattern.compile(toSupplementaries("(ab)(cd)"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1735
        matcher = pattern.matcher(toSupplementaries("abcd"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1736
        result = matcher.replaceAll("$2$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1737
        if (!result.equals(toSupplementaries("cdab")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1738
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1739
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1740
        s1 = toSupplementaries("Swap all: first = 123, second = 456");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1741
        s2 = toSupplementaries("Swap one: first = 123, second = 456");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1742
        r  = toSupplementaries("$3$2$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1743
        pattern = Pattern.compile(toSupplementaries("([a-z]+)( *= *)([0-9]+)"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1744
        matcher = pattern.matcher(s1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1745
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1746
        result = matcher.replaceAll(r);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1747
        if (!result.equals(toSupplementaries("Swap all: 123 = first, 456 = second")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1748
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1749
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1750
        matcher = pattern.matcher(s2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1751
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1752
        if (matcher.find()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1753
            StringBuffer sb = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1754
            matcher.appendReplacement(sb, r);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1755
            matcher.appendTail(sb);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1756
            result = sb.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1757
            if (!result.equals(toSupplementaries("Swap one: 123 = first, second = 456")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1758
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1759
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1760
        report("Append");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1761
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1762
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1763
    private static void splitTest() {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1764
        Pattern pattern = Pattern.compile(":");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1765
        String[] result = pattern.split("foo:and:boo", 2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1766
        if (!result[0].equals("foo"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1767
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1768
        if (!result[1].equals("and:boo"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1769
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1770
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1771
        Pattern patternX = Pattern.compile(toSupplementaries("X"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1772
        result = patternX.split(toSupplementaries("fooXandXboo"), 2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1773
        if (!result[0].equals(toSupplementaries("foo")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1774
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1775
        if (!result[1].equals(toSupplementaries("andXboo")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1776
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1777
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1778
        CharBuffer cb = CharBuffer.allocate(100);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1779
        cb.put("foo:and:boo");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1780
        cb.flip();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1781
        result = pattern.split(cb);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1782
        if (!result[0].equals("foo"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1783
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1784
        if (!result[1].equals("and"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1785
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1786
        if (!result[2].equals("boo"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1787
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1788
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1789
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1790
        CharBuffer cbs = CharBuffer.allocate(100);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1791
        cbs.put(toSupplementaries("fooXandXboo"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1792
        cbs.flip();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1793
        result = patternX.split(cbs);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1794
        if (!result[0].equals(toSupplementaries("foo")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1795
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1796
        if (!result[1].equals(toSupplementaries("and")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1797
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1798
        if (!result[2].equals(toSupplementaries("boo")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1799
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1800
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1801
        String source = "0123456789";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1802
        for (int limit=-2; limit<3; limit++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1803
            for (int x=0; x<10; x++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1804
                result = source.split(Integer.toString(x), limit);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1805
                int expectedLength = limit < 1 ? 2 : limit;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1806
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1807
                if ((limit == 0) && (x == 9)) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1808
                    // expected dropping of ""
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1809
                    if (result.length != 1)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1810
                        failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1811
                    if (!result[0].equals("012345678")) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1812
                        failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1813
                    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1814
                } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1815
                    if (result.length != expectedLength) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1816
                        failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1817
                    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1818
                    if (!result[0].equals(source.substring(0,x))) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1819
                        if (limit != 1) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1820
                            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1821
                        } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1822
                            if (!result[0].equals(source.substring(0,10))) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1823
                                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1824
                            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1825
                        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1826
                    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1827
                    if (expectedLength > 1) { // Check segment 2
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1828
                        if (!result[1].equals(source.substring(x+1,10)))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1829
                            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1830
                    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1831
                }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1832
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1833
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1834
        // Check the case for no match found
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1835
        for (int limit=-2; limit<3; limit++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1836
            result = source.split("e", limit);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1837
            if (result.length != 1)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1838
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1839
            if (!result[0].equals(source))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1840
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1841
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1842
        // Check the case for limit == 0, source = "";
21668
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1843
        // split() now returns 0-length for empty source "" see #6559590
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1844
        source = "";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1845
        result = source.split("e", 0);
21670
ca3553133ede 8028321: Fix for String.split() empty input sequence/JDK-6559590 triggers regression
sherman
parents: 21668
diff changeset
  1846
        if (result.length != 1)
ca3553133ede 8028321: Fix for String.split() empty input sequence/JDK-6559590 triggers regression
sherman
parents: 21668
diff changeset
  1847
            failCount++;
ca3553133ede 8028321: Fix for String.split() empty input sequence/JDK-6559590 triggers regression
sherman
parents: 21668
diff changeset
  1848
        if (!result[0].equals(source))
21668
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1849
            failCount++;
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1850
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1851
        // Check both split() and splitAsStraem(), especially for zero-lenth
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1852
        // input and zero-lenth match cases
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1853
        String[][] input = new String[][] {
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1854
            { " ",           "Abc Efg Hij" },   // normal non-zero-match
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1855
            { " ",           " Abc Efg Hij" },  // leading empty str for non-zero-match
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1856
            { " ",           "Abc  Efg Hij" },  // non-zero-match in the middle
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1857
            { "(?=\\p{Lu})", "AbcEfgHij" },     // no leading empty str for zero-match
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1858
            { "(?=\\p{Lu})", "AbcEfg" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1859
            { "(?=\\p{Lu})", "Abc" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1860
            { " ",           "" },              // zero-length input
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1861
            { ".*",          "" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1862
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1863
            // some tests from PatternStreamTest.java
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1864
            { "4",       "awgqwefg1fefw4vssv1vvv1" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1865
            { "\u00a3a", "afbfq\u00a3abgwgb\u00a3awngnwggw\u00a3a\u00a3ahjrnhneerh" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1866
            { "1",       "awgqwefg1fefw4vssv1vvv1" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1867
            { "1",       "a\u4ebafg1fefw\u4eba4\u9f9cvssv\u9f9c1v\u672c\u672cvv" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1868
            { "\u56da",  "1\u56da23\u56da456\u56da7890" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1869
            { "\u56da",  "1\u56da23\u9f9c\u672c\u672c\u56da456\u56da\u9f9c\u672c7890" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1870
            { "\u56da",  "" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1871
            { "[ \t,:.]","This is,testing: with\tdifferent separators." }, //multiple septs
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1872
            { "o",       "boo:and:foo" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1873
            { "o",       "booooo:and:fooooo" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1874
            { "o",       "fooooo:" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1875
        };
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1876
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1877
        String[][] expected = new String[][] {
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1878
            { "Abc", "Efg", "Hij" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1879
            { "", "Abc", "Efg", "Hij" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1880
            { "Abc", "", "Efg", "Hij" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1881
            { "Abc", "Efg", "Hij" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1882
            { "Abc", "Efg" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1883
            { "Abc" },
21670
ca3553133ede 8028321: Fix for String.split() empty input sequence/JDK-6559590 triggers regression
sherman
parents: 21668
diff changeset
  1884
            { "" },
ca3553133ede 8028321: Fix for String.split() empty input sequence/JDK-6559590 triggers regression
sherman
parents: 21668
diff changeset
  1885
            { "" },
21668
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1886
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1887
            { "awgqwefg1fefw", "vssv1vvv1" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1888
            { "afbfq", "bgwgb", "wngnwggw", "", "hjrnhneerh" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1889
            { "awgqwefg", "fefw4vssv", "vvv" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1890
            { "a\u4ebafg", "fefw\u4eba4\u9f9cvssv\u9f9c", "v\u672c\u672cvv" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1891
            { "1", "23", "456", "7890" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1892
            { "1", "23\u9f9c\u672c\u672c", "456", "\u9f9c\u672c7890" },
21670
ca3553133ede 8028321: Fix for String.split() empty input sequence/JDK-6559590 triggers regression
sherman
parents: 21668
diff changeset
  1893
            { "" },
21668
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1894
            { "This", "is", "testing", "", "with", "different", "separators" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1895
            { "b", "", ":and:f" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1896
            { "b", "", "", "", "", ":and:f" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1897
            { "f", "", "", "", "", ":" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1898
        };
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1899
        for (int i = 0; i < input.length; i++) {
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1900
            pattern = Pattern.compile(input[i][0]);
21670
ca3553133ede 8028321: Fix for String.split() empty input sequence/JDK-6559590 triggers regression
sherman
parents: 21668
diff changeset
  1901
            if (!Arrays.equals(pattern.split(input[i][1]), expected[i])) {
21668
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1902
                failCount++;
21670
ca3553133ede 8028321: Fix for String.split() empty input sequence/JDK-6559590 triggers regression
sherman
parents: 21668
diff changeset
  1903
            }
ca3553133ede 8028321: Fix for String.split() empty input sequence/JDK-6559590 triggers regression
sherman
parents: 21668
diff changeset
  1904
            if (input[i][1].length() > 0 &&  // splitAsStream() return empty resulting
ca3553133ede 8028321: Fix for String.split() empty input sequence/JDK-6559590 triggers regression
sherman
parents: 21668
diff changeset
  1905
                                             // array for zero-length input for now
ca3553133ede 8028321: Fix for String.split() empty input sequence/JDK-6559590 triggers regression
sherman
parents: 21668
diff changeset
  1906
                !Arrays.equals(pattern.splitAsStream(input[i][1]).toArray(),
ca3553133ede 8028321: Fix for String.split() empty input sequence/JDK-6559590 triggers regression
sherman
parents: 21668
diff changeset
  1907
                               expected[i])) {
21668
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1908
                failCount++;
21670
ca3553133ede 8028321: Fix for String.split() empty input sequence/JDK-6559590 triggers regression
sherman
parents: 21668
diff changeset
  1909
            }
21668
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1910
        }
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1911
        report("Split");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1912
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1913
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1914
    private static void negationTest() {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1915
        Pattern pattern = Pattern.compile("[\\[@^]+");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1916
        Matcher matcher = pattern.matcher("@@@@[[[[^^^^");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1917
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1918
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1919
        if (!matcher.group(0).equals("@@@@[[[[^^^^"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1920
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1921
        pattern = Pattern.compile("[@\\[^]+");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1922
        matcher = pattern.matcher("@@@@[[[[^^^^");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1923
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1924
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1925
        if (!matcher.group(0).equals("@@@@[[[[^^^^"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1926
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1927
        pattern = Pattern.compile("[@\\[^@]+");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1928
        matcher = pattern.matcher("@@@@[[[[^^^^");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1929
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1930
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1931
        if (!matcher.group(0).equals("@@@@[[[[^^^^"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1932
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1933
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1934
        pattern = Pattern.compile("\\)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1935
        matcher = pattern.matcher("xxx)xxx");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1936
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1937
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1938
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1939
        report("Negation");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1940
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1941
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1942
    private static void ampersandTest() {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1943
        Pattern pattern = Pattern.compile("[&@]+");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1944
        check(pattern, "@@@@&&&&", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1945
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1946
        pattern = Pattern.compile("[@&]+");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1947
        check(pattern, "@@@@&&&&", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1948
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1949
        pattern = Pattern.compile("[@\\&]+");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1950
        check(pattern, "@@@@&&&&", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1951
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1952
        report("Ampersand");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1953
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1954
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1955
    private static void octalTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1956
        Pattern pattern = Pattern.compile("\\u0007");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1957
        Matcher matcher = pattern.matcher("\u0007");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1958
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1959
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1960
        pattern = Pattern.compile("\\07");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1961
        matcher = pattern.matcher("\u0007");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1962
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1963
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1964
        pattern = Pattern.compile("\\007");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1965
        matcher = pattern.matcher("\u0007");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1966
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1967
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1968
        pattern = Pattern.compile("\\0007");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1969
        matcher = pattern.matcher("\u0007");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1970
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1971
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1972
        pattern = Pattern.compile("\\040");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1973
        matcher = pattern.matcher("\u0020");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1974
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1975
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1976
        pattern = Pattern.compile("\\0403");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1977
        matcher = pattern.matcher("\u00203");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1978
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1979
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1980
        pattern = Pattern.compile("\\0103");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1981
        matcher = pattern.matcher("\u0043");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1982
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1983
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1984
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1985
        report("Octal");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1986
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1987
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1988
    private static void longPatternTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1989
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1990
            Pattern pattern = Pattern.compile(
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1991
                "a 32-character-long pattern xxxx");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1992
            pattern = Pattern.compile("a 33-character-long pattern xxxxx");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1993
            pattern = Pattern.compile("a thirty four character long regex");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1994
            StringBuffer patternToBe = new StringBuffer(101);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1995
            for (int i=0; i<100; i++)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1996
                patternToBe.append((char)(97 + i%26));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1997
            pattern = Pattern.compile(patternToBe.toString());
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1998
        } catch (PatternSyntaxException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1999
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2000
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2001
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2002
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2003
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2004
            Pattern pattern = Pattern.compile(
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2005
                toSupplementaries("a 32-character-long pattern xxxx"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2006
            pattern = Pattern.compile(toSupplementaries("a 33-character-long pattern xxxxx"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2007
            pattern = Pattern.compile(toSupplementaries("a thirty four character long regex"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2008
            StringBuffer patternToBe = new StringBuffer(101*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2009
            for (int i=0; i<100; i++)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2010
                patternToBe.append(Character.toChars(Character.MIN_SUPPLEMENTARY_CODE_POINT
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2011
                                                     + 97 + i%26));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2012
            pattern = Pattern.compile(patternToBe.toString());
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2013
        } catch (PatternSyntaxException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2014
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2015
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2016
        report("LongPattern");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2017
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2018
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2019
    private static void group0Test() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2020
        Pattern pattern = Pattern.compile("(tes)ting");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2021
        Matcher matcher = pattern.matcher("testing");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2022
        check(matcher, "testing");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2023
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2024
        matcher.reset("testing");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2025
        if (matcher.lookingAt()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2026
            if (!matcher.group(0).equals("testing"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2027
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2028
        } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2029
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2030
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2031
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2032
        matcher.reset("testing");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2033
        if (matcher.matches()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2034
            if (!matcher.group(0).equals("testing"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2035
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2036
        } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2037
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2038
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2039
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2040
        pattern = Pattern.compile("(tes)ting");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2041
        matcher = pattern.matcher("testing");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2042
        if (matcher.lookingAt()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2043
            if (!matcher.group(0).equals("testing"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2044
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2045
        } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2046
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2047
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2048
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2049
        pattern = Pattern.compile("^(tes)ting");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2050
        matcher = pattern.matcher("testing");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2051
        if (matcher.matches()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2052
            if (!matcher.group(0).equals("testing"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2053
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2054
        } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2055
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2056
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2057
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2058
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2059
        pattern = Pattern.compile(toSupplementaries("(tes)ting"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2060
        matcher = pattern.matcher(toSupplementaries("testing"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2061
        check(matcher, toSupplementaries("testing"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2062
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2063
        matcher.reset(toSupplementaries("testing"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2064
        if (matcher.lookingAt()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2065
            if (!matcher.group(0).equals(toSupplementaries("testing")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2066
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2067
        } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2068
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2069
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2071
        matcher.reset(toSupplementaries("testing"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2072
        if (matcher.matches()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2073
            if (!matcher.group(0).equals(toSupplementaries("testing")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2074
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2075
        } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2076
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2077
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2078
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2079
        pattern = Pattern.compile(toSupplementaries("(tes)ting"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2080
        matcher = pattern.matcher(toSupplementaries("testing"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2081
        if (matcher.lookingAt()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2082
            if (!matcher.group(0).equals(toSupplementaries("testing")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2083
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2084
        } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2085
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2086
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2087
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2088
        pattern = Pattern.compile(toSupplementaries("^(tes)ting"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2089
        matcher = pattern.matcher(toSupplementaries("testing"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2090
        if (matcher.matches()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2091
            if (!matcher.group(0).equals(toSupplementaries("testing")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2092
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2093
        } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2094
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2095
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2096
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2097
        report("Group0");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2098
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2099
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2100
    private static void findIntTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2101
        Pattern p = Pattern.compile("blah");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2102
        Matcher m = p.matcher("zzzzblahzzzzzblah");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2103
        boolean result = m.find(2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2104
        if (!result)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2105
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2106
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2107
        p = Pattern.compile("$");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2108
        m = p.matcher("1234567890");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2109
        result = m.find(10);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2110
        if (!result)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2111
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2112
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2113
            result = m.find(11);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2114
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2115
        } catch (IndexOutOfBoundsException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2116
            // correct result
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2117
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2118
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2119
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2120
        p = Pattern.compile(toSupplementaries("blah"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2121
        m = p.matcher(toSupplementaries("zzzzblahzzzzzblah"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2122
        result = m.find(2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2123
        if (!result)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2124
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2125
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2126
        report("FindInt");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2127
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2128
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2129
    private static void emptyPatternTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2130
        Pattern p = Pattern.compile("");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2131
        Matcher m = p.matcher("foo");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2132
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2133
        // Should find empty pattern at beginning of input
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2134
        boolean result = m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2135
        if (result != true)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2136
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2137
        if (m.start() != 0)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2138
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2139
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2140
        // Should not match entire input if input is not empty
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2141
        m.reset();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2142
        result = m.matches();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2143
        if (result == true)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2144
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2145
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2146
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2147
            m.start(0);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2148
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2149
        } catch (IllegalStateException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2150
            // Correct result
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2151
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2152
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2153
        // Should match entire input if input is empty
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2154
        m.reset("");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2155
        result = m.matches();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2156
        if (result != true)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2157
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2158
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2159
        result = Pattern.matches("", "");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2160
        if (result != true)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2161
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2162
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2163
        result = Pattern.matches("", "foo");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2164
        if (result == true)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2165
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2166
        report("EmptyPattern");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2167
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2168
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2169
    private static void charClassTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2170
        Pattern pattern = Pattern.compile("blah[ab]]blech");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2171
        check(pattern, "blahb]blech", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2172
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2173
        pattern = Pattern.compile("[abc[def]]");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2174
        check(pattern, "b", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2175
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2176
        // Supplementary character tests
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2177
        pattern = Pattern.compile(toSupplementaries("blah[ab]]blech"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2178
        check(pattern, toSupplementaries("blahb]blech"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2179
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2180
        pattern = Pattern.compile(toSupplementaries("[abc[def]]"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2181
        check(pattern, toSupplementaries("b"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2182
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2183
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2184
            // u00ff when UNICODE_CASE
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2185
            pattern = Pattern.compile("[ab\u00ffcd]",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2186
                                      Pattern.CASE_INSENSITIVE|
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2187
                                      Pattern.UNICODE_CASE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2188
            check(pattern, "ab\u00ffcd", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2189
            check(pattern, "Ab\u0178Cd", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2190
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2191
            // u00b5 when UNICODE_CASE
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2192
            pattern = Pattern.compile("[ab\u00b5cd]",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2193
                                      Pattern.CASE_INSENSITIVE|
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2194
                                      Pattern.UNICODE_CASE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2195
            check(pattern, "ab\u00b5cd", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2196
            check(pattern, "Ab\u039cCd", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2197
        } catch (Exception e) { failCount++; }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2198
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2199
        /* Special cases
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2200
           (1)LatinSmallLetterLongS u+017f
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2201
           (2)LatinSmallLetterDotlessI u+0131
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2202
           (3)LatineCapitalLetterIWithDotAbove u+0130
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2203
           (4)KelvinSign u+212a
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2204
           (5)AngstromSign u+212b
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2205
        */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2206
        int flags = Pattern.UNICODE_CASE | Pattern.CASE_INSENSITIVE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2207
        pattern = Pattern.compile("[sik\u00c5]+", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2208
        if (!pattern.matcher("\u017f\u0130\u0131\u212a\u212b").matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2209
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2210
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2211
        report("CharClass");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2212
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2213
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2214
    private static void caretTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2215
        Pattern pattern = Pattern.compile("\\w*");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2216
        Matcher matcher = pattern.matcher("a#bc#def##g");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2217
        check(matcher, "a");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2218
        check(matcher, "");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2219
        check(matcher, "bc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2220
        check(matcher, "");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2221
        check(matcher, "def");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2222
        check(matcher, "");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2223
        check(matcher, "");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2224
        check(matcher, "g");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2225
        check(matcher, "");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2226
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2227
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2228
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2229
        pattern = Pattern.compile("^\\w*");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2230
        matcher = pattern.matcher("a#bc#def##g");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2231
        check(matcher, "a");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2232
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2233
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2234
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2235
        pattern = Pattern.compile("\\w");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2236
        matcher = pattern.matcher("abc##x");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2237
        check(matcher, "a");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2238
        check(matcher, "b");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2239
        check(matcher, "c");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2240
        check(matcher, "x");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2241
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2242
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2243
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2244
        pattern = Pattern.compile("^\\w");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2245
        matcher = pattern.matcher("abc##x");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2246
        check(matcher, "a");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2247
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2248
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2249
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2250
        pattern = Pattern.compile("\\A\\p{Alpha}{3}");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2251
        matcher = pattern.matcher("abcdef-ghi\njklmno");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2252
        check(matcher, "abc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2253
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2254
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2255
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2256
        pattern = Pattern.compile("^\\p{Alpha}{3}", Pattern.MULTILINE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2257
        matcher = pattern.matcher("abcdef-ghi\njklmno");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2258
        check(matcher, "abc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2259
        check(matcher, "jkl");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2260
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2261
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2262
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2263
        pattern = Pattern.compile("^", Pattern.MULTILINE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2264
        matcher = pattern.matcher("this is some text");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2265
        String result = matcher.replaceAll("X");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2266
        if (!result.equals("Xthis is some text"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2267
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2268
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2269
        pattern = Pattern.compile("^");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2270
        matcher = pattern.matcher("this is some text");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2271
        result = matcher.replaceAll("X");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2272
        if (!result.equals("Xthis is some text"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2273
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2274
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2275
        pattern = Pattern.compile("^", Pattern.MULTILINE | Pattern.UNIX_LINES);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2276
        matcher = pattern.matcher("this is some text\n");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2277
        result = matcher.replaceAll("X");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2278
        if (!result.equals("Xthis is some text\n"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2279
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2280
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2281
        report("Caret");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2282
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2283
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2284
    private static void groupCaptureTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2285
        // Independent group
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2286
        Pattern pattern = Pattern.compile("x+(?>y+)z+");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2287
        Matcher matcher = pattern.matcher("xxxyyyzzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2288
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2289
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2290
            String blah = matcher.group(1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2291
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2292
        } catch (IndexOutOfBoundsException ioobe) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2293
            // Good result
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2294
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2295
        // Pure group
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2296
        pattern = Pattern.compile("x+(?:y+)z+");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2297
        matcher = pattern.matcher("xxxyyyzzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2298
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2299
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2300
            String blah = matcher.group(1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2301
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2302
        } catch (IndexOutOfBoundsException ioobe) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2303
            // Good result
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2304
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2305
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2306
        // Supplementary character tests
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2307
        // Independent group
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2308
        pattern = Pattern.compile(toSupplementaries("x+(?>y+)z+"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2309
        matcher = pattern.matcher(toSupplementaries("xxxyyyzzz"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2310
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2311
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2312
            String blah = matcher.group(1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2313
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2314
        } catch (IndexOutOfBoundsException ioobe) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2315
            // Good result
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2316
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2317
        // Pure group
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2318
        pattern = Pattern.compile(toSupplementaries("x+(?:y+)z+"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2319
        matcher = pattern.matcher(toSupplementaries("xxxyyyzzz"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2320
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2321
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2322
            String blah = matcher.group(1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2323
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2324
        } catch (IndexOutOfBoundsException ioobe) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2325
            // Good result
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2326
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2327
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2328
        report("GroupCapture");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2329
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2330
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2331
    private static void backRefTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2332
        Pattern pattern = Pattern.compile("(a*)bc\\1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2333
        check(pattern, "zzzaabcazzz", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2334
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2335
        pattern = Pattern.compile("(a*)bc\\1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2336
        check(pattern, "zzzaabcaazzz", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2337
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2338
        pattern = Pattern.compile("(abc)(def)\\1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2339
        check(pattern, "abcdefabc", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2340
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2341
        pattern = Pattern.compile("(abc)(def)\\3");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2342
        check(pattern, "abcdefabc", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2343
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2344
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2345
            for (int i = 1; i < 10; i++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2346
                // Make sure backref 1-9 are always accepted
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2347
                pattern = Pattern.compile("abcdef\\" + i);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2348
                // and fail to match if the target group does not exit
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2349
                check(pattern, "abcdef", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2350
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2351
        } catch(PatternSyntaxException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2352
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2353
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2354
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2355
        pattern = Pattern.compile("(a)(b)(c)(d)(e)(f)(g)(h)(i)(j)\\11");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2356
        check(pattern, "abcdefghija", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2357
        check(pattern, "abcdefghija1", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2358
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2359
        pattern = Pattern.compile("(a)(b)(c)(d)(e)(f)(g)(h)(i)(j)(k)\\11");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2360
        check(pattern, "abcdefghijkk", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2361
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2362
        pattern = Pattern.compile("(a)bcdefghij\\11");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2363
        check(pattern, "abcdefghija1", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2364
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2365
        // Supplementary character tests
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2366
        pattern = Pattern.compile(toSupplementaries("(a*)bc\\1"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2367
        check(pattern, toSupplementaries("zzzaabcazzz"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2368
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2369
        pattern = Pattern.compile(toSupplementaries("(a*)bc\\1"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2370
        check(pattern, toSupplementaries("zzzaabcaazzz"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2371
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2372
        pattern = Pattern.compile(toSupplementaries("(abc)(def)\\1"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2373
        check(pattern, toSupplementaries("abcdefabc"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2374
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2375
        pattern = Pattern.compile(toSupplementaries("(abc)(def)\\3"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2376
        check(pattern, toSupplementaries("abcdefabc"), false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2377
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2378
        pattern = Pattern.compile(toSupplementaries("(a)(b)(c)(d)(e)(f)(g)(h)(i)(j)\\11"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2379
        check(pattern, toSupplementaries("abcdefghija"), false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2380
        check(pattern, toSupplementaries("abcdefghija1"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2381
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2382
        pattern = Pattern.compile(toSupplementaries("(a)(b)(c)(d)(e)(f)(g)(h)(i)(j)(k)\\11"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2383
        check(pattern, toSupplementaries("abcdefghijkk"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2384
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2385
        report("BackRef");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2386
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2387
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2388
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2389
     * Unicode Technical Report #18, section 2.6 End of Line
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2390
     * There is no empty line to be matched in the sequence \u000D\u000A
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2391
     * but there is an empty line in the sequence \u000A\u000D.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2392
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2393
    private static void anchorTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2394
        Pattern p = Pattern.compile("^.*$", Pattern.MULTILINE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2395
        Matcher m = p.matcher("blah1\r\nblah2");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2396
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2397
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2398
        if (!m.group().equals("blah2"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2399
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2400
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2401
        m.reset("blah1\n\rblah2");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2402
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2403
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2404
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2405
        if (!m.group().equals("blah2"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2406
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2407
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2408
        // Test behavior of $ with \r\n at end of input
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2409
        p = Pattern.compile(".+$");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2410
        m = p.matcher("blah1\r\n");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2411
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2412
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2413
       if (!m.group().equals("blah1"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2414
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2415
        if (m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2416
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2417
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2418
        // Test behavior of $ with \r\n at end of input in multiline
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2419
        p = Pattern.compile(".+$", Pattern.MULTILINE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2420
        m = p.matcher("blah1\r\n");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2421
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2422
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2423
        if (m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2424
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2425
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2426
        // Test for $ recognition of \u0085 for bug 4527731
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2427
        p = Pattern.compile(".+$", Pattern.MULTILINE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2428
        m = p.matcher("blah1\u0085");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2429
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2430
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2431
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2432
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2433
        p = Pattern.compile("^.*$", Pattern.MULTILINE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2434
        m = p.matcher(toSupplementaries("blah1\r\nblah2"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2435
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2436
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2437
        if (!m.group().equals(toSupplementaries("blah2")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2438
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2439
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2440
        m.reset(toSupplementaries("blah1\n\rblah2"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2441
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2442
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2443
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2444
        if (!m.group().equals(toSupplementaries("blah2")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2445
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2446
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2447
        // Test behavior of $ with \r\n at end of input
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2448
        p = Pattern.compile(".+$");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2449
        m = p.matcher(toSupplementaries("blah1\r\n"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2450
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2451
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2452
        if (!m.group().equals(toSupplementaries("blah1")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2453
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2454
        if (m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2455
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2456
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2457
        // Test behavior of $ with \r\n at end of input in multiline
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2458
        p = Pattern.compile(".+$", Pattern.MULTILINE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2459
        m = p.matcher(toSupplementaries("blah1\r\n"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2460
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2461
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2462
        if (m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2463
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2464
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2465
        // Test for $ recognition of \u0085 for bug 4527731
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2466
        p = Pattern.compile(".+$", Pattern.MULTILINE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2467
        m = p.matcher(toSupplementaries("blah1\u0085"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2468
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2469
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2470
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2471
        report("Anchors");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2472
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2473
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2474
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2475
     * A basic sanity test of Matcher.lookingAt().
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2476
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2477
    private static void lookingAtTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2478
        Pattern p = Pattern.compile("(ab)(c*)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2479
        Matcher m = p.matcher("abccczzzabcczzzabccc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2480
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2481
        if (!m.lookingAt())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2482
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2483
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2484
        if (!m.group().equals(m.group(0)))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2485
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2486
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2487
        m = p.matcher("zzzabccczzzabcczzzabccczzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2488
        if (m.lookingAt())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2489
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2490
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2491
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2492
        p = Pattern.compile(toSupplementaries("(ab)(c*)"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2493
        m = p.matcher(toSupplementaries("abccczzzabcczzzabccc"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2494
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2495
        if (!m.lookingAt())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2496
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2497
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2498
        if (!m.group().equals(m.group(0)))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2499
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2500
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2501
        m = p.matcher(toSupplementaries("zzzabccczzzabcczzzabccczzz"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2502
        if (m.lookingAt())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2503
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2504
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2505
        report("Looking At");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2506
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2507
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2508
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2509
     * A basic sanity test of Matcher.matches().
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2510
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2511
    private static void matchesTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2512
        // matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2513
        Pattern p = Pattern.compile("ulb(c*)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2514
        Matcher m = p.matcher("ulbcccccc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2515
        if (!m.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2516
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2517
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2518
        // find() but not matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2519
        m.reset("zzzulbcccccc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2520
        if (m.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2521
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2522
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2523
        // lookingAt() but not matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2524
        m.reset("ulbccccccdef");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2525
        if (m.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2526
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2527
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2528
        // matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2529
        p = Pattern.compile("a|ad");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2530
        m = p.matcher("ad");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2531
        if (!m.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2532
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2533
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2534
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2535
        // matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2536
        p = Pattern.compile(toSupplementaries("ulb(c*)"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2537
        m = p.matcher(toSupplementaries("ulbcccccc"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2538
        if (!m.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2539
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2540
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2541
        // find() but not matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2542
        m.reset(toSupplementaries("zzzulbcccccc"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2543
        if (m.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2544
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2545
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2546
        // lookingAt() but not matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2547
        m.reset(toSupplementaries("ulbccccccdef"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2548
        if (m.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2549
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2550
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2551
        // matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2552
        p = Pattern.compile(toSupplementaries("a|ad"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2553
        m = p.matcher(toSupplementaries("ad"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2554
        if (!m.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2555
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2556
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2557
        report("Matches");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2558
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2559
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2560
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2561
     * A basic sanity test of Pattern.matches().
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2562
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2563
    private static void patternMatchesTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2564
        // matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2565
        if (!Pattern.matches(toSupplementaries("ulb(c*)"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2566
                             toSupplementaries("ulbcccccc")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2567
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2568
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2569
        // find() but not matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2570
        if (Pattern.matches(toSupplementaries("ulb(c*)"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2571
                            toSupplementaries("zzzulbcccccc")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2572
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2573
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2574
        // lookingAt() but not matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2575
        if (Pattern.matches(toSupplementaries("ulb(c*)"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2576
                            toSupplementaries("ulbccccccdef")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2577
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2578
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2579
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2580
        // matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2581
        if (!Pattern.matches(toSupplementaries("ulb(c*)"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2582
                             toSupplementaries("ulbcccccc")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2583
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2584
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2585
        // find() but not matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2586
        if (Pattern.matches(toSupplementaries("ulb(c*)"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2587
                            toSupplementaries("zzzulbcccccc")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2588
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2589
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2590
        // lookingAt() but not matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2591
        if (Pattern.matches(toSupplementaries("ulb(c*)"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2592
                            toSupplementaries("ulbccccccdef")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2593
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2594
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2595
        report("Pattern Matches");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2596
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2597
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2598
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2599
     * Canonical equivalence testing. Tests the ability of the engine
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2600
     * to match sequences that are not explicitly specified in the
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2601
     * pattern when they are considered equivalent by the Unicode Standard.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2602
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2603
    private static void ceTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2604
        // Decomposed char outside char classes
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2605
        Pattern p = Pattern.compile("testa\u030a", Pattern.CANON_EQ);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2606
        Matcher m = p.matcher("test\u00e5");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2607
        if (!m.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2608
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2609
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2610
        m.reset("testa\u030a");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2611
        if (!m.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2612
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2613
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2614
        // Composed char outside char classes
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2615
        p = Pattern.compile("test\u00e5", Pattern.CANON_EQ);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2616
        m = p.matcher("test\u00e5");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2617
        if (!m.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2618
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2619
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2620
        m.reset("testa\u030a");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2621
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2622
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2623
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2624
        // Decomposed char inside a char class
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2625
        p = Pattern.compile("test[abca\u030a]", Pattern.CANON_EQ);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2626
        m = p.matcher("test\u00e5");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2627
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2628
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2629
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2630
        m.reset("testa\u030a");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2631
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2632
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2633
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2634
        // Composed char inside a char class
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2635
        p = Pattern.compile("test[abc\u00e5def\u00e0]", Pattern.CANON_EQ);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2636
        m = p.matcher("test\u00e5");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2637
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2638
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2639
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2640
        m.reset("testa\u0300");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2641
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2642
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2643
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2644
        m.reset("testa\u030a");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2645
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2646
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2647
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2648
        // Marks that cannot legally change order and be equivalent
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2649
        p = Pattern.compile("testa\u0308\u0300", Pattern.CANON_EQ);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2650
        check(p, "testa\u0308\u0300", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2651
        check(p, "testa\u0300\u0308", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2652
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2653
        // Marks that can legally change order and be equivalent
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2654
        p = Pattern.compile("testa\u0308\u0323", Pattern.CANON_EQ);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2655
        check(p, "testa\u0308\u0323", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2656
        check(p, "testa\u0323\u0308", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2657
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2658
        // Test all equivalences of the sequence a\u0308\u0323\u0300
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2659
        p = Pattern.compile("testa\u0308\u0323\u0300", Pattern.CANON_EQ);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2660
        check(p, "testa\u0308\u0323\u0300", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2661
        check(p, "testa\u0323\u0308\u0300", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2662
        check(p, "testa\u0308\u0300\u0323", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2663
        check(p, "test\u00e4\u0323\u0300", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2664
        check(p, "test\u00e4\u0300\u0323", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2665
37882
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2666
        Object[][] data = new Object[][] {
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2667
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2668
        // JDK-4867170
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2669
        { "[\u1f80-\u1f82]", "ab\u1f80cd",             "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2670
        { "[\u1f80-\u1f82]", "ab\u1f81cd",             "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2671
        { "[\u1f80-\u1f82]", "ab\u1f82cd",             "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2672
        { "[\u1f80-\u1f82]", "ab\u03b1\u0314\u0345cd", "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2673
        { "[\u1f80-\u1f82]", "ab\u03b1\u0345\u0314cd", "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2674
        { "[\u1f80-\u1f82]", "ab\u1f01\u0345cd",       "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2675
        { "[\u1f80-\u1f82]", "ab\u1f00\u0345cd",       "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2676
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2677
        { "\\p{IsGreek}",    "ab\u1f80cd",             "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2678
        { "\\p{IsGreek}",    "ab\u1f81cd",             "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2679
        { "\\p{IsGreek}",    "ab\u1f82cd",             "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2680
        { "\\p{IsGreek}",    "ab\u03b1\u0314\u0345cd", "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2681
        { "\\p{IsGreek}",    "ab\u1f01\u0345cd",       "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2682
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2683
        // backtracking, force to match "\u1f80", instead of \u1f82"
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2684
        { "ab\\p{IsGreek}\u0300cd", "ab\u03b1\u0313\u0345\u0300cd", "m", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2685
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2686
        { "[\\p{IsGreek}]",  "\u03b1\u0314\u0345",     "m", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2687
        { "\\p{IsGreek}",    "\u03b1\u0314\u0345",     "m", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2688
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2689
        { "[^\u1f80-\u1f82]","\u1f81",                 "m", false },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2690
        { "[^\u1f80-\u1f82]","\u03b1\u0314\u0345",     "m", false },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2691
        { "[^\u1f01\u0345]", "\u1f81",                 "f", false },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2692
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2693
        { "[^\u1f81]+",      "\u1f80\u1f82",           "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2694
        { "[\u1f80]",        "ab\u1f80cd",             "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2695
        { "\u1f80",          "ab\u1f80cd",             "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2696
        { "\u1f00\u0345\u0300",  "\u1f82", "m", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2697
        { "\u1f80",          "-\u1f00\u0345\u0300-",   "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2698
        { "\u1f82",          "\u1f00\u0345\u0300",     "m", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2699
        { "\u1f82",          "\u1f80\u0300",           "m", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2700
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2701
        // JDK-7080302       # compile failed
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2702
        { "a(\u0041\u0301\u0328)", "a\u0041\u0301\u0328", "m", true},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2703
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2704
        // JDK-6728861, same cause as above one
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2705
        { "\u00e9\u00e9n", "e\u0301e\u0301n", "m", true},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2706
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2707
        // JDK-6995635
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2708
        { "(\u00e9)", "e\u0301", "m", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2709
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2710
        // JDK-6736245
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2711
        // intereting special case, nfc(u2add+u0338) -> u2add+u0338) NOT u2adc
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2712
        { "\u2ADC", "\u2ADC", "m", true},          // NFC
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2713
        { "\u2ADC", "\u2ADD\u0338", "m", true},    // NFD
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2714
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2715
        //  4916384.
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2716
        // Decomposed hangul (jamos) works inside clazz
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2717
        { "[\u1100\u1161]", "\u1100\u1161", "m", true},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2718
        { "[\u1100\u1161]", "\uac00", "m", true},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2719
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2720
        { "[\uac00]", "\u1100\u1161", "m", true},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2721
        { "[\uac00]", "\uac00", "m", true},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2722
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2723
        // Decomposed hangul (jamos)
37882
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2724
        { "\u1100\u1161", "\u1100\u1161", "m", true},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2725
        { "\u1100\u1161", "\uac00", "m", true},
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2726
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2727
        // Composed hangul
37882
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2728
        { "\uac00",  "\u1100\u1161", "m", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2729
        { "\uac00",  "\uac00", "m", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2730
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2731
        /* Need a NFDSlice to nfd the source to solve this issue
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2732
           u+1d1c0 -> nfd: <u+1d1ba><u+1d165><u+1d16f>  -> nfc: <u+1d1ba><u+1d165><u+1d16f>
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2733
           u+1d1bc -> nfd: <u+1d1ba><u+1d165>           -> nfc: <u+1d1ba><u+1d165>
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2734
           <u+1d1bc><u+1d16f> -> nfd: <u+1d1ba><u+1d165><u+1d16f> -> nfc: <u+1d1ba><u+1d165><u+1d16f>
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2735
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2736
        // Decomposed supplementary outside char classes
37882
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2737
        // { "test\ud834\uddbc\ud834\udd6f", "test\ud834\uddc0", "m", true },
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2738
        // Composed supplementary outside char classes
37882
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2739
        // { "test\ud834\uddc0", "test\ud834\uddbc\ud834\udd6f", "m", true },
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2740
        */
37882
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2741
        { "test\ud834\uddbc\ud834\udd6f", "test\ud834\uddbc\ud834\udd6f", "m", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2742
        { "test\ud834\uddc0",             "test\ud834\uddbc\ud834\udd6f", "m", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2743
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2744
        { "test\ud834\uddc0",             "test\ud834\uddc0",             "m", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2745
        { "test\ud834\uddbc\ud834\udd6f", "test\ud834\uddc0",             "m", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2746
        };
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2747
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2748
        int failCount = 0;
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2749
        for (Object[] d : data) {
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2750
            String pn = (String)d[0];
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2751
            String tt = (String)d[1];
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2752
            boolean isFind = "f".equals(((String)d[2]));
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2753
            boolean expected = (boolean)d[3];
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2754
            boolean ret = isFind ? Pattern.compile(pn, Pattern.CANON_EQ).matcher(tt).find()
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2755
                                 : Pattern.compile(pn, Pattern.CANON_EQ).matcher(tt).matches();
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2756
            if (ret != expected) {
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2757
                failCount++;
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2758
                continue;
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2759
            }
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2760
        }
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2761
        report("Canonical Equivalence");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2762
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2763
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2764
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2765
     * A basic sanity test of Matcher.replaceAll().
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2766
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2767
    private static void globalSubstitute() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2768
        // Global substitution with a literal
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2769
        Pattern p = Pattern.compile("(ab)(c*)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2770
        Matcher m = p.matcher("abccczzzabcczzzabccc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2771
        if (!m.replaceAll("test").equals("testzzztestzzztest"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2772
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2773
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2774
        m.reset("zzzabccczzzabcczzzabccczzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2775
        if (!m.replaceAll("test").equals("zzztestzzztestzzztestzzz"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2776
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2777
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2778
        // Global substitution with groups
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2779
        m.reset("zzzabccczzzabcczzzabccczzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2780
        String result = m.replaceAll("$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2781
        if (!result.equals("zzzabzzzabzzzabzzz"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2782
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2783
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2784
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2785
        // Global substitution with a literal
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2786
        p = Pattern.compile(toSupplementaries("(ab)(c*)"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2787
        m = p.matcher(toSupplementaries("abccczzzabcczzzabccc"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2788
        if (!m.replaceAll(toSupplementaries("test")).
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2789
            equals(toSupplementaries("testzzztestzzztest")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2790
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2791
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2792
        m.reset(toSupplementaries("zzzabccczzzabcczzzabccczzz"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2793
        if (!m.replaceAll(toSupplementaries("test")).
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2794
            equals(toSupplementaries("zzztestzzztestzzztestzzz")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2795
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2796
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2797
        // Global substitution with groups
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2798
        m.reset(toSupplementaries("zzzabccczzzabcczzzabccczzz"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2799
        result = m.replaceAll("$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2800
        if (!result.equals(toSupplementaries("zzzabzzzabzzzabzzz")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2801
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2802
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2803
        report("Global Substitution");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2804
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2805
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2806
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2807
     * Tests the usage of Matcher.appendReplacement() with literal
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2808
     * and group substitutions.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2809
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2810
    private static void stringbufferSubstitute() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2811
        // SB substitution with literal
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2812
        String blah = "zzzblahzzz";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2813
        Pattern p = Pattern.compile("blah");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2814
        Matcher m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2815
        StringBuffer result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2816
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2817
            m.appendReplacement(result, "blech");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2818
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2819
        } catch (IllegalStateException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2820
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2821
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2822
        m.appendReplacement(result, "blech");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2823
        if (!result.toString().equals("zzzblech"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2824
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2825
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2826
        m.appendTail(result);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2827
        if (!result.toString().equals("zzzblechzzz"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2828
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2829
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2830
        // SB substitution with groups
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2831
        blah = "zzzabcdzzz";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2832
        p = Pattern.compile("(ab)(cd)*");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2833
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2834
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2835
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2836
            m.appendReplacement(result, "$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2837
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2838
        } catch (IllegalStateException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2839
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2840
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2841
        m.appendReplacement(result, "$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2842
        if (!result.toString().equals("zzzab"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2843
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2844
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2845
        m.appendTail(result);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2846
        if (!result.toString().equals("zzzabzzz"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2847
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2848
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2849
        // SB substitution with 3 groups
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2850
        blah = "zzzabcdcdefzzz";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2851
        p = Pattern.compile("(ab)(cd)*(ef)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2852
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2853
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2854
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2855
            m.appendReplacement(result, "$1w$2w$3");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2856
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2857
        } catch (IllegalStateException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2858
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2859
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2860
        m.appendReplacement(result, "$1w$2w$3");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2861
        if (!result.toString().equals("zzzabwcdwef"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2862
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2863
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2864
        m.appendTail(result);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2865
        if (!result.toString().equals("zzzabwcdwefzzz"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2866
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2867
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2868
        // SB substitution with groups and three matches
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2869
        // skipping middle match
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2870
        blah = "zzzabcdzzzabcddzzzabcdzzz";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2871
        p = Pattern.compile("(ab)(cd*)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2872
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2873
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2874
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2875
            m.appendReplacement(result, "$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2876
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2877
        } catch (IllegalStateException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2878
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2879
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2880
        m.appendReplacement(result, "$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2881
        if (!result.toString().equals("zzzab"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2882
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2883
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2884
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2885
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2886
        m.appendReplacement(result, "$2");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2887
        if (!result.toString().equals("zzzabzzzabcddzzzcd"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2888
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2889
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2890
        m.appendTail(result);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2891
        if (!result.toString().equals("zzzabzzzabcddzzzcdzzz"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2892
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2893
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2894
        // Check to make sure escaped $ is ignored
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2895
        blah = "zzzabcdcdefzzz";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2896
        p = Pattern.compile("(ab)(cd)*(ef)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2897
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2898
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2899
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2900
        m.appendReplacement(result, "$1w\\$2w$3");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2901
        if (!result.toString().equals("zzzabw$2wef"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2902
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2903
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2904
        m.appendTail(result);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2905
        if (!result.toString().equals("zzzabw$2wefzzz"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2906
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2907
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2908
        // Check to make sure a reference to nonexistent group causes error
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2909
        blah = "zzzabcdcdefzzz";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2910
        p = Pattern.compile("(ab)(cd)*(ef)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2911
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2912
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2913
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2914
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2915
            m.appendReplacement(result, "$1w$5w$3");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2916
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2917
        } catch (IndexOutOfBoundsException ioobe) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2918
            // Correct result
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2919
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2920
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2921
        // Check double digit group references
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2922
        blah = "zzz123456789101112zzz";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2923
        p = Pattern.compile("(1)(2)(3)(4)(5)(6)(7)(8)(9)(10)(11)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2924
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2925
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2926
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2927
        m.appendReplacement(result, "$1w$11w$3");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2928
        if (!result.toString().equals("zzz1w11w3"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2929
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2930
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2931
        // Check to make sure it backs off $15 to $1 if only three groups
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2932
        blah = "zzzabcdcdefzzz";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2933
        p = Pattern.compile("(ab)(cd)*(ef)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2934
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2935
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2936
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2937
        m.appendReplacement(result, "$1w$15w$3");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2938
        if (!result.toString().equals("zzzabwab5wef"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2939
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2940
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2941
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2942
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2943
        // SB substitution with literal
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2944
        blah = toSupplementaries("zzzblahzzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2945
        p = Pattern.compile(toSupplementaries("blah"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2946
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2947
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2948
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2949
            m.appendReplacement(result, toSupplementaries("blech"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2950
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2951
        } catch (IllegalStateException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2952
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2953
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2954
        m.appendReplacement(result, toSupplementaries("blech"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2955
        if (!result.toString().equals(toSupplementaries("zzzblech")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2956
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2957
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2958
        m.appendTail(result);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2959
        if (!result.toString().equals(toSupplementaries("zzzblechzzz")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2960
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2961
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2962
        // SB substitution with groups
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2963
        blah = toSupplementaries("zzzabcdzzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2964
        p = Pattern.compile(toSupplementaries("(ab)(cd)*"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2965
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2966
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2967
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2968
            m.appendReplacement(result, "$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2969
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2970
        } catch (IllegalStateException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2971
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2972
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2973
        m.appendReplacement(result, "$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2974
        if (!result.toString().equals(toSupplementaries("zzzab")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2975
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2976
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2977
        m.appendTail(result);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2978
        if (!result.toString().equals(toSupplementaries("zzzabzzz")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2979
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2980
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2981
        // SB substitution with 3 groups
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2982
        blah = toSupplementaries("zzzabcdcdefzzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2983
        p = Pattern.compile(toSupplementaries("(ab)(cd)*(ef)"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2984
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2985
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2986
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2987
            m.appendReplacement(result, toSupplementaries("$1w$2w$3"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2988
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2989
        } catch (IllegalStateException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2990
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2991
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2992
        m.appendReplacement(result, toSupplementaries("$1w$2w$3"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2993
        if (!result.toString().equals(toSupplementaries("zzzabwcdwef")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2994
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2995
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2996
        m.appendTail(result);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2997
        if (!result.toString().equals(toSupplementaries("zzzabwcdwefzzz")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2998
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2999
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3000
        // SB substitution with groups and three matches
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3001
        // skipping middle match
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3002
        blah = toSupplementaries("zzzabcdzzzabcddzzzabcdzzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3003
        p = Pattern.compile(toSupplementaries("(ab)(cd*)"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3004
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3005
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3006
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3007
            m.appendReplacement(result, "$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3008
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3009
        } catch (IllegalStateException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3010
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3011
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3012
        m.appendReplacement(result, "$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3013
        if (!result.toString().equals(toSupplementaries("zzzab")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3014
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3015
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3016
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3017
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3018
        m.appendReplacement(result, "$2");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3019
        if (!result.toString().equals(toSupplementaries("zzzabzzzabcddzzzcd")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3020
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3021
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3022
        m.appendTail(result);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3023
        if (!result.toString().equals(toSupplementaries("zzzabzzzabcddzzzcdzzz")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3024
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3025
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3026
        // Check to make sure escaped $ is ignored
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3027
        blah = toSupplementaries("zzzabcdcdefzzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3028
        p = Pattern.compile(toSupplementaries("(ab)(cd)*(ef)"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3029
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3030
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3031
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3032
        m.appendReplacement(result, toSupplementaries("$1w\\$2w$3"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3033
        if (!result.toString().equals(toSupplementaries("zzzabw$2wef")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3034
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3035
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3036
        m.appendTail(result);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3037
        if (!result.toString().equals(toSupplementaries("zzzabw$2wefzzz")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3038
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3039
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3040
        // Check to make sure a reference to nonexistent group causes error
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3041
        blah = toSupplementaries("zzzabcdcdefzzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3042
        p = Pattern.compile(toSupplementaries("(ab)(cd)*(ef)"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3043
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3044
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3045
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3046
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3047
            m.appendReplacement(result, toSupplementaries("$1w$5w$3"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3048
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3049
        } catch (IndexOutOfBoundsException ioobe) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3050
            // Correct result
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3051
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3052
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3053
        // Check double digit group references
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3054
        blah = toSupplementaries("zzz123456789101112zzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3055
        p = Pattern.compile("(1)(2)(3)(4)(5)(6)(7)(8)(9)(10)(11)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3056
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3057
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3058
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3059
        m.appendReplacement(result, toSupplementaries("$1w$11w$3"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3060
        if (!result.toString().equals(toSupplementaries("zzz1w11w3")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3061
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3062
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3063
        // Check to make sure it backs off $15 to $1 if only three groups
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3064
        blah = toSupplementaries("zzzabcdcdefzzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3065
        p = Pattern.compile(toSupplementaries("(ab)(cd)*(ef)"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3066
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3067
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3068
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3069
        m.appendReplacement(result, toSupplementaries("$1w$15w$3"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3070
        if (!result.toString().equals(toSupplementaries("zzzabwab5wef")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3071
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3072
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3073
        // Check nothing has been appended into the output buffer if
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3074
        // the replacement string triggers IllegalArgumentException.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3075
        p = Pattern.compile("(abc)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3076
        m = p.matcher("abcd");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3077
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3078
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3079
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3080
            m.appendReplacement(result, ("xyz$g"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3081
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3082
        } catch (IllegalArgumentException iae) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3083
            if (result.length() != 0)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3084
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3085
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3086
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3087
        report("SB Substitution");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3088
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3089
23734
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3090
    /**
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3091
     * Tests the usage of Matcher.appendReplacement() with literal
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3092
     * and group substitutions.
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3093
     */
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3094
    private static void stringbuilderSubstitute() throws Exception {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3095
        // SB substitution with literal
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3096
        String blah = "zzzblahzzz";
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3097
        Pattern p = Pattern.compile("blah");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3098
        Matcher m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3099
        StringBuilder result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3100
        try {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3101
            m.appendReplacement(result, "blech");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3102
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3103
        } catch (IllegalStateException e) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3104
        }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3105
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3106
        m.appendReplacement(result, "blech");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3107
        if (!result.toString().equals("zzzblech"))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3108
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3109
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3110
        m.appendTail(result);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3111
        if (!result.toString().equals("zzzblechzzz"))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3112
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3113
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3114
        // SB substitution with groups
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3115
        blah = "zzzabcdzzz";
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3116
        p = Pattern.compile("(ab)(cd)*");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3117
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3118
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3119
        try {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3120
            m.appendReplacement(result, "$1");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3121
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3122
        } catch (IllegalStateException e) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3123
        }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3124
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3125
        m.appendReplacement(result, "$1");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3126
        if (!result.toString().equals("zzzab"))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3127
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3128
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3129
        m.appendTail(result);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3130
        if (!result.toString().equals("zzzabzzz"))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3131
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3132
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3133
        // SB substitution with 3 groups
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3134
        blah = "zzzabcdcdefzzz";
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3135
        p = Pattern.compile("(ab)(cd)*(ef)");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3136
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3137
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3138
        try {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3139
            m.appendReplacement(result, "$1w$2w$3");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3140
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3141
        } catch (IllegalStateException e) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3142
        }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3143
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3144
        m.appendReplacement(result, "$1w$2w$3");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3145
        if (!result.toString().equals("zzzabwcdwef"))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3146
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3147
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3148
        m.appendTail(result);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3149
        if (!result.toString().equals("zzzabwcdwefzzz"))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3150
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3151
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3152
        // SB substitution with groups and three matches
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3153
        // skipping middle match
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3154
        blah = "zzzabcdzzzabcddzzzabcdzzz";
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3155
        p = Pattern.compile("(ab)(cd*)");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3156
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3157
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3158
        try {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3159
            m.appendReplacement(result, "$1");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3160
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3161
        } catch (IllegalStateException e) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3162
        }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3163
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3164
        m.appendReplacement(result, "$1");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3165
        if (!result.toString().equals("zzzab"))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3166
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3167
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3168
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3169
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3170
        m.appendReplacement(result, "$2");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3171
        if (!result.toString().equals("zzzabzzzabcddzzzcd"))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3172
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3173
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3174
        m.appendTail(result);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3175
        if (!result.toString().equals("zzzabzzzabcddzzzcdzzz"))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3176
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3177
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3178
        // Check to make sure escaped $ is ignored
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3179
        blah = "zzzabcdcdefzzz";
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3180
        p = Pattern.compile("(ab)(cd)*(ef)");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3181
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3182
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3183
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3184
        m.appendReplacement(result, "$1w\\$2w$3");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3185
        if (!result.toString().equals("zzzabw$2wef"))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3186
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3187
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3188
        m.appendTail(result);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3189
        if (!result.toString().equals("zzzabw$2wefzzz"))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3190
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3191
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3192
        // Check to make sure a reference to nonexistent group causes error
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3193
        blah = "zzzabcdcdefzzz";
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3194
        p = Pattern.compile("(ab)(cd)*(ef)");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3195
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3196
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3197
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3198
        try {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3199
            m.appendReplacement(result, "$1w$5w$3");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3200
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3201
        } catch (IndexOutOfBoundsException ioobe) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3202
            // Correct result
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3203
        }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3204
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3205
        // Check double digit group references
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3206
        blah = "zzz123456789101112zzz";
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3207
        p = Pattern.compile("(1)(2)(3)(4)(5)(6)(7)(8)(9)(10)(11)");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3208
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3209
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3210
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3211
        m.appendReplacement(result, "$1w$11w$3");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3212
        if (!result.toString().equals("zzz1w11w3"))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3213
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3214
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3215
        // Check to make sure it backs off $15 to $1 if only three groups
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3216
        blah = "zzzabcdcdefzzz";
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3217
        p = Pattern.compile("(ab)(cd)*(ef)");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3218
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3219
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3220
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3221
        m.appendReplacement(result, "$1w$15w$3");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3222
        if (!result.toString().equals("zzzabwab5wef"))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3223
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3224
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3225
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3226
        // Supplementary character test
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3227
        // SB substitution with literal
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3228
        blah = toSupplementaries("zzzblahzzz");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3229
        p = Pattern.compile(toSupplementaries("blah"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3230
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3231
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3232
        try {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3233
            m.appendReplacement(result, toSupplementaries("blech"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3234
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3235
        } catch (IllegalStateException e) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3236
        }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3237
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3238
        m.appendReplacement(result, toSupplementaries("blech"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3239
        if (!result.toString().equals(toSupplementaries("zzzblech")))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3240
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3241
        m.appendTail(result);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3242
        if (!result.toString().equals(toSupplementaries("zzzblechzzz")))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3243
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3244
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3245
        // SB substitution with groups
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3246
        blah = toSupplementaries("zzzabcdzzz");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3247
        p = Pattern.compile(toSupplementaries("(ab)(cd)*"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3248
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3249
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3250
        try {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3251
            m.appendReplacement(result, "$1");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3252
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3253
        } catch (IllegalStateException e) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3254
        }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3255
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3256
        m.appendReplacement(result, "$1");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3257
        if (!result.toString().equals(toSupplementaries("zzzab")))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3258
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3259
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3260
        m.appendTail(result);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3261
        if (!result.toString().equals(toSupplementaries("zzzabzzz")))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3262
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3263
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3264
        // SB substitution with 3 groups
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3265
        blah = toSupplementaries("zzzabcdcdefzzz");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3266
        p = Pattern.compile(toSupplementaries("(ab)(cd)*(ef)"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3267
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3268
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3269
        try {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3270
            m.appendReplacement(result, toSupplementaries("$1w$2w$3"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3271
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3272
        } catch (IllegalStateException e) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3273
        }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3274
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3275
        m.appendReplacement(result, toSupplementaries("$1w$2w$3"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3276
        if (!result.toString().equals(toSupplementaries("zzzabwcdwef")))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3277
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3278
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3279
        m.appendTail(result);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3280
        if (!result.toString().equals(toSupplementaries("zzzabwcdwefzzz")))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3281
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3282
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3283
        // SB substitution with groups and three matches
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3284
        // skipping middle match
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3285
        blah = toSupplementaries("zzzabcdzzzabcddzzzabcdzzz");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3286
        p = Pattern.compile(toSupplementaries("(ab)(cd*)"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3287
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3288
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3289
        try {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3290
            m.appendReplacement(result, "$1");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3291
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3292
        } catch (IllegalStateException e) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3293
        }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3294
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3295
        m.appendReplacement(result, "$1");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3296
        if (!result.toString().equals(toSupplementaries("zzzab")))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3297
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3298
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3299
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3300
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3301
        m.appendReplacement(result, "$2");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3302
        if (!result.toString().equals(toSupplementaries("zzzabzzzabcddzzzcd")))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3303
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3304
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3305
        m.appendTail(result);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3306
        if (!result.toString().equals(toSupplementaries("zzzabzzzabcddzzzcdzzz")))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3307
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3308
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3309
        // Check to make sure escaped $ is ignored
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3310
        blah = toSupplementaries("zzzabcdcdefzzz");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3311
        p = Pattern.compile(toSupplementaries("(ab)(cd)*(ef)"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3312
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3313
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3314
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3315
        m.appendReplacement(result, toSupplementaries("$1w\\$2w$3"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3316
        if (!result.toString().equals(toSupplementaries("zzzabw$2wef")))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3317
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3318
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3319
        m.appendTail(result);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3320
        if (!result.toString().equals(toSupplementaries("zzzabw$2wefzzz")))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3321
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3322
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3323
        // Check to make sure a reference to nonexistent group causes error
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3324
        blah = toSupplementaries("zzzabcdcdefzzz");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3325
        p = Pattern.compile(toSupplementaries("(ab)(cd)*(ef)"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3326
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3327
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3328
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3329
        try {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3330
            m.appendReplacement(result, toSupplementaries("$1w$5w$3"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3331
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3332
        } catch (IndexOutOfBoundsException ioobe) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3333
            // Correct result
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3334
        }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3335
        // Check double digit group references
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3336
        blah = toSupplementaries("zzz123456789101112zzz");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3337
        p = Pattern.compile("(1)(2)(3)(4)(5)(6)(7)(8)(9)(10)(11)");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3338
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3339
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3340
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3341
        m.appendReplacement(result, toSupplementaries("$1w$11w$3"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3342
        if (!result.toString().equals(toSupplementaries("zzz1w11w3")))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3343
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3344
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3345
        // Check to make sure it backs off $15 to $1 if only three groups
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3346
        blah = toSupplementaries("zzzabcdcdefzzz");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3347
        p = Pattern.compile(toSupplementaries("(ab)(cd)*(ef)"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3348
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3349
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3350
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3351
        m.appendReplacement(result, toSupplementaries("$1w$15w$3"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3352
        if (!result.toString().equals(toSupplementaries("zzzabwab5wef")))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3353
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3354
        // Check nothing has been appended into the output buffer if
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3355
        // the replacement string triggers IllegalArgumentException.
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3356
        p = Pattern.compile("(abc)");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3357
        m = p.matcher("abcd");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3358
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3359
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3360
        try {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3361
            m.appendReplacement(result, ("xyz$g"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3362
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3363
        } catch (IllegalArgumentException iae) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3364
            if (result.length() != 0)
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3365
                failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3366
        }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3367
        report("SB Substitution 2");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3368
    }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3369
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3370
    /*
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3371
     * 5 groups of characters are created to make a substitution string.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3372
     * A base string will be created including random lead chars, the
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3373
     * substitution string, and random trailing chars.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3374
     * A pattern containing the 5 groups is searched for and replaced with:
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3375
     * random group + random string + random group.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3376
     * The results are checked for correctness.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3377
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3378
    private static void substitutionBasher() {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3379
        for (int runs = 0; runs<1000; runs++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3380
            // Create a base string to work in
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3381
            int leadingChars = generator.nextInt(10);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3382
            StringBuffer baseBuffer = new StringBuffer(100);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3383
            String leadingString = getRandomAlphaString(leadingChars);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3384
            baseBuffer.append(leadingString);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3385
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3386
            // Create 5 groups of random number of random chars
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3387
            // Create the string to substitute
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3388
            // Create the pattern string to search for
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3389
            StringBuffer bufferToSub = new StringBuffer(25);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3390
            StringBuffer bufferToPat = new StringBuffer(50);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3391
            String[] groups = new String[5];
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3392
            for(int i=0; i<5; i++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3393
                int aGroupSize = generator.nextInt(5)+1;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3394
                groups[i] = getRandomAlphaString(aGroupSize);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3395
                bufferToSub.append(groups[i]);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3396
                bufferToPat.append('(');
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3397
                bufferToPat.append(groups[i]);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3398
                bufferToPat.append(')');
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3399
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3400
            String stringToSub = bufferToSub.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3401
            String pattern = bufferToPat.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3402
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3403
            // Place sub string into working string at random index
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3404
            baseBuffer.append(stringToSub);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3405
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3406
            // Append random chars to end
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3407
            int trailingChars = generator.nextInt(10);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3408
            String trailingString = getRandomAlphaString(trailingChars);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3409
            baseBuffer.append(trailingString);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3410
            String baseString = baseBuffer.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3411
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3412
            // Create test pattern and matcher
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3413
            Pattern p = Pattern.compile(pattern);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3414
            Matcher m = p.matcher(baseString);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3415
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3416
            // Reject candidate if pattern happens to start early
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3417
            m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3418
            if (m.start() < leadingChars)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3419
                continue;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3420
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3421
            // Reject candidate if more than one match
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3422
            if (m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3423
                continue;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3424
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3425
            // Construct a replacement string with :
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3426
            // random group + random string + random group
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3427
            StringBuffer bufferToRep = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3428
            int groupIndex1 = generator.nextInt(5);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3429
            bufferToRep.append("$" + (groupIndex1 + 1));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3430
            String randomMidString = getRandomAlphaString(5);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3431
            bufferToRep.append(randomMidString);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3432
            int groupIndex2 = generator.nextInt(5);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3433
            bufferToRep.append("$" + (groupIndex2 + 1));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3434
            String replacement = bufferToRep.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3435
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3436
            // Do the replacement
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3437
            String result = m.replaceAll(replacement);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3438
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3439
            // Construct expected result
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3440
            StringBuffer bufferToRes = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3441
            bufferToRes.append(leadingString);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3442
            bufferToRes.append(groups[groupIndex1]);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3443
            bufferToRes.append(randomMidString);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3444
            bufferToRes.append(groups[groupIndex2]);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3445
            bufferToRes.append(trailingString);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3446
            String expectedResult = bufferToRes.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3447
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3448
            // Check results
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3449
            if (!result.equals(expectedResult))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3450
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3451
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3452
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3453
        report("Substitution Basher");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3454
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3455
23734
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3456
    /*
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3457
     * 5 groups of characters are created to make a substitution string.
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3458
     * A base string will be created including random lead chars, the
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3459
     * substitution string, and random trailing chars.
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3460
     * A pattern containing the 5 groups is searched for and replaced with:
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3461
     * random group + random string + random group.
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3462
     * The results are checked for correctness.
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3463
     */
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3464
    private static void substitutionBasher2() {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3465
        for (int runs = 0; runs<1000; runs++) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3466
            // Create a base string to work in
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3467
            int leadingChars = generator.nextInt(10);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3468
            StringBuilder baseBuffer = new StringBuilder(100);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3469
            String leadingString = getRandomAlphaString(leadingChars);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3470
            baseBuffer.append(leadingString);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3471
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3472
            // Create 5 groups of random number of random chars
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3473
            // Create the string to substitute
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3474
            // Create the pattern string to search for
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3475
            StringBuilder bufferToSub = new StringBuilder(25);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3476
            StringBuilder bufferToPat = new StringBuilder(50);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3477
            String[] groups = new String[5];
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3478
            for(int i=0; i<5; i++) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3479
                int aGroupSize = generator.nextInt(5)+1;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3480
                groups[i] = getRandomAlphaString(aGroupSize);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3481
                bufferToSub.append(groups[i]);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3482
                bufferToPat.append('(');
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3483
                bufferToPat.append(groups[i]);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3484
                bufferToPat.append(')');
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3485
            }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3486
            String stringToSub = bufferToSub.toString();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3487
            String pattern = bufferToPat.toString();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3488
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3489
            // Place sub string into working string at random index
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3490
            baseBuffer.append(stringToSub);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3491
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3492
            // Append random chars to end
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3493
            int trailingChars = generator.nextInt(10);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3494
            String trailingString = getRandomAlphaString(trailingChars);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3495
            baseBuffer.append(trailingString);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3496
            String baseString = baseBuffer.toString();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3497
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3498
            // Create test pattern and matcher
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3499
            Pattern p = Pattern.compile(pattern);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3500
            Matcher m = p.matcher(baseString);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3501
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3502
            // Reject candidate if pattern happens to start early
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3503
            m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3504
            if (m.start() < leadingChars)
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3505
                continue;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3506
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3507
            // Reject candidate if more than one match
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3508
            if (m.find())
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3509
                continue;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3510
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3511
            // Construct a replacement string with :
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3512
            // random group + random string + random group
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3513
            StringBuilder bufferToRep = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3514
            int groupIndex1 = generator.nextInt(5);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3515
            bufferToRep.append("$" + (groupIndex1 + 1));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3516
            String randomMidString = getRandomAlphaString(5);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3517
            bufferToRep.append(randomMidString);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3518
            int groupIndex2 = generator.nextInt(5);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3519
            bufferToRep.append("$" + (groupIndex2 + 1));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3520
            String replacement = bufferToRep.toString();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3521
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3522
            // Do the replacement
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3523
            String result = m.replaceAll(replacement);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3524
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3525
            // Construct expected result
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3526
            StringBuilder bufferToRes = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3527
            bufferToRes.append(leadingString);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3528
            bufferToRes.append(groups[groupIndex1]);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3529
            bufferToRes.append(randomMidString);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3530
            bufferToRes.append(groups[groupIndex2]);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3531
            bufferToRes.append(trailingString);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3532
            String expectedResult = bufferToRes.toString();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3533
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3534
            // Check results
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3535
            if (!result.equals(expectedResult)) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3536
                failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3537
            }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3538
        }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3539
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3540
        report("Substitution Basher 2");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3541
    }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3542
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3543
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3544
     * Checks the handling of some escape sequences that the Pattern
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3545
     * class should process instead of the java compiler. These are
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3546
     * not in the file because the escapes should be be processed
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3547
     * by the Pattern class when the regex is compiled.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3548
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3549
    private static void escapes() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3550
        Pattern p = Pattern.compile("\\043");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3551
        Matcher m = p.matcher("#");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3552
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3553
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3554
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3555
        p = Pattern.compile("\\x23");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3556
        m = p.matcher("#");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3557
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3558
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3559
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3560
        p = Pattern.compile("\\u0023");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3561
        m = p.matcher("#");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3562
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3563
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3564
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3565
        report("Escape sequences");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3566
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3567
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3568
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3569
     * Checks the handling of blank input situations. These
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3570
     * tests are incompatible with my test file format.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3571
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3572
    private static void blankInput() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3573
        Pattern p = Pattern.compile("abc", Pattern.CASE_INSENSITIVE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3574
        Matcher m = p.matcher("");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3575
        if (m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3576
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3577
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3578
        p = Pattern.compile("a*", Pattern.CASE_INSENSITIVE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3579
        m = p.matcher("");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3580
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3581
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3582
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3583
        p = Pattern.compile("abc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3584
        m = p.matcher("");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3585
        if (m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3586
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3587
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3588
        p = Pattern.compile("a*");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3589
        m = p.matcher("");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3590
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3591
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3592
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3593
        report("Blank input");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3594
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3595
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3596
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3597
     * Tests the Boyer-Moore pattern matching of a character sequence
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3598
     * on randomly generated patterns.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3599
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3600
    private static void bm() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3601
        doBnM('a');
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3602
        report("Boyer Moore (ASCII)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3603
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3604
        doBnM(Character.MIN_SUPPLEMENTARY_CODE_POINT - 10);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3605
        report("Boyer Moore (Supplementary)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3606
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3607
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3608
    private static void doBnM(int baseCharacter) throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3609
        int achar=0;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3610
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3611
        for (int i=0; i<100; i++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3612
            // Create a short pattern to search for
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3613
            int patternLength = generator.nextInt(7) + 4;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3614
            StringBuffer patternBuffer = new StringBuffer(patternLength);
31645
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3615
            String pattern;
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3616
            retry: for (;;) {
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3617
                for (int x=0; x<patternLength; x++) {
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3618
                    int ch = baseCharacter + generator.nextInt(26);
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3619
                    if (Character.isSupplementaryCodePoint(ch)) {
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3620
                        patternBuffer.append(Character.toChars(ch));
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3621
                    } else {
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3622
                        patternBuffer.append((char)ch);
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3623
                    }
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3624
                }
31645
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3625
                pattern = patternBuffer.toString();
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3626
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3627
                // Avoid patterns that start and end with the same substring
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3628
                // See JDK-6854417
34436
33c20335507c 8143854: java/util/regex/RegExTest.java.RegExTest failed
sherman
parents: 31645
diff changeset
  3629
                for (int x=1; x < pattern.length(); x++) {
31645
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3630
                    if (pattern.startsWith(pattern.substring(x)))
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3631
                        continue retry;
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3632
                }
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3633
                break;
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3634
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3635
            Pattern p = Pattern.compile(pattern);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3636
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3637
            // Create a buffer with random ASCII chars that does
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3638
            // not match the sample
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3639
            String toSearch = null;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3640
            StringBuffer s = null;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3641
            Matcher m = p.matcher("");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3642
            do {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3643
                s = new StringBuffer(100);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3644
                for (int x=0; x<100; x++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3645
                    int ch = baseCharacter + generator.nextInt(26);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3646
                    if (Character.isSupplementaryCodePoint(ch)) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3647
                        s.append(Character.toChars(ch));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3648
                    } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3649
                        s.append((char)ch);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3650
                    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3651
                }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3652
                toSearch = s.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3653
                m.reset(toSearch);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3654
            } while (m.find());
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3655
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3656
            // Insert the pattern at a random spot
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3657
            int insertIndex = generator.nextInt(99);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3658
            if (Character.isLowSurrogate(s.charAt(insertIndex)))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3659
                insertIndex++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3660
            s = s.insert(insertIndex, pattern);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3661
            toSearch = s.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3662
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3663
            // Make sure that the pattern is found
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3664
            m.reset(toSearch);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3665
            if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3666
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3667
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3668
            // Make sure that the match text is the pattern
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3669
            if (!m.group().equals(pattern))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3670
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3671
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3672
            // Make sure match occured at insertion point
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3673
            if (m.start() != insertIndex)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3674
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3675
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3676
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3677
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3678
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3679
     * Tests the matching of slices on randomly generated patterns.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3680
     * The Boyer-Moore optimization is not done on these patterns
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3681
     * because it uses unicode case folding.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3682
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3683
    private static void slice() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3684
        doSlice(Character.MAX_VALUE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3685
        report("Slice");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3686
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3687
        doSlice(Character.MAX_CODE_POINT);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3688
        report("Slice (Supplementary)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3689
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3690
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3691
    private static void doSlice(int maxCharacter) throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3692
        Random generator = new Random();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3693
        int achar=0;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3694
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3695
        for (int i=0; i<100; i++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3696
            // Create a short pattern to search for
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3697
            int patternLength = generator.nextInt(7) + 4;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3698
            StringBuffer patternBuffer = new StringBuffer(patternLength);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3699
            for (int x=0; x<patternLength; x++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3700
                int randomChar = 0;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3701
                while (!Character.isLetterOrDigit(randomChar))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3702
                    randomChar = generator.nextInt(maxCharacter);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3703
                if (Character.isSupplementaryCodePoint(randomChar)) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3704
                    patternBuffer.append(Character.toChars(randomChar));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3705
                } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3706
                    patternBuffer.append((char) randomChar);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3707
                }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3708
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3709
            String pattern =  patternBuffer.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3710
            Pattern p = Pattern.compile(pattern, Pattern.UNICODE_CASE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3711
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3712
            // Create a buffer with random chars that does not match the sample
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3713
            String toSearch = null;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3714
            StringBuffer s = null;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3715
            Matcher m = p.matcher("");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3716
            do {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3717
                s = new StringBuffer(100);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3718
                for (int x=0; x<100; x++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3719
                    int randomChar = 0;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3720
                    while (!Character.isLetterOrDigit(randomChar))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3721
                        randomChar = generator.nextInt(maxCharacter);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3722
                    if (Character.isSupplementaryCodePoint(randomChar)) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3723
                        s.append(Character.toChars(randomChar));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3724
                    } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3725
                        s.append((char) randomChar);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3726
                    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3727
                }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3728
                toSearch = s.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3729
                m.reset(toSearch);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3730
            } while (m.find());
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3731
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3732
            // Insert the pattern at a random spot
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3733
            int insertIndex = generator.nextInt(99);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3734
            if (Character.isLowSurrogate(s.charAt(insertIndex)))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3735
                insertIndex++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3736
            s = s.insert(insertIndex, pattern);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3737
            toSearch = s.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3738
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3739
            // Make sure that the pattern is found
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3740
            m.reset(toSearch);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3741
            if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3742
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3743
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3744
            // Make sure that the match text is the pattern
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3745
            if (!m.group().equals(pattern))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3746
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3747
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3748
            // Make sure match occured at insertion point
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3749
            if (m.start() != insertIndex)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3750
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3751
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3752
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3753
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3754
    private static void explainFailure(String pattern, String data,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3755
                                       String expected, String actual) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3756
        System.err.println("----------------------------------------");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3757
        System.err.println("Pattern = "+pattern);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3758
        System.err.println("Data = "+data);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3759
        System.err.println("Expected = " + expected);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3760
        System.err.println("Actual   = " + actual);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3761
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3762
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3763
    private static void explainFailure(String pattern, String data,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3764
                                       Throwable t) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3765
        System.err.println("----------------------------------------");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3766
        System.err.println("Pattern = "+pattern);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3767
        System.err.println("Data = "+data);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3768
        t.printStackTrace(System.err);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3769
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3770
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3771
    // Testing examples from a file
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3772
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3773
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3774
     * Goes through the file "TestCases.txt" and creates many patterns
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3775
     * described in the file, matching the patterns against input lines in
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3776
     * the file, and comparing the results against the correct results
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3777
     * also found in the file. The file format is described in comments
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3778
     * at the head of the file.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3779
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3780
    private static void processFile(String fileName) throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3781
        File testCases = new File(System.getProperty("test.src", "."),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3782
                                  fileName);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3783
        FileInputStream in = new FileInputStream(testCases);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3784
        BufferedReader r = new BufferedReader(new InputStreamReader(in));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3785
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3786
        // Process next test case.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3787
        String aLine;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3788
        while((aLine = r.readLine()) != null) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3789
            // Read a line for pattern
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3790
            String patternString = grabLine(r);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3791
            Pattern p = null;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3792
            try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3793
                p = compileTestPattern(patternString);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3794
            } catch (PatternSyntaxException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3795
                String dataString = grabLine(r);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3796
                String expectedResult = grabLine(r);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3797
                if (expectedResult.startsWith("error"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3798
                    continue;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3799
                explainFailure(patternString, dataString, e);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3800
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3801
                continue;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3802
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3803
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3804
            // Read a line for input string
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3805
            String dataString = grabLine(r);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3806
            Matcher m = p.matcher(dataString);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3807
            StringBuffer result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3808
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3809
            // Check for IllegalStateExceptions before a match
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3810
            failCount += preMatchInvariants(m);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3811
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3812
            boolean found = m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3813
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3814
            if (found)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3815
                failCount += postTrueMatchInvariants(m);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3816
            else
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3817
                failCount += postFalseMatchInvariants(m);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3818
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3819
            if (found) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3820
                result.append("true ");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3821
                result.append(m.group(0) + " ");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3822
            } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3823
                result.append("false ");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3824
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3825
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3826
            result.append(m.groupCount());
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3827
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3828
            if (found) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3829
                for (int i=1; i<m.groupCount()+1; i++)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3830
                    if (m.group(i) != null)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3831
                        result.append(" " +m.group(i));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3832
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3833
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3834
            // Read a line for the expected result
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3835
            String expectedResult = grabLine(r);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3836
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3837
            if (!result.toString().equals(expectedResult)) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3838
                explainFailure(patternString, dataString, expectedResult, result.toString());
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3839
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3840
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3841
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3842
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3843
        report(fileName);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3844
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3845
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3846
    private static int preMatchInvariants(Matcher m) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3847
        int failCount = 0;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3848
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3849
            m.start();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3850
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3851
        } catch (IllegalStateException ise) {}
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3852
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3853
            m.end();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3854
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3855
        } catch (IllegalStateException ise) {}
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3856
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3857
            m.group();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3858
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3859
        } catch (IllegalStateException ise) {}
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3860
        return failCount;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3861
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3862
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3863
    private static int postFalseMatchInvariants(Matcher m) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3864
        int failCount = 0;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3865
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3866
            m.group();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3867
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3868
        } catch (IllegalStateException ise) {}
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3869
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3870
            m.start();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3871
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3872
        } catch (IllegalStateException ise) {}
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3873
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3874
            m.end();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3875
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3876
        } catch (IllegalStateException ise) {}
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3877
        return failCount;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3878
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3879
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3880
    private static int postTrueMatchInvariants(Matcher m) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3881
        int failCount = 0;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3882
        //assert(m.start() = m.start(0);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3883
        if (m.start() != m.start(0))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3884
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3885
        //assert(m.end() = m.end(0);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3886
        if (m.start() != m.start(0))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3887
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3888
        //assert(m.group() = m.group(0);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3889
        if (!m.group().equals(m.group(0)))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3890
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3891
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3892
            m.group(50);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3893
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3894
        } catch (IndexOutOfBoundsException ise) {}
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3895
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3896
        return failCount;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3897
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3898
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3899
    private static Pattern compileTestPattern(String patternString) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3900
        if (!patternString.startsWith("'")) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3901
            return Pattern.compile(patternString);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3902
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3903
        int break1 = patternString.lastIndexOf("'");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3904
        String flagString = patternString.substring(
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3905
                                          break1+1, patternString.length());
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3906
        patternString = patternString.substring(1, break1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3907
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3908
        if (flagString.equals("i"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3909
            return Pattern.compile(patternString, Pattern.CASE_INSENSITIVE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3910
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3911
        if (flagString.equals("m"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3912
            return Pattern.compile(patternString, Pattern.MULTILINE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3913
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3914
        return Pattern.compile(patternString);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3915
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3916
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3917
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3918
     * Reads a line from the input file. Keeps reading lines until a non
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3919
     * empty non comment line is read. If the line contains a \n then
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3920
     * these two characters are replaced by a newline char. If a \\uxxxx
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3921
     * sequence is read then the sequence is replaced by the unicode char.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3922
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3923
    private static String grabLine(BufferedReader r) throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3924
        int index = 0;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3925
        String line = r.readLine();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3926
        while (line.startsWith("//") || line.length() < 1)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3927
            line = r.readLine();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3928
        while ((index = line.indexOf("\\n")) != -1) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3929
            StringBuffer temp = new StringBuffer(line);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3930
            temp.replace(index, index+2, "\n");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3931
            line = temp.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3932
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3933
        while ((index = line.indexOf("\\u")) != -1) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3934
            StringBuffer temp = new StringBuffer(line);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3935
            String value = temp.substring(index+2, index+6);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3936
            char aChar = (char)Integer.parseInt(value, 16);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3937
            String unicodeChar = "" + aChar;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3938
            temp.replace(index, index+6, unicodeChar);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3939
            line = temp.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3940
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3941
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3942
        return line;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3943
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3944
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3945
    private static void check(Pattern p, String s, String g, String expected) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3946
        Matcher m = p.matcher(s);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3947
        m.find();
17434
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  3948
        if (!m.group(g).equals(expected) ||
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  3949
            s.charAt(m.start(g)) != expected.charAt(0) ||
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  3950
            s.charAt(m.end(g) - 1) != expected.charAt(expected.length() - 1))
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3951
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3952
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3953
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3954
    private static void checkReplaceFirst(String p, String s, String r, String expected)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3955
    {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3956
        if (!expected.equals(Pattern.compile(p)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3957
                                    .matcher(s)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3958
                                    .replaceFirst(r)))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3959
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3960
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3961
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3962
    private static void checkReplaceAll(String p, String s, String r, String expected)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3963
    {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3964
        if (!expected.equals(Pattern.compile(p)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3965
                                    .matcher(s)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3966
                                    .replaceAll(r)))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3967
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3968
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3969
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3970
    private static void checkExpectedFail(String p) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3971
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3972
            Pattern.compile(p);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3973
        } catch (PatternSyntaxException pse) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3974
            //pse.printStackTrace();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3975
            return;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3976
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3977
        failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3978
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3979
17434
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  3980
    private static void checkExpectedIAE(Matcher m, String g) {
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3981
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3982
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3983
            m.group(g);
17434
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  3984
        } catch (IllegalArgumentException x) {
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3985
            //iae.printStackTrace();
17434
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  3986
            try {
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  3987
                m.start(g);
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  3988
            } catch (IllegalArgumentException xx) {
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  3989
                try {
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  3990
                    m.start(g);
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  3991
                } catch (IllegalArgumentException xxx) {
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  3992
                    return;
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  3993
                }
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  3994
            }
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3995
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3996
        failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3997
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3998
17434
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  3999
    private static void checkExpectedNPE(Matcher m) {
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4000
        m.find();
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4001
        try {
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4002
            m.group(null);
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4003
        } catch (NullPointerException x) {
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4004
            try {
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4005
                m.start(null);
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4006
            } catch (NullPointerException xx) {
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4007
                try {
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4008
                    m.end(null);
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4009
                } catch (NullPointerException xxx) {
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4010
                    return;
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4011
                }
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4012
            }
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4013
        }
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4014
        failCount++;
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4015
    }
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4016
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4017
    private static void namedGroupCaptureTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4018
        check(Pattern.compile("x+(?<gname>y+)z+"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4019
              "xxxyyyzzz",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4020
              "gname",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4021
              "yyy");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4022
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4023
        check(Pattern.compile("x+(?<gname8>y+)z+"),
2290
3a3bde061968 6817475: named-capturing group name started with digit causes PSE exception
sherman
parents: 2070
diff changeset
  4024
              "xxxyyyzzz",
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4025
              "gname8",
2290
3a3bde061968 6817475: named-capturing group name started with digit causes PSE exception
sherman
parents: 2070
diff changeset
  4026
              "yyy");
3a3bde061968 6817475: named-capturing group name started with digit causes PSE exception
sherman
parents: 2070
diff changeset
  4027
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4028
        //backref
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4029
        Pattern pattern = Pattern.compile("(a*)bc\\1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4030
        check(pattern, "zzzaabcazzz", true);  // found "abca"
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4031
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4032
        check(Pattern.compile("(?<gname>a*)bc\\k<gname>"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4033
              "zzzaabcaazzz", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4034
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4035
        check(Pattern.compile("(?<gname>abc)(def)\\k<gname>"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4036
              "abcdefabc", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4037
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4038
        check(Pattern.compile("(a)(b)(c)(d)(e)(f)(g)(h)(i)(j)(?<gname>k)\\k<gname>"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4039
              "abcdefghijkk", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4040
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4041
        // Supplementary character tests
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4042
        check(Pattern.compile("(?<gname>" + toSupplementaries("a*)bc") + "\\k<gname>"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4043
              toSupplementaries("zzzaabcazzz"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4044
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4045
        check(Pattern.compile("(?<gname>" + toSupplementaries("a*)bc") + "\\k<gname>"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4046
              toSupplementaries("zzzaabcaazzz"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4047
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4048
        check(Pattern.compile("(?<gname>" + toSupplementaries("abc)(def)") + "\\k<gname>"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4049
              toSupplementaries("abcdefabc"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4050
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4051
        check(Pattern.compile(toSupplementaries("(a)(b)(c)(d)(e)(f)(g)(h)(i)(j)") +
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4052
                              "(?<gname>" +
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4053
                              toSupplementaries("k)") + "\\k<gname>"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4054
              toSupplementaries("abcdefghijkk"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4055
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4056
        check(Pattern.compile("x+(?<gname>y+)z+\\k<gname>"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4057
              "xxxyyyzzzyyy",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4058
              "gname",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4059
              "yyy");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4060
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4061
        //replaceFirst/All
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4062
        checkReplaceFirst("(?<gn>ab)(c*)",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4063
                          "abccczzzabcczzzabccc",
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4064
                          "${gn}",
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4065
                          "abzzzabcczzzabccc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4066
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4067
        checkReplaceAll("(?<gn>ab)(c*)",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4068
                        "abccczzzabcczzzabccc",
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4069
                        "${gn}",
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4070
                        "abzzzabzzzab");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4071
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4072
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4073
        checkReplaceFirst("(?<gn>ab)(c*)",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4074
                          "zzzabccczzzabcczzzabccczzz",
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4075
                          "${gn}",
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4076
                          "zzzabzzzabcczzzabccczzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4077
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4078
        checkReplaceAll("(?<gn>ab)(c*)",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4079
                        "zzzabccczzzabcczzzabccczzz",
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4080
                        "${gn}",
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4081
                        "zzzabzzzabzzzabzzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4082
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4083
        checkReplaceFirst("(?<gn1>ab)(?<gn2>c*)",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4084
                          "zzzabccczzzabcczzzabccczzz",
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4085
                          "${gn2}",
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4086
                          "zzzccczzzabcczzzabccczzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4087
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4088
        checkReplaceAll("(?<gn1>ab)(?<gn2>c*)",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4089
                        "zzzabccczzzabcczzzabccczzz",
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4090
                        "${gn2}",
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4091
                        "zzzccczzzcczzzccczzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4092
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4093
        //toSupplementaries("(ab)(c*)"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4094
        checkReplaceFirst("(?<gn1>" + toSupplementaries("ab") +
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4095
                           ")(?<gn2>" + toSupplementaries("c") + "*)",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4096
                          toSupplementaries("abccczzzabcczzzabccc"),
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4097
                          "${gn1}",
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4098
                          toSupplementaries("abzzzabcczzzabccc"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4099
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4100
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4101
        checkReplaceAll("(?<gn1>" + toSupplementaries("ab") +
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4102
                        ")(?<gn2>" + toSupplementaries("c") + "*)",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4103
                        toSupplementaries("abccczzzabcczzzabccc"),
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4104
                        "${gn1}",
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4105
                        toSupplementaries("abzzzabzzzab"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4106
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4107
        checkReplaceFirst("(?<gn1>" + toSupplementaries("ab") +
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4108
                           ")(?<gn2>" + toSupplementaries("c") + "*)",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4109
                          toSupplementaries("abccczzzabcczzzabccc"),
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4110
                          "${gn2}",
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4111
                          toSupplementaries("ccczzzabcczzzabccc"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4112
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4113
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4114
        checkReplaceAll("(?<gn1>" + toSupplementaries("ab") +
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4115
                        ")(?<gn2>" + toSupplementaries("c") + "*)",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4116
                        toSupplementaries("abccczzzabcczzzabccc"),
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4117
                        "${gn2}",
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4118
                        toSupplementaries("ccczzzcczzzccc"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4119
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4120
        checkReplaceFirst("(?<dog>Dog)AndCat",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4121
                          "zzzDogAndCatzzzDogAndCatzzz",
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4122
                          "${dog}",
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4123
                          "zzzDogzzzDogAndCatzzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4124
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4125
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4126
        checkReplaceAll("(?<dog>Dog)AndCat",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4127
                          "zzzDogAndCatzzzDogAndCatzzz",
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4128
                          "${dog}",
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4129
                          "zzzDogzzzDogzzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4130
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4131
        // backref in Matcher & String
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4132
        if (!"abcdefghij".replaceFirst("cd(?<gn>ef)gh", "${gn}").equals("abefij") ||
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4133
            !"abbbcbdbefgh".replaceAll("(?<gn>[a-e])b", "${gn}").equals("abcdefgh"))
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4134
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4135
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4136
        // negative
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4137
        checkExpectedFail("(?<groupnamehasnoascii.in>abc)(def)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4138
        checkExpectedFail("(?<groupnamehasnoascii_in>abc)(def)");
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4139
        checkExpectedFail("(?<6groupnamestartswithdigit>abc)(def)");
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4140
        checkExpectedFail("(?<gname>abc)(def)\\k<gnameX>");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4141
        checkExpectedFail("(?<gname>abc)(?<gname>def)\\k<gnameX>");
17434
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4142
        checkExpectedIAE(Pattern.compile("(?<gname>abc)(def)").matcher("abcdef"),
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4143
                         "gnameX");
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4144
        checkExpectedNPE(Pattern.compile("(?<gname>abc)(def)").matcher("abcdef"));
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4145
        report("NamedGroupCapture");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4146
    }
4820
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4147
37882
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4148
    // This is for bug 6919132
4820
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4149
    private static void nonBmpClassComplementTest() throws Exception {
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4150
        Pattern p = Pattern.compile("\\P{Lu}");
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4151
        Matcher m = p.matcher(new String(new int[] {0x1d400}, 0, 1));
37882
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4152
4820
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4153
        if (m.find() && m.start() == 1)
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4154
            failCount++;
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4155
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4156
        // from a unicode category
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4157
        p = Pattern.compile("\\P{Lu}");
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4158
        m = p.matcher(new String(new int[] {0x1d400}, 0, 1));
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4159
        if (m.find())
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4160
            failCount++;
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4161
        if (!m.hitEnd())
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4162
            failCount++;
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4163
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4164
        // block
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4165
        p = Pattern.compile("\\P{InMathematicalAlphanumericSymbols}");
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4166
        m = p.matcher(new String(new int[] {0x1d400}, 0, 1));
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4167
        if (m.find() && m.start() == 1)
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4168
            failCount++;
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4169
37882
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4170
        p = Pattern.compile("\\P{sc=GRANTHA}");
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4171
        m = p.matcher(new String(new int[] {0x11350}, 0, 1));
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4172
        if (m.find() && m.start() == 1)
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4173
            failCount++;
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4174
4820
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4175
        report("NonBmpClassComplement");
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4176
    }
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4177
5610
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4178
    private static void unicodePropertiesTest() throws Exception {
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4179
        // different forms
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4180
        if (!Pattern.compile("\\p{IsLu}").matcher("A").matches() ||
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4181
            !Pattern.compile("\\p{Lu}").matcher("A").matches() ||
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4182
            !Pattern.compile("\\p{gc=Lu}").matcher("A").matches() ||
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4183
            !Pattern.compile("\\p{general_category=Lu}").matcher("A").matches() ||
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4184
            !Pattern.compile("\\p{IsLatin}").matcher("B").matches() ||
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4185
            !Pattern.compile("\\p{sc=Latin}").matcher("B").matches() ||
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4186
            !Pattern.compile("\\p{script=Latin}").matcher("B").matches() ||
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4187
            !Pattern.compile("\\p{InBasicLatin}").matcher("c").matches() ||
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4188
            !Pattern.compile("\\p{blk=BasicLatin}").matcher("c").matches() ||
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4189
            !Pattern.compile("\\p{block=BasicLatin}").matcher("c").matches())
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4190
            failCount++;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4191
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4192
        Matcher common  = Pattern.compile("\\p{script=Common}").matcher("");
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4193
        Matcher unknown = Pattern.compile("\\p{IsUnknown}").matcher("");
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4194
        Matcher lastSM  = common;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4195
        Character.UnicodeScript lastScript = Character.UnicodeScript.of(0);
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4196
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4197
        Matcher latin  = Pattern.compile("\\p{block=basic_latin}").matcher("");
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4198
        Matcher greek  = Pattern.compile("\\p{InGreek}").matcher("");
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4199
        Matcher lastBM = latin;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4200
        Character.UnicodeBlock lastBlock = Character.UnicodeBlock.of(0);
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4201
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4202
        for (int cp = 1; cp < Character.MAX_CODE_POINT; cp++) {
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4203
            if (cp >= 0x30000 && (cp & 0x70) == 0){
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4204
                continue;  // only pick couple code points, they are the same
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4205
            }
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4206
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4207
            // Unicode Script
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4208
            Character.UnicodeScript script = Character.UnicodeScript.of(cp);
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4209
            Matcher m;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4210
            String str = new String(Character.toChars(cp));
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4211
            if (script == lastScript) {
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4212
                 m = lastSM;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4213
                 m.reset(str);
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4214
            } else {
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4215
                 m  = Pattern.compile("\\p{Is" + script.name() + "}").matcher(str);
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4216
            }
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4217
            if (!m.matches()) {
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4218
                failCount++;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4219
            }
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4220
            Matcher other = (script == Character.UnicodeScript.COMMON)? unknown : common;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4221
            other.reset(str);
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4222
            if (other.matches()) {
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4223
                failCount++;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4224
            }
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4225
            lastSM = m;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4226
            lastScript = script;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4227
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4228
            // Unicode Block
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4229
            Character.UnicodeBlock block = Character.UnicodeBlock.of(cp);
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4230
            if (block == null) {
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4231
                //System.out.printf("Not a Block: cp=%x%n", cp);
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4232
                continue;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4233
            }
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4234
            if (block == lastBlock) {
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4235
                 m = lastBM;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4236
                 m.reset(str);
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4237
            } else {
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4238
                 m  = Pattern.compile("\\p{block=" + block.toString() + "}").matcher(str);
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4239
            }
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4240
            if (!m.matches()) {
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4241
                failCount++;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4242
            }
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4243
            other = (block == Character.UnicodeBlock.BASIC_LATIN)? greek : latin;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4244
            other.reset(str);
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4245
            if (other.matches()) {
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4246
                failCount++;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4247
            }
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4248
            lastBM = m;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4249
            lastBlock = block;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4250
        }
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4251
        report("unicodeProperties");
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4252
    }
8173
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4253
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4254
    private static void unicodeHexNotationTest() throws Exception {
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4255
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4256
        // negative
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4257
        checkExpectedFail("\\x{-23}");
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4258
        checkExpectedFail("\\x{110000}");
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4259
        checkExpectedFail("\\x{}");
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4260
        checkExpectedFail("\\x{AB[ef]");
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4261
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4262
        // codepoint
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4263
        check("^\\x{1033c}$",              "\uD800\uDF3C", true);
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4264
        check("^\\xF0\\x90\\x8C\\xBC$",    "\uD800\uDF3C", false);
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4265
        check("^\\x{D800}\\x{DF3c}+$",     "\uD800\uDF3C", false);
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4266
        check("^\\xF0\\x90\\x8C\\xBC$",    "\uD800\uDF3C", false);
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4267
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4268
        // in class
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4269
        check("^[\\x{D800}\\x{DF3c}]+$",   "\uD800\uDF3C", false);
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4270
        check("^[\\xF0\\x90\\x8C\\xBC]+$", "\uD800\uDF3C", false);
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4271
        check("^[\\x{D800}\\x{DF3C}]+$",   "\uD800\uDF3C", false);
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4272
        check("^[\\x{DF3C}\\x{D800}]+$",   "\uD800\uDF3C", false);
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4273
        check("^[\\x{D800}\\x{DF3C}]+$",   "\uDF3C\uD800", true);
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4274
        check("^[\\x{DF3C}\\x{D800}]+$",   "\uDF3C\uD800", true);
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4275
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4276
        for (int cp = 0; cp <= 0x10FFFF; cp++) {
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4277
             String s = "A" + new String(Character.toChars(cp)) + "B";
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4278
             String hexUTF16 = (cp <= 0xFFFF)? String.format("\\u%04x", cp)
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4279
                                             : String.format("\\u%04x\\u%04x",
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4280
                                               (int) Character.toChars(cp)[0],
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4281
                                               (int) Character.toChars(cp)[1]);
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4282
             String hexCodePoint = "\\x{" + Integer.toHexString(cp) + "}";
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4283
             if (!Pattern.matches("A" + hexUTF16 + "B", s))
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4284
                 failCount++;
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4285
             if (!Pattern.matches("A[" + hexUTF16 + "]B", s))
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4286
                 failCount++;
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4287
             if (!Pattern.matches("A" + hexCodePoint + "B", s))
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4288
                 failCount++;
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4289
             if (!Pattern.matches("A[" + hexCodePoint + "]B", s))
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4290
                 failCount++;
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4291
         }
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4292
         report("unicodeHexNotation");
9536
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4293
    }
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4294
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4295
    private static void unicodeClassesTest() throws Exception {
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4296
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4297
        Matcher lower  = Pattern.compile("\\p{Lower}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4298
        Matcher upper  = Pattern.compile("\\p{Upper}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4299
        Matcher ASCII  = Pattern.compile("\\p{ASCII}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4300
        Matcher alpha  = Pattern.compile("\\p{Alpha}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4301
        Matcher digit  = Pattern.compile("\\p{Digit}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4302
        Matcher alnum  = Pattern.compile("\\p{Alnum}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4303
        Matcher punct  = Pattern.compile("\\p{Punct}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4304
        Matcher graph  = Pattern.compile("\\p{Graph}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4305
        Matcher print  = Pattern.compile("\\p{Print}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4306
        Matcher blank  = Pattern.compile("\\p{Blank}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4307
        Matcher cntrl  = Pattern.compile("\\p{Cntrl}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4308
        Matcher xdigit = Pattern.compile("\\p{XDigit}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4309
        Matcher space  = Pattern.compile("\\p{Space}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4310
        Matcher bound  = Pattern.compile("\\b").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4311
        Matcher word   = Pattern.compile("\\w++").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4312
        // UNICODE_CHARACTER_CLASS
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4313
        Matcher lowerU  = Pattern.compile("\\p{Lower}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4314
        Matcher upperU  = Pattern.compile("\\p{Upper}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4315
        Matcher ASCIIU  = Pattern.compile("\\p{ASCII}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4316
        Matcher alphaU  = Pattern.compile("\\p{Alpha}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4317
        Matcher digitU  = Pattern.compile("\\p{Digit}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4318
        Matcher alnumU  = Pattern.compile("\\p{Alnum}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4319
        Matcher punctU  = Pattern.compile("\\p{Punct}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4320
        Matcher graphU  = Pattern.compile("\\p{Graph}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4321
        Matcher printU  = Pattern.compile("\\p{Print}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4322
        Matcher blankU  = Pattern.compile("\\p{Blank}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4323
        Matcher cntrlU  = Pattern.compile("\\p{Cntrl}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4324
        Matcher xdigitU = Pattern.compile("\\p{XDigit}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4325
        Matcher spaceU  = Pattern.compile("\\p{Space}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4326
        Matcher boundU  = Pattern.compile("\\b", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4327
        Matcher wordU   = Pattern.compile("\\w", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4328
        // embedded flag (?U)
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4329
        Matcher lowerEU  = Pattern.compile("(?U)\\p{Lower}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4330
        Matcher graphEU  = Pattern.compile("(?U)\\p{Graph}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4331
        Matcher wordEU   = Pattern.compile("(?U)\\w", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4332
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4333
        Matcher bwb    = Pattern.compile("\\b\\w\\b").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4334
        Matcher bwbU   = Pattern.compile("\\b\\w++\\b", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4335
        Matcher bwbEU  = Pattern.compile("(?U)\\b\\w++\\b", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4336
        // properties
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4337
        Matcher lowerP  = Pattern.compile("\\p{IsLowerCase}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4338
        Matcher upperP  = Pattern.compile("\\p{IsUpperCase}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4339
        Matcher titleP  = Pattern.compile("\\p{IsTitleCase}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4340
        Matcher letterP = Pattern.compile("\\p{IsLetter}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4341
        Matcher alphaP  = Pattern.compile("\\p{IsAlphabetic}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4342
        Matcher ideogP  = Pattern.compile("\\p{IsIdeographic}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4343
        Matcher cntrlP  = Pattern.compile("\\p{IsControl}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4344
        Matcher spaceP  = Pattern.compile("\\p{IsWhiteSpace}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4345
        Matcher definedP = Pattern.compile("\\p{IsAssigned}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4346
        Matcher nonCCPP = Pattern.compile("\\p{IsNoncharacterCodePoint}").matcher("");
17434
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4347
        Matcher joinCrtl = Pattern.compile("\\p{IsJoinControl}").matcher("");
9536
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4348
        // javaMethod
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4349
        Matcher lowerJ  = Pattern.compile("\\p{javaLowerCase}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4350
        Matcher upperJ  = Pattern.compile("\\p{javaUpperCase}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4351
        Matcher alphaJ  = Pattern.compile("\\p{javaAlphabetic}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4352
        Matcher ideogJ  = Pattern.compile("\\p{javaIdeographic}").matcher("");
38450
516990ff3a4c 8143282: \p{Cn} unassigned code points should be included in \p{C}
sherman
parents: 37882
diff changeset
  4353
        // GC/C
516990ff3a4c 8143282: \p{Cn} unassigned code points should be included in \p{C}
sherman
parents: 37882
diff changeset
  4354
        Matcher gcC  = Pattern.compile("\\p{C}").matcher("");
9536
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4355
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4356
        for (int cp = 1; cp < 0x30000; cp++) {
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4357
            String str = new String(Character.toChars(cp));
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4358
            int type = Character.getType(cp);
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4359
            if (// lower
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4360
                POSIX_ASCII.isLower(cp)   != lower.reset(str).matches()  ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4361
                Character.isLowerCase(cp) != lowerU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4362
                Character.isLowerCase(cp) != lowerP.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4363
                Character.isLowerCase(cp) != lowerEU.reset(str).matches()||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4364
                Character.isLowerCase(cp) != lowerJ.reset(str).matches()||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4365
                // upper
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4366
                POSIX_ASCII.isUpper(cp)   != upper.reset(str).matches()  ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4367
                POSIX_Unicode.isUpper(cp) != upperU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4368
                Character.isUpperCase(cp) != upperP.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4369
                Character.isUpperCase(cp) != upperJ.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4370
                // alpha
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4371
                POSIX_ASCII.isAlpha(cp)   != alpha.reset(str).matches()  ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4372
                POSIX_Unicode.isAlpha(cp) != alphaU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4373
                Character.isAlphabetic(cp)!= alphaP.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4374
                Character.isAlphabetic(cp)!= alphaJ.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4375
                // digit
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4376
                POSIX_ASCII.isDigit(cp)   != digit.reset(str).matches()  ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4377
                Character.isDigit(cp)     != digitU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4378
                // alnum
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4379
                POSIX_ASCII.isAlnum(cp)   != alnum.reset(str).matches()  ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4380
                POSIX_Unicode.isAlnum(cp) != alnumU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4381
                // punct
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4382
                POSIX_ASCII.isPunct(cp)   != punct.reset(str).matches()  ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4383
                POSIX_Unicode.isPunct(cp) != punctU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4384
                // graph
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4385
                POSIX_ASCII.isGraph(cp)   != graph.reset(str).matches()  ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4386
                POSIX_Unicode.isGraph(cp) != graphU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4387
                POSIX_Unicode.isGraph(cp) != graphEU.reset(str).matches()||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4388
                // blank
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4389
                POSIX_ASCII.isType(cp, POSIX_ASCII.BLANK)
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4390
                                          != blank.reset(str).matches()  ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4391
                POSIX_Unicode.isBlank(cp) != blankU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4392
                // print
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4393
                POSIX_ASCII.isPrint(cp)   != print.reset(str).matches()  ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4394
                POSIX_Unicode.isPrint(cp) != printU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4395
                // cntrl
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4396
                POSIX_ASCII.isCntrl(cp)   != cntrl.reset(str).matches()  ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4397
                POSIX_Unicode.isCntrl(cp) != cntrlU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4398
                (Character.CONTROL == type) != cntrlP.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4399
                // hexdigit
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4400
                POSIX_ASCII.isHexDigit(cp)   != xdigit.reset(str).matches()  ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4401
                POSIX_Unicode.isHexDigit(cp) != xdigitU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4402
                // space
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4403
                POSIX_ASCII.isSpace(cp)   != space.reset(str).matches()  ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4404
                POSIX_Unicode.isSpace(cp) != spaceU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4405
                POSIX_Unicode.isSpace(cp) != spaceP.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4406
                // word
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4407
                POSIX_ASCII.isWord(cp)   != word.reset(str).matches()  ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4408
                POSIX_Unicode.isWord(cp) != wordU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4409
                POSIX_Unicode.isWord(cp) != wordEU.reset(str).matches()||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4410
                // bwordb
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4411
                POSIX_ASCII.isWord(cp) != bwb.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4412
                POSIX_Unicode.isWord(cp) != bwbU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4413
                // properties
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4414
                Character.isTitleCase(cp) != titleP.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4415
                Character.isLetter(cp)    != letterP.reset(str).matches()||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4416
                Character.isIdeographic(cp) != ideogP.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4417
                Character.isIdeographic(cp) != ideogJ.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4418
                (Character.UNASSIGNED == type) == definedP.reset(str).matches() ||
17434
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4419
                POSIX_Unicode.isNoncharacterCodePoint(cp) != nonCCPP.reset(str).matches() ||
38450
516990ff3a4c 8143282: \p{Cn} unassigned code points should be included in \p{C}
sherman
parents: 37882
diff changeset
  4420
                POSIX_Unicode.isJoinControl(cp) != joinCrtl.reset(str).matches() ||
516990ff3a4c 8143282: \p{Cn} unassigned code points should be included in \p{C}
sherman
parents: 37882
diff changeset
  4421
                // gc_C
516990ff3a4c 8143282: \p{Cn} unassigned code points should be included in \p{C}
sherman
parents: 37882
diff changeset
  4422
                (Character.CONTROL == type || Character.FORMAT == type ||
516990ff3a4c 8143282: \p{Cn} unassigned code points should be included in \p{C}
sherman
parents: 37882
diff changeset
  4423
                 Character.PRIVATE_USE == type || Character.SURROGATE == type ||
516990ff3a4c 8143282: \p{Cn} unassigned code points should be included in \p{C}
sherman
parents: 37882
diff changeset
  4424
                 Character.UNASSIGNED == type)
516990ff3a4c 8143282: \p{Cn} unassigned code points should be included in \p{C}
sherman
parents: 37882
diff changeset
  4425
                != gcC.reset(str).matches()) {
9536
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4426
                failCount++;
38450
516990ff3a4c 8143282: \p{Cn} unassigned code points should be included in \p{C}
sherman
parents: 37882
diff changeset
  4427
            }
9536
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4428
        }
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4429
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4430
        // bounds/word align
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4431
        twoFindIndexes(" \u0180sherman\u0400 ", bound, 1, 10);
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4432
        if (!bwbU.reset("\u0180sherman\u0400").matches())
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4433
            failCount++;
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4434
        twoFindIndexes(" \u0180sh\u0345erman\u0400 ", bound, 1, 11);
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4435
        if (!bwbU.reset("\u0180sh\u0345erman\u0400").matches())
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4436
            failCount++;
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4437
        twoFindIndexes(" \u0724\u0739\u0724 ", bound, 1, 4);
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4438
        if (!bwbU.reset("\u0724\u0739\u0724").matches())
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4439
            failCount++;
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4440
        if (!bwbEU.reset("\u0724\u0739\u0724").matches())
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4441
            failCount++;
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4442
        report("unicodePredefinedClasses");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4443
    }
12675
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4444
35783
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4445
    private static void unicodeCharacterNameTest() throws Exception {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4446
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4447
        for (int cp = 0; cp < Character.MAX_CODE_POINT; cp++) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4448
            if (!Character.isValidCodePoint(cp) ||
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4449
                Character.getType(cp) == Character.UNASSIGNED)
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4450
                continue;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4451
            String str = new String(Character.toChars(cp));
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4452
            // single
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4453
            String p = "\\N{" + Character.getName(cp) + "}";
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4454
            if (!Pattern.compile(p).matcher(str).matches()) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4455
                failCount++;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4456
            }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4457
            // class[c]
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4458
            p = "[\\N{" + Character.getName(cp) + "}]";
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4459
            if (!Pattern.compile(p).matcher(str).matches()) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4460
                failCount++;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4461
            }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4462
        }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4463
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4464
        // range
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4465
        for (int i = 0; i < 10; i++) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4466
            int start = generator.nextInt(20);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4467
            int end = start + generator.nextInt(200);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4468
            String p = "[\\N{" + Character.getName(start) + "}-\\N{" + Character.getName(end) + "}]";
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4469
            String str;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4470
            for (int cp = start; cp < end; cp++) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4471
                str = new String(Character.toChars(cp));
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4472
                if (!Pattern.compile(p).matcher(str).matches()) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4473
                    failCount++;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4474
                }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4475
            }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4476
            str = new String(Character.toChars(end + 10));
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4477
            if (Pattern.compile(p).matcher(str).matches()) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4478
                failCount++;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4479
            }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4480
        }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4481
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4482
        // slice
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4483
        for (int i = 0; i < 10; i++) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4484
            int n = generator.nextInt(256);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4485
            int[] buf = new int[n];
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4486
            StringBuffer sb = new StringBuffer(1024);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4487
            for (int j = 0; j < n; j++) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4488
                int cp = generator.nextInt(1000);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4489
                if (!Character.isValidCodePoint(cp) ||
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4490
                    Character.getType(cp) == Character.UNASSIGNED)
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4491
                    cp = 0x4e00;    // just use 4e00
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4492
                sb.append("\\N{" + Character.getName(cp) + "}");
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4493
                buf[j] = cp;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4494
            }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4495
            String p = sb.toString();
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4496
            String str = new String(buf, 0, buf.length);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4497
            if (!Pattern.compile(p).matcher(str).matches()) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4498
                failCount++;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4499
            }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4500
        }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4501
        report("unicodeCharacterName");
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4502
    }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4503
12675
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4504
    private static void horizontalAndVerticalWSTest() throws Exception {
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4505
        String hws = new String (new char[] {
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4506
                                     0x09, 0x20, 0xa0, 0x1680, 0x180e,
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4507
                                     0x2000, 0x2001, 0x2002, 0x2003, 0x2004, 0x2005,
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4508
                                     0x2006, 0x2007, 0x2008, 0x2009, 0x200a,
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4509
                                     0x202f, 0x205f, 0x3000 });
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4510
        String vws = new String (new char[] {
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4511
                                     0x0a, 0x0b, 0x0c, 0x0d, 0x85, 0x2028, 0x2029 });
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4512
        if (!Pattern.compile("\\h+").matcher(hws).matches() ||
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4513
            !Pattern.compile("[\\h]+").matcher(hws).matches())
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4514
            failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4515
        if (Pattern.compile("\\H").matcher(hws).find() ||
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4516
            Pattern.compile("[\\H]").matcher(hws).find())
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4517
            failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4518
        if (!Pattern.compile("\\v+").matcher(vws).matches() ||
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4519
            !Pattern.compile("[\\v]+").matcher(vws).matches())
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4520
            failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4521
        if (Pattern.compile("\\V").matcher(vws).find() ||
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4522
            Pattern.compile("[\\V]").matcher(vws).find())
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4523
            failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4524
        String prefix = "abcd";
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4525
        String suffix = "efgh";
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4526
        String ng = "A";
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4527
        for (int i = 0; i < hws.length(); i++) {
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4528
            String c = String.valueOf(hws.charAt(i));
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4529
            Matcher m = Pattern.compile("\\h").matcher(prefix + c + suffix);
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4530
            if (!m.find() || !c.equals(m.group()))
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4531
                failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4532
            m = Pattern.compile("[\\h]").matcher(prefix + c + suffix);
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4533
            if (!m.find() || !c.equals(m.group()))
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4534
                failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4535
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4536
            m = Pattern.compile("\\H").matcher(hws.substring(0, i) + ng + hws.substring(i));
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4537
            if (!m.find() || !ng.equals(m.group()))
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4538
                failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4539
            m = Pattern.compile("[\\H]").matcher(hws.substring(0, i) + ng + hws.substring(i));
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4540
            if (!m.find() || !ng.equals(m.group()))
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4541
                failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4542
        }
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4543
        for (int i = 0; i < vws.length(); i++) {
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4544
            String c = String.valueOf(vws.charAt(i));
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4545
            Matcher m = Pattern.compile("\\v").matcher(prefix + c + suffix);
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4546
            if (!m.find() || !c.equals(m.group()))
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4547
                failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4548
            m = Pattern.compile("[\\v]").matcher(prefix + c + suffix);
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4549
            if (!m.find() || !c.equals(m.group()))
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4550
                failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4551
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4552
            m = Pattern.compile("\\V").matcher(vws.substring(0, i) + ng + vws.substring(i));
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4553
            if (!m.find() || !ng.equals(m.group()))
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4554
                failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4555
            m = Pattern.compile("[\\V]").matcher(vws.substring(0, i) + ng + vws.substring(i));
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4556
            if (!m.find() || !ng.equals(m.group()))
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4557
                failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4558
        }
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4559
        // \v in range is interpreted as 0x0B. This is the undocumented behavior
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4560
        if (!Pattern.compile("[\\v-\\v]").matcher(String.valueOf((char)0x0B)).matches())
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4561
            failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4562
        report("horizontalAndVerticalWSTest");
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4563
    }
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4564
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4565
    private static void linebreakTest() throws Exception {
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4566
        String linebreaks = new String (new char[] {
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4567
            0x0A, 0x0B, 0x0C, 0x0D, 0x85, 0x2028, 0x2029 });
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4568
        String crnl = "\r\n";
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4569
        if (!Pattern.compile("\\R+").matcher(linebreaks).matches() ||
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4570
            !Pattern.compile("\\R").matcher(crnl).matches() ||
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4571
            Pattern.compile("\\R\\R").matcher(crnl).matches())
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4572
            failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4573
        report("linebreakTest");
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4574
    }
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4575
13554
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4576
    // #7189363
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4577
    private static void branchTest() throws Exception {
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4578
        if (!Pattern.compile("(a)?bc|d").matcher("d").find() ||     // greedy
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4579
            !Pattern.compile("(a)+bc|d").matcher("d").find() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4580
            !Pattern.compile("(a)*bc|d").matcher("d").find() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4581
            !Pattern.compile("(a)??bc|d").matcher("d").find() ||    // reluctant
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4582
            !Pattern.compile("(a)+?bc|d").matcher("d").find() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4583
            !Pattern.compile("(a)*?bc|d").matcher("d").find() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4584
            !Pattern.compile("(a)?+bc|d").matcher("d").find() ||    // possessive
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4585
            !Pattern.compile("(a)++bc|d").matcher("d").find() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4586
            !Pattern.compile("(a)*+bc|d").matcher("d").find() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4587
            !Pattern.compile("(a)?bc|d").matcher("d").matches() ||  // greedy
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4588
            !Pattern.compile("(a)+bc|d").matcher("d").matches() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4589
            !Pattern.compile("(a)*bc|d").matcher("d").matches() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4590
            !Pattern.compile("(a)??bc|d").matcher("d").matches() || // reluctant
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4591
            !Pattern.compile("(a)+?bc|d").matcher("d").matches() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4592
            !Pattern.compile("(a)*?bc|d").matcher("d").matches() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4593
            !Pattern.compile("(a)?+bc|d").matcher("d").matches() || // possessive
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4594
            !Pattern.compile("(a)++bc|d").matcher("d").matches() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4595
            !Pattern.compile("(a)*+bc|d").matcher("d").matches() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4596
            !Pattern.compile("(a)?bc|de").matcher("de").find() ||   // others
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4597
            !Pattern.compile("(a)??bc|de").matcher("de").find() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4598
            !Pattern.compile("(a)?bc|de").matcher("de").matches() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4599
            !Pattern.compile("(a)??bc|de").matcher("de").matches())
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4600
            failCount++;
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4601
        report("branchTest");
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4602
    }
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4603
17183
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4604
    // This test is for 8007395
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4605
    private static void groupCurlyNotFoundSuppTest() throws Exception {
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4606
        String input = "test this as \ud83d\ude0d";
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4607
        for (String pStr : new String[] { "test(.)+(@[a-zA-Z.]+)",
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4608
                                          "test(.)*(@[a-zA-Z.]+)",
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4609
                                          "test([^B])+(@[a-zA-Z.]+)",
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4610
                                          "test([^B])*(@[a-zA-Z.]+)",
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4611
                                          "test(\\P{IsControl})+(@[a-zA-Z.]+)",
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4612
                                          "test(\\P{IsControl})*(@[a-zA-Z.]+)",
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4613
                                        }) {
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4614
            Matcher m = Pattern.compile(pStr, Pattern.CASE_INSENSITIVE)
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4615
                               .matcher(input);
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4616
            try {
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4617
                if (m.find()) {
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4618
                    failCount++;
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4619
                }
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4620
            } catch (Exception x) {
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4621
                failCount++;
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4622
            }
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4623
        }
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4624
        report("GroupCurly NotFoundSupp");
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4625
    }
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4626
19604
f96e3aef2081 8023647: "abc1c".matches("(\\w)+1\\1")) returns false
sherman
parents: 17447
diff changeset
  4627
    // This test is for 8023647
f96e3aef2081 8023647: "abc1c".matches("(\\w)+1\\1")) returns false
sherman
parents: 17447
diff changeset
  4628
    private static void groupCurlyBackoffTest() throws Exception {
f96e3aef2081 8023647: "abc1c".matches("(\\w)+1\\1")) returns false
sherman
parents: 17447
diff changeset
  4629
        if (!"abc1c".matches("(\\w)+1\\1") ||
f96e3aef2081 8023647: "abc1c".matches("(\\w)+1\\1")) returns false
sherman
parents: 17447
diff changeset
  4630
            "abc11".matches("(\\w)+1\\1")) {
f96e3aef2081 8023647: "abc1c".matches("(\\w)+1\\1")) returns false
sherman
parents: 17447
diff changeset
  4631
            failCount++;
f96e3aef2081 8023647: "abc1c".matches("(\\w)+1\\1")) returns false
sherman
parents: 17447
diff changeset
  4632
        }
f96e3aef2081 8023647: "abc1c".matches("(\\w)+1\\1")) returns false
sherman
parents: 17447
diff changeset
  4633
        report("GroupCurly backoff");
f96e3aef2081 8023647: "abc1c".matches("(\\w)+1\\1")) returns false
sherman
parents: 17447
diff changeset
  4634
    }
f96e3aef2081 8023647: "abc1c".matches("(\\w)+1\\1")) returns false
sherman
parents: 17447
diff changeset
  4635
17447
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4636
    // This test is for 8012646
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4637
    private static void patternAsPredicate() throws Exception {
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4638
        Predicate<String> p = Pattern.compile("[a-z]+").asPredicate();
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4639
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4640
        if (p.test("")) {
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4641
            failCount++;
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4642
        }
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4643
        if (!p.test("word")) {
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4644
            failCount++;
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4645
        }
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4646
        if (p.test("1234")) {
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4647
            failCount++;
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4648
        }
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4649
        report("Pattern.asPredicate");
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4650
    }
25523
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4651
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4652
    // This test is for 8035975
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4653
    private static void invalidFlags() throws Exception {
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4654
        for (int flag = 1; flag != 0; flag <<= 1) {
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4655
            switch (flag) {
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4656
            case Pattern.CASE_INSENSITIVE:
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4657
            case Pattern.MULTILINE:
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4658
            case Pattern.DOTALL:
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4659
            case Pattern.UNICODE_CASE:
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4660
            case Pattern.CANON_EQ:
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4661
            case Pattern.UNIX_LINES:
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4662
            case Pattern.LITERAL:
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4663
            case Pattern.UNICODE_CHARACTER_CLASS:
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4664
            case Pattern.COMMENTS:
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4665
                // valid flag, continue
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4666
                break;
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4667
            default:
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4668
                try {
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4669
                    Pattern.compile(".", flag);
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4670
                    failCount++;
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4671
                } catch (IllegalArgumentException expected) {
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4672
                }
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4673
            }
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4674
        }
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4675
        report("Invalid compile flags");
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4676
    }
35783
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4677
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4678
    private static void grapheme() throws Exception {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4679
        Files.lines(Paths.get(System.getProperty("test.src", "."),
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4680
                              "GraphemeBreakTest.txt"))
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4681
            .filter( ln -> ln.length() != 0 && !ln.startsWith("#") )
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4682
            .forEach( ln -> {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4683
                    ln = ln.replaceAll("\\s+|\\([a-zA-Z]+\\)|\\[[a-zA-Z]]+\\]|#.*", "");
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4684
                    // System.out.println(str);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4685
                    String[] strs = ln.split("\u00f7|\u00d7");
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4686
                    StringBuilder src = new StringBuilder();
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4687
                    ArrayList<String> graphemes = new ArrayList<>();
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4688
                    StringBuilder buf = new StringBuilder();
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4689
                    int offBk = 0;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4690
                    for (String str : strs) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4691
                        if (str.length() == 0)  // first empty str
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4692
                            continue;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4693
                        int cp = Integer.parseInt(str, 16);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4694
                        src.appendCodePoint(cp);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4695
                        buf.appendCodePoint(cp);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4696
                        offBk += (str.length() + 1);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4697
                        if (ln.charAt(offBk) == '\u00f7') {    // DIV
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4698
                            graphemes.add(buf.toString());
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4699
                            buf = new StringBuilder();
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4700
                        }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4701
                    }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4702
                    Pattern p = Pattern.compile("\\X");
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4703
                    Matcher m = p.matcher(src.toString());
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4704
                    Scanner s = new Scanner(src.toString()).useDelimiter("\\b{g}");
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4705
                    for (String g : graphemes) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4706
                        // System.out.printf("     grapheme:=[%s]%n", g);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4707
                        // (1) test \\X directly
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4708
                        if (!m.find() || !m.group().equals(g)) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4709
                            System.out.println("Failed \\X [" + ln + "] : " + g);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4710
                            failCount++;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4711
                        }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4712
                        // (2) test \\b{g} + \\X  via Scanner
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4713
                        boolean hasNext = s.hasNext(p);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4714
                        // if (!s.hasNext() || !s.next().equals(next)) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4715
                        if (!s.hasNext(p) || !s.next(p).equals(g)) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4716
                            System.out.println("Failed b{g} [" + ln + "] : " + g);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4717
                            failCount++;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4718
                        }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4719
                    }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4720
                });
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4721
        // some sanity checks
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4722
        if (!Pattern.compile("\\X{10}").matcher("abcdefghij").matches() ||
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4723
            !Pattern.compile("\\b{g}(?:\\X\\b{g}){5}\\b{g}").matcher("abcde").matches() ||
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4724
            !Pattern.compile("(?:\\X\\b{g}){2}").matcher("\ud800\udc00\ud801\udc02").matches())
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4725
            failCount++;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4726
        // make sure "\b{n}" still works
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4727
        if (!Pattern.compile("\\b{1}hello\\b{1} \\b{1}world\\b{1}").matcher("hello world").matches())
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4728
            failCount++;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4729
        report("Unicode extended grapheme cluster");
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4730
    }
37882
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4731
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4732
    // hangup/timeout if go into exponential backtracking
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4733
    private static void expoBacktracking() throws Exception {
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4734
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4735
        Object[][] patternMatchers = {
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4736
            // 6328855
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4737
            { "(.*\n*)*",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4738
              "this little fine string lets\r\njava.lang.String.matches\r\ncrash\r\n(We don't know why but adding \r* to the regex makes it work again)",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4739
              false },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4740
            // 6192895
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4741
            { " *([a-zA-Z0-9/\\-\\?:\\(\\)\\.,'\\+\\{\\}]+ *)+",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4742
              "Hello World this is a test this is a test this is a test A",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4743
              true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4744
            { " *([a-zA-Z0-9/\\-\\?:\\(\\)\\.,'\\+\\{\\}]+ *)+",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4745
              "Hello World this is a test this is a test this is a test \u4e00 ",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4746
              false },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4747
            { " *([a-z0-9]+ *)+",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4748
              "hello world this is a test this is a test this is a test A",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4749
              false },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4750
            // 4771934 [FIXED] #5013651?
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4751
            { "^(\\w+([\\.-]?\\w+)*@\\w+([\\.-]?\\w+)*(\\.\\w{2,4})+[,;]?)+$",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4752
              "abc@efg.abc,efg@abc.abc,abc@xyz.mno;abc@sdfsd.com",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4753
              true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4754
            // 4866249 [FIXED]
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4755
            { "<\\s*" + "(meta|META)" + "(\\s|[^>])+" + "(CHARSET|charset)=" + "(\\s|[^>])+>",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4756
              "<META http-equiv=\"Content-Type\" content=\"text/html; charset=ISO-8859-5\">",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4757
              true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4758
            { "^(\\w+([\\.-]?\\w+)*@\\w+([\\.-]?\\w+)*(\\.\\w{2,4})+[,;]?)+$",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4759
              "abc@efg.abc,efg@abc.abc,abc@xyz.mno;sdfsd.com",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4760
              false },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4761
            // 6345469
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4762
            { "((<[^>]+>)?(((\\s)?)*(\\&nbsp;)?)*((\\s)?)*)+",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4763
              "&nbsp;&nbsp; < br/> &nbsp; < / p> <p> <html> <adfasfdasdf>&nbsp; </p>",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4764
              true }, // --> matched
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4765
            { "((<[^>]+>)?(((\\s)?)*(\\&nbsp;)?)*((\\s)?)*)+",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4766
              "&nbsp;&nbsp; < br/> &nbsp; < / p> <p> <html> <adfasfdasdf>&nbsp; p </p>",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4767
              false },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4768
            // 5026912
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4769
            { "^\\s*" + "(\\w|\\d|[\\xC0-\\xFF]|/)+" + "\\s+|$",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4770
              "156580451111112225588087755221111111566969655555555",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4771
              false},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4772
            // 6988218
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4773
            { "^([+-]?((0[xX](\\p{XDigit}+))|(((\\p{Digit}+)(\\.)?((\\p{Digit}+)?)([eE][+-]?(\\p{Digit}+))?)|(\\.((\\p{Digit}+))([eE][+-]?(\\p{Digit}+))?)))|[n|N]?'([^']*(?:'')*[^']*)*')",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4774
              "'%)) order by ANGEBOT.ID",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4775
              false},    // find
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4776
            // 6693451
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4777
            { "^(\\s*foo\\s*)*$",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4778
              "foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4779
              true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4780
            { "^(\\s*foo\\s*)*$",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4781
              "foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo fo",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4782
              false
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4783
            },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4784
            // 7006761
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4785
            { "(([0-9A-Z]+)([_]?+)*)*", "FOOOOO_BAAAR_FOOOOOOOOO_BA_", true},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4786
            { "(([0-9A-Z]+)([_]?+)*)*", "FOOOOO_BAAAR_FOOOOOOOOO_BA_ ", false},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4787
            // 8140212
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4788
            { "(?<before>.*)\\{(?<reflection>\\w+):(?<innerMethod>\\w+(\\.?\\w+(\\(((?<args>(('[^']*')|((/|\\w)+))(,(('[^']*')|((/|\\w)+)))*))?\\))?)*)\\}(?<after>.*)",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4789
              "{CeGlobal:getSodCutoff.getGui.getAmqp.getSimpleModeEnabled()",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4790
              false
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4791
            },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4792
            { "^(a+)+$", "aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa", true},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4793
            { "^(a+)+$", "aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa!", false},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4794
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4795
            { "(x+)*y",  "xxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxy", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4796
            { "(x+)*y",  "xxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxz", false},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4797
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4798
            { "(x+x+)+y", "xxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxy", true},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4799
            { "(x+x+)+y", "xxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxz", false},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4800
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4801
            { "(([0-9A-Z]+)([_]?+)*)*", "--------------------------------------", false},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4802
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4803
            /* not fixed
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4804
            //8132141   --->    second level exponential backtracking
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4805
            { "(h|h|ih(((i|a|c|c|a|i|i|j|b|a|i|b|a|a|j))+h)ahbfhba|c|i)*",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4806
              "hchcchicihcchciiicichhcichcihcchiihichiciiiihhcchicchhcihchcihiihciichhccciccichcichiihcchcihhicchcciicchcccihiiihhihihihichicihhcciccchihhhcchichchciihiicihciihcccciciccicciiiiiiiiicihhhiiiihchccchchhhhiiihchihcccchhhiiiiiiiicicichicihcciciihichhhhchihciiihhiccccccciciihhichiccchhicchicihihccichicciihcichccihhiciccccccccichhhhihihhcchchihihiihhihihihicichihiiiihhhhihhhchhichiicihhiiiiihchccccchichci" },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4807
            */
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4808
        };
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4809
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4810
        for (Object[] pm : patternMatchers) {
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4811
            String p = (String)pm[0];
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4812
            String s = (String)pm[1];
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4813
            boolean r = (Boolean)pm[2];
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4814
            if (r != Pattern.compile(p).matcher(s).matches()) {
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4815
                failCount++;
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4816
            }
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4817
        }
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4818
    }
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4819
}