test/jdk/java/util/regex/RegExTest.java
author sherman
Fri, 12 Jan 2018 14:05:42 -0800
changeset 48491 7f11a1699ef6
parent 47216 71c04702a3d5
child 48853 84b4ffbba8b0
permissions -rw-r--r--
8194667: Regex: Serialization doesn't work with match flags Reviewed-by: rriggs
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
     1
/*
48491
7f11a1699ef6 8194667: Regex: Serialization doesn't work with match flags
sherman
parents: 47216
diff changeset
     2
 * Copyright (c) 1999, 2018, Oracle and/or its affiliates. All rights reserved.
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
     3
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
     4
 *
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
     5
 * This code is free software; you can redistribute it and/or modify it
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
     6
 * under the terms of the GNU General Public License version 2 only, as
21596
0e3a39f29dbc 8027696: Incorrect copyright header in the tests
serb
parents: 19604
diff changeset
     7
 * published by the Free Software Foundation.
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
     8
 *
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
     9
 * This code is distributed in the hope that it will be useful, but WITHOUT
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    10
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    11
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    12
 * version 2 for more details (a copy is included in the LICENSE file that
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    13
 * accompanied this code).
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    14
 *
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    15
 * You should have received a copy of the GNU General Public License version
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    16
 * 2 along with this work; if not, write to the Free Software Foundation,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    17
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    18
 *
5506
202f599c92aa 6943119: Rebrand source copyright notices
ohair
parents: 5295
diff changeset
    19
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
202f599c92aa 6943119: Rebrand source copyright notices
ohair
parents: 5295
diff changeset
    20
 * or visit www.oracle.com if you need additional information or have any
202f599c92aa 6943119: Rebrand source copyright notices
ohair
parents: 5295
diff changeset
    21
 * questions.
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    22
 */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    23
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    24
/**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    25
 * @test
30370
984bf40cdc67 8079419: Update to RegEx test to use random number library
darcy
parents: 30046
diff changeset
    26
 * @summary tests RegExp framework (use -Dseed=X to set PRNG seed)
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    27
 * @author Mike McCloskey
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    28
 * @bug 4481568 4482696 4495089 4504687 4527731 4599621 4631553 4619345
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    29
 * 4630911 4672616 4711773 4727935 4750573 4792284 4803197 4757029 4808962
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    30
 * 4872664 4803179 4892980 4900747 4945394 4938995 4979006 4994840 4997476
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    31
 * 5013885 5003322 4988891 5098443 5110268 6173522 4829857 5027748 6376940
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    32
 * 6358731 6178785 6284152 6231989 6497148 6486934 6233084 6504326 6635133
11287
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
    33
 * 6350801 6676425 6878475 6919132 6931676 6948903 6990617 7014645 7039066
21668
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
    34
 * 7067045 7014640 7189363 8007395 8013252 8013254 8012646 8023647 6559590
35783
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
    35
 * 8027645 8035076 8039124 8035975 8074678 6854417 8143854 8147531 7071819
45888
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
    36
 * 8151481 4867170 7080302 6728861 6995635 6736245 4916384 6328855 6192895
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
    37
 * 6345469 6988218 6693451 7006761 8140212 8143282 8158482 8176029 8184706
48491
7f11a1699ef6 8194667: Regex: Serialization doesn't work with match flags
sherman
parents: 47216
diff changeset
    38
 * 8194667
37882
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
    39
 *
45288
58be10a068c2 8180805: move RandomFactory to the top level testlibrary
iignatyev
parents: 44122
diff changeset
    40
 * @library /test/lib
45466
faf1c55d2046 8181759: add explicit @build actions for jdk.test.lib classes in all :tier1 tests
iignatyev
parents: 45288
diff changeset
    41
 * @build jdk.test.lib.RandomFactory
30370
984bf40cdc67 8079419: Update to RegEx test to use random number library
darcy
parents: 30046
diff changeset
    42
 * @run main RegExTest
31645
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
    43
 * @key randomness
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    44
 */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    45
29243
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
    46
import java.util.function.Function;
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    47
import java.util.regex.*;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    48
import java.util.Random;
35783
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
    49
import java.util.Scanner;
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    50
import java.io.*;
35783
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
    51
import java.nio.file.*;
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    52
import java.util.*;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    53
import java.nio.CharBuffer;
17447
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
    54
import java.util.function.Predicate;
45288
58be10a068c2 8180805: move RandomFactory to the top level testlibrary
iignatyev
parents: 44122
diff changeset
    55
import jdk.test.lib.RandomFactory;
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    56
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    57
/**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    58
 * This is a test class created to check the operation of
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    59
 * the Pattern and Matcher classes.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    60
 */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    61
public class RegExTest {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    62
30370
984bf40cdc67 8079419: Update to RegEx test to use random number library
darcy
parents: 30046
diff changeset
    63
    private static Random generator = RandomFactory.getRandom();
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    64
    private static boolean failure = false;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    65
    private static int failCount = 0;
11287
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
    66
    private static String firstFailure = null;
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    67
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    68
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    69
     * Main to interpret arguments and run several tests.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    70
     *
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    71
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    72
    public static void main(String[] args) throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    73
        // Most of the tests are in a file
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    74
        processFile("TestCases.txt");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    75
        //processFile("PerlCases.txt");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    76
        processFile("BMPTestCases.txt");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    77
        processFile("SupplementaryTestCases.txt");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    78
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    79
        // These test many randomly generated char patterns
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    80
        bm();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    81
        slice();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    82
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    83
        // These are hard to put into the file
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    84
        escapes();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    85
        blankInput();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    86
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    87
        // Substitition tests on randomly generated sequences
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    88
        globalSubstitute();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    89
        stringbufferSubstitute();
23734
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
    90
        stringbuilderSubstitute();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
    91
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    92
        substitutionBasher();
23734
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
    93
        substitutionBasher2();
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    94
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    95
        // Canonical Equivalence
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    96
        ceTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    97
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    98
        // Anchors
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
    99
        anchorTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   100
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   101
        // boolean match calls
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   102
        matchesTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   103
        lookingAtTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   104
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   105
        // Pattern API
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   106
        patternMatchesTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   107
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   108
        // Misc
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   109
        lookbehindTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   110
        nullArgumentTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   111
        backRefTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   112
        groupCaptureTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   113
        caretTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   114
        charClassTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   115
        emptyPatternTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   116
        findIntTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   117
        group0Test();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   118
        longPatternTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   119
        octalTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   120
        ampersandTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   121
        negationTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   122
        splitTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   123
        appendTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   124
        caseFoldingTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   125
        commentsTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   126
        unixLinesTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   127
        replaceFirstTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   128
        gTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   129
        zTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   130
        serializeTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   131
        reluctantRepetitionTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   132
        multilineDollarTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   133
        dollarAtEndTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   134
        caretBetweenTerminatorsTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   135
        // This RFE rejected in Tiger numOccurrencesTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   136
        javaCharClassTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   137
        nonCaptureRepetitionTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   138
        notCapturedGroupCurlyMatchTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   139
        escapedSegmentTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   140
        literalPatternTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   141
        literalReplacementTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   142
        regionTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   143
        toStringTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   144
        negatedCharClassTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   145
        findFromTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   146
        boundsTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   147
        unicodeWordBoundsTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   148
        caretAtEndTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   149
        wordSearchTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   150
        hitEndTest();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   151
        toMatchResultTest();
29503
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   152
        toMatchResultTest2();
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   153
        surrogatesInClassTest();
11287
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   154
        removeQEQuotingTest();
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   155
        namedGroupCaptureTest();
4820
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
   156
        nonBmpClassComplementTest();
5610
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
   157
        unicodePropertiesTest();
8173
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
   158
        unicodeHexNotationTest();
9536
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
   159
        unicodeClassesTest();
35783
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
   160
        unicodeCharacterNameTest();
12675
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
   161
        horizontalAndVerticalWSTest();
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
   162
        linebreakTest();
13554
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
   163
        branchTest();
17183
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
   164
        groupCurlyNotFoundSuppTest();
19604
f96e3aef2081 8023647: "abc1c".matches("(\\w)+1\\1")) returns false
sherman
parents: 17447
diff changeset
   165
        groupCurlyBackoffTest();
17447
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
   166
        patternAsPredicate();
25523
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
   167
        invalidFlags();
38777
826eb7091523 8158482: regex UNICODE_CHARACTER_CLASS flag cannot be disabled with an embedded flag expression
sherman
parents: 38450
diff changeset
   168
        embeddedFlags();
35783
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
   169
        grapheme();
37882
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
   170
        expoBacktracking();
21668
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
   171
11287
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   172
        if (failure) {
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   173
            throw new
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   174
                RuntimeException("RegExTest failed, 1st failure: " +
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   175
                                 firstFailure);
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   176
        } else {
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   177
            System.err.println("OKAY: All tests passed.");
11287
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   178
        }
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   179
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   180
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   181
    // Utility functions
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   182
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   183
    private static String getRandomAlphaString(int length) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   184
        StringBuffer buf = new StringBuffer(length);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   185
        for (int i=0; i<length; i++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   186
            char randChar = (char)(97 + generator.nextInt(26));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   187
            buf.append(randChar);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   188
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   189
        return buf.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   190
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   191
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   192
    private static void check(Matcher m, String expected) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   193
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   194
        if (!m.group().equals(expected))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   195
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   196
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   197
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   198
    private static void check(Matcher m, String result, boolean expected) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   199
        m.find();
8173
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
   200
        if (m.group().equals(result) != expected)
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
   201
            failCount++;
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   202
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   203
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   204
    private static void check(Pattern p, String s, boolean expected) {
8173
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
   205
        if (p.matcher(s).find() != expected)
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
   206
            failCount++;
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
   207
    }
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
   208
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
   209
    private static void check(String p, String s, boolean expected) {
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
   210
        Matcher matcher = Pattern.compile(p).matcher(s);
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
   211
        if (matcher.find() != expected)
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
   212
            failCount++;
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   213
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   214
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   215
    private static void check(String p, char c, boolean expected) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   216
        String propertyPattern = expected ? "\\p" + p : "\\P" + p;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   217
        Pattern pattern = Pattern.compile(propertyPattern);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   218
        char[] ca = new char[1]; ca[0] = c;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   219
        Matcher matcher = pattern.matcher(new String(ca));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   220
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   221
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   222
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   223
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   224
    private static void check(String p, int codePoint, boolean expected) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   225
        String propertyPattern = expected ? "\\p" + p : "\\P" + p;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   226
        Pattern pattern = Pattern.compile(propertyPattern);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   227
        char[] ca = Character.toChars(codePoint);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   228
        Matcher matcher = pattern.matcher(new String(ca));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   229
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   230
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   231
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   232
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   233
    private static void check(String p, int flag, String input, String s,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   234
                              boolean expected)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   235
    {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   236
        Pattern pattern = Pattern.compile(p, flag);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   237
        Matcher matcher = pattern.matcher(input);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   238
        if (expected)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   239
            check(matcher, s, expected);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   240
        else
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   241
            check(pattern, input, false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   242
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   243
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   244
    private static void report(String testName) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   245
        int spacesToAdd = 30 - testName.length();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   246
        StringBuffer paddedNameBuffer = new StringBuffer(testName);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   247
        for (int i=0; i<spacesToAdd; i++)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   248
            paddedNameBuffer.append(" ");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   249
        String paddedName = paddedNameBuffer.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   250
        System.err.println(paddedName + ": " +
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   251
                           (failCount==0 ? "Passed":"Failed("+failCount+")"));
11287
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   252
        if (failCount > 0) {
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   253
            failure = true;
11287
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   254
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   255
            if (firstFailure == null) {
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   256
                firstFailure = testName;
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   257
            }
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   258
        }
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   259
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   260
        failCount = 0;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   261
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   262
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   263
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   264
     * Converts ASCII alphabet characters [A-Za-z] in the given 's' to
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   265
     * supplementary characters. This method does NOT fully take care
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   266
     * of the regex syntax.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   267
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   268
    private static String toSupplementaries(String s) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   269
        int length = s.length();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   270
        StringBuffer sb = new StringBuffer(length * 2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   271
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   272
        for (int i = 0; i < length; ) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   273
            char c = s.charAt(i++);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   274
            if (c == '\\') {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   275
                sb.append(c);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   276
                if (i < length) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   277
                    c = s.charAt(i++);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   278
                    sb.append(c);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   279
                    if (c == 'u') {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   280
                        // assume no syntax error
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   281
                        sb.append(s.charAt(i++));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   282
                        sb.append(s.charAt(i++));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   283
                        sb.append(s.charAt(i++));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   284
                        sb.append(s.charAt(i++));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   285
                    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   286
                }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   287
            } else if ((c >= 'A' && c <= 'Z') || (c >= 'a' && c <= 'z')) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   288
                sb.append('\ud800').append((char)('\udc00'+c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   289
            } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   290
                sb.append(c);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   291
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   292
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   293
        return sb.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   294
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   295
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   296
    // Regular expression tests
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   297
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   298
    // This is for bug 6178785
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   299
    // Test if an expected NPE gets thrown when passing in a null argument
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   300
    private static boolean check(Runnable test) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   301
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   302
            test.run();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   303
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   304
            return false;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   305
        } catch (NullPointerException npe) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   306
            return true;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   307
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   308
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   309
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   310
    private static void nullArgumentTest() {
29243
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   311
        check(() -> Pattern.compile(null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   312
        check(() -> Pattern.matches(null, null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   313
        check(() -> Pattern.matches("xyz", null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   314
        check(() -> Pattern.quote(null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   315
        check(() -> Pattern.compile("xyz").split(null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   316
        check(() -> Pattern.compile("xyz").matcher(null));
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   317
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   318
        final Matcher m = Pattern.compile("xyz").matcher("xyz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   319
        m.matches();
29243
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   320
        check(() -> m.appendTail((StringBuffer) null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   321
        check(() -> m.appendTail((StringBuilder)null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   322
        check(() -> m.replaceAll((String) null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   323
        check(() -> m.replaceAll((Function<MatchResult, String>)null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   324
        check(() -> m.replaceFirst((String)null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   325
        check(() -> m.replaceFirst((Function<MatchResult, String>) null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   326
        check(() -> m.appendReplacement((StringBuffer)null, null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   327
        check(() -> m.appendReplacement((StringBuilder)null, null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   328
        check(() -> m.reset(null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   329
        check(() -> Matcher.quoteReplacement(null));
80ea8d3d39d0 8071479: Stream and lambdafication improvements to j.u.regex.Matcher
psandoz
parents: 25523
diff changeset
   330
        //check(() -> m.usePattern(null));
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   331
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   332
        report("Null Argument");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   333
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   334
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   335
    // This is for bug6635133
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   336
    // Test if surrogate pair in Unicode escapes can be handled correctly.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   337
    private static void surrogatesInClassTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   338
        Pattern pattern = Pattern.compile("[\\ud834\\udd21-\\ud834\\udd24]");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   339
        Matcher matcher = pattern.matcher("\ud834\udd22");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   340
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   341
            failCount++;
11287
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   342
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   343
        report("Surrogate pair in Unicode escape");
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   344
    }
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   345
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   346
    // This is for bug6990617
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   347
    // Test if Pattern.RemoveQEQuoting works correctly if the octal unicode
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   348
    // char encoding is only 2 or 3 digits instead of 4 and the first quoted
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   349
    // char is an octal digit.
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   350
    private static void removeQEQuotingTest() throws Exception {
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   351
        Pattern pattern =
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   352
            Pattern.compile("\\011\\Q1sometext\\E\\011\\Q2sometext\\E");
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   353
        Matcher matcher = pattern.matcher("\t1sometext\t2sometext");
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   354
        if (!matcher.find())
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   355
            failCount++;
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   356
3db172a5433c 6990617: Regular expression doesn't match if unicode character next to a digit.
sherman
parents: 9536
diff changeset
   357
        report("Remove Q/E Quoting");
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   358
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   359
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   360
    // This is for bug 4988891
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   361
    // Test toMatchResult to see that it is a copy of the Matcher
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   362
    // that is not affected by subsequent operations on the original
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   363
    private static void toMatchResultTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   364
        Pattern pattern = Pattern.compile("squid");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   365
        Matcher matcher = pattern.matcher(
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   366
            "agiantsquidofdestinyasmallsquidoffate");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   367
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   368
        int matcherStart1 = matcher.start();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   369
        MatchResult mr = matcher.toMatchResult();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   370
        if (mr == matcher)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   371
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   372
        int resultStart1 = mr.start();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   373
        if (matcherStart1 != resultStart1)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   374
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   375
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   376
        int matcherStart2 = matcher.start();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   377
        int resultStart2 = mr.start();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   378
        if (matcherStart2 == resultStart2)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   379
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   380
        if (resultStart1 != resultStart2)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   381
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   382
        MatchResult mr2 = matcher.toMatchResult();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   383
        if (mr == mr2)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   384
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   385
        if (mr2.start() != matcherStart2)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   386
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   387
        report("toMatchResult is a copy");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   388
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   389
29503
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   390
    private static void checkExpectedISE(Runnable test) {
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   391
        try {
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   392
            test.run();
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   393
            failCount++;
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   394
        } catch (IllegalStateException x) {
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   395
        } catch (IndexOutOfBoundsException xx) {
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   396
            failCount++;
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   397
        }
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   398
    }
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   399
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   400
    private static void checkExpectedIOOE(Runnable test) {
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   401
        try {
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   402
            test.run();
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   403
            failCount++;
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   404
        } catch (IndexOutOfBoundsException x) {}
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   405
    }
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   406
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   407
    // This is for bug 8074678
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   408
    // Test the result of toMatchResult throws ISE if no match is availble
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   409
    private static void toMatchResultTest2() throws Exception {
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   410
        Matcher matcher = Pattern.compile("nomatch").matcher("hello world");
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   411
        matcher.find();
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   412
        MatchResult mr = matcher.toMatchResult();
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   413
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   414
        checkExpectedISE(() -> mr.start());
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   415
        checkExpectedISE(() -> mr.start(2));
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   416
        checkExpectedISE(() -> mr.end());
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   417
        checkExpectedISE(() -> mr.end(2));
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   418
        checkExpectedISE(() -> mr.group());
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   419
        checkExpectedISE(() -> mr.group(2));
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   420
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   421
        matcher = Pattern.compile("(match)").matcher("there is a match");
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   422
        matcher.find();
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   423
        MatchResult mr2 = matcher.toMatchResult();
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   424
        checkExpectedIOOE(() -> mr2.start(2));
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   425
        checkExpectedIOOE(() -> mr2.end(2));
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   426
        checkExpectedIOOE(() -> mr2.group(2));
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   427
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   428
        report("toMatchResult2 appropriate exceptions");
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   429
    }
95318f222149 8074678: JCK test java_util/regex/MatchResult/index.html starts failing after JDK-8071479
sherman
parents: 29243
diff changeset
   430
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   431
    // This is for bug 5013885
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   432
    // Must test a slice to see if it reports hitEnd correctly
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   433
    private static void hitEndTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   434
        // Basic test of Slice node
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   435
        Pattern p = Pattern.compile("^squidattack");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   436
        Matcher m = p.matcher("squack");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   437
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   438
        if (m.hitEnd())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   439
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   440
        m.reset("squid");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   441
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   442
        if (!m.hitEnd())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   443
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   444
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   445
        // Test Slice, SliceA and SliceU nodes
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   446
        for (int i=0; i<3; i++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   447
            int flags = 0;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   448
            if (i==1) flags = Pattern.CASE_INSENSITIVE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   449
            if (i==2) flags = Pattern.UNICODE_CASE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   450
            p = Pattern.compile("^abc", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   451
            m = p.matcher("ad");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   452
            m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   453
            if (m.hitEnd())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   454
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   455
            m.reset("ab");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   456
            m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   457
            if (!m.hitEnd())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   458
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   459
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   460
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   461
        // Test Boyer-Moore node
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   462
        p = Pattern.compile("catattack");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   463
        m = p.matcher("attack");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   464
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   465
        if (!m.hitEnd())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   466
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   467
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   468
        p = Pattern.compile("catattack");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   469
        m = p.matcher("attackattackattackcatatta");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   470
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   471
        if (!m.hitEnd())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   472
            failCount++;
45888
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
   473
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
   474
        // 8184706: Matching u+0d at EOL against \R should hit-end
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
   475
        p = Pattern.compile("...\\R");
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
   476
        m = p.matcher("cat" + (char)0x0a);
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
   477
        m.find();
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
   478
        if (m.hitEnd())
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
   479
            failCount++;
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
   480
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
   481
        m = p.matcher("cat" + (char)0x0d);
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
   482
        m.find();
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
   483
        if (!m.hitEnd())
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
   484
            failCount++;
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
   485
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
   486
        m = p.matcher("cat" + (char)0x0d + (char)0x0a);
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
   487
        m.find();
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
   488
        if (m.hitEnd())
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
   489
            failCount++;
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
   490
ae448cf92e00 8184706: Matcher doesn't indicate hitEnd after matching \u0D with \R at EOL
igerasim
parents: 45466
diff changeset
   491
        report("hitEnd");
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   492
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   493
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   494
    // This is for bug 4997476
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   495
    // It is weird code submitted by customer demonstrating a regression
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   496
    private static void wordSearchTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   497
        String testString = new String("word1 word2 word3");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   498
        Pattern p = Pattern.compile("\\b");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   499
        Matcher m = p.matcher(testString);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   500
        int position = 0;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   501
        int start = 0;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   502
        while (m.find(position)) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   503
            start = m.start();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   504
            if (start == testString.length())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   505
                break;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   506
            if (m.find(start+1)) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   507
                position = m.start();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   508
            } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   509
                position = testString.length();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   510
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   511
            if (testString.substring(start, position).equals(" "))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   512
                continue;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   513
            if (!testString.substring(start, position-1).startsWith("word"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   514
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   515
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   516
        report("Customer word search");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   517
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   518
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   519
    // This is for bug 4994840
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   520
    private static void caretAtEndTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   521
        // Problem only occurs with multiline patterns
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   522
        // containing a beginning-of-line caret "^" followed
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   523
        // by an expression that also matches the empty string.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   524
        Pattern pattern = Pattern.compile("^x?", Pattern.MULTILINE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   525
        Matcher matcher = pattern.matcher("\r");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   526
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   527
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   528
        report("Caret at end");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   529
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   530
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   531
    // This test is for 4979006
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   532
    // Check to see if word boundary construct properly handles unicode
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   533
    // non spacing marks
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   534
    private static void unicodeWordBoundsTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   535
        String spaces = "  ";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   536
        String wordChar = "a";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   537
        String nsm = "\u030a";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   538
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   539
        assert (Character.getType('\u030a') == Character.NON_SPACING_MARK);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   540
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   541
        Pattern pattern = Pattern.compile("\\b");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   542
        Matcher matcher = pattern.matcher("");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   543
        // S=other B=word character N=non spacing mark .=word boundary
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   544
        // SS.BB.SS
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   545
        String input = spaces + wordChar + wordChar + spaces;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   546
        twoFindIndexes(input, matcher, 2, 4);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   547
        // SS.BBN.SS
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   548
        input = spaces + wordChar +wordChar + nsm + spaces;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   549
        twoFindIndexes(input, matcher, 2, 5);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   550
        // SS.BN.SS
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   551
        input = spaces + wordChar + nsm + spaces;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   552
        twoFindIndexes(input, matcher, 2, 4);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   553
        // SS.BNN.SS
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   554
        input = spaces + wordChar + nsm + nsm + spaces;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   555
        twoFindIndexes(input, matcher, 2, 5);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   556
        // SSN.BB.SS
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   557
        input = spaces + nsm + wordChar + wordChar + spaces;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   558
        twoFindIndexes(input, matcher, 3, 5);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   559
        // SS.BNB.SS
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   560
        input = spaces + wordChar + nsm + wordChar + spaces;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   561
        twoFindIndexes(input, matcher, 2, 5);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   562
        // SSNNSS
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   563
        input = spaces + nsm + nsm + spaces;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   564
        matcher.reset(input);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   565
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   566
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   567
        // SSN.BBN.SS
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   568
        input = spaces + nsm + wordChar + wordChar + nsm + spaces;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   569
        twoFindIndexes(input, matcher, 3, 6);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   570
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   571
        report("Unicode word boundary");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   572
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   573
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   574
    private static void twoFindIndexes(String input, Matcher matcher, int a,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   575
                                       int b) throws Exception
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   576
    {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   577
        matcher.reset(input);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   578
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   579
        if (matcher.start() != a)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   580
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   581
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   582
        if (matcher.start() != b)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   583
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   584
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   585
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   586
    // This test is for 6284152
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   587
    static void check(String regex, String input, String[] expected) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   588
        List<String> result = new ArrayList<String>();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   589
        Pattern p = Pattern.compile(regex);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   590
        Matcher m = p.matcher(input);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   591
        while (m.find()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   592
            result.add(m.group());
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   593
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   594
        if (!Arrays.asList(expected).equals(result))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   595
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   596
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   597
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   598
    private static void lookbehindTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   599
        //Positive
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   600
        check("(?<=%.{0,5})foo\\d",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   601
              "%foo1\n%bar foo2\n%bar  foo3\n%blahblah foo4\nfoo5",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   602
              new String[]{"foo1", "foo2", "foo3"});
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   603
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   604
        //boundary at end of the lookbehind sub-regex should work consistently
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   605
        //with the boundary just after the lookbehind sub-regex
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   606
        check("(?<=.*\\b)foo", "abcd foo", new String[]{"foo"});
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   607
        check("(?<=.*)\\bfoo", "abcd foo", new String[]{"foo"});
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   608
        check("(?<!abc )\\bfoo", "abc foo", new String[0]);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   609
        check("(?<!abc \\b)foo", "abc foo", new String[0]);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   610
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   611
        //Negative
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   612
        check("(?<!%.{0,5})foo\\d",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   613
              "%foo1\n%bar foo2\n%bar  foo3\n%blahblah foo4\nfoo5",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   614
              new String[] {"foo4", "foo5"});
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   615
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   616
        //Positive greedy
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   617
        check("(?<=%b{1,4})foo", "%bbbbfoo", new String[] {"foo"});
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   618
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   619
        //Positive reluctant
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   620
        check("(?<=%b{1,4}?)foo", "%bbbbfoo", new String[] {"foo"});
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   621
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   622
        //supplementary
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   623
        check("(?<=%b{1,4})fo\ud800\udc00o", "%bbbbfo\ud800\udc00o",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   624
              new String[] {"fo\ud800\udc00o"});
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   625
        check("(?<=%b{1,4}?)fo\ud800\udc00o", "%bbbbfo\ud800\udc00o",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   626
              new String[] {"fo\ud800\udc00o"});
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   627
        check("(?<!%b{1,4})fo\ud800\udc00o", "%afo\ud800\udc00o",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   628
              new String[] {"fo\ud800\udc00o"});
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   629
        check("(?<!%b{1,4}?)fo\ud800\udc00o", "%afo\ud800\udc00o",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   630
              new String[] {"fo\ud800\udc00o"});
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   631
        report("Lookbehind");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   632
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   633
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   634
    // This test is for 4938995
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   635
    // Check to see if weak region boundaries are transparent to
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   636
    // lookahead and lookbehind constructs
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   637
    private static void boundsTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   638
        String fullMessage = "catdogcat";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   639
        Pattern pattern = Pattern.compile("(?<=cat)dog(?=cat)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   640
        Matcher matcher = pattern.matcher("catdogca");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   641
        matcher.useTransparentBounds(true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   642
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   643
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   644
        matcher.reset("atdogcat");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   645
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   646
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   647
        matcher.reset(fullMessage);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   648
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   649
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   650
        matcher.reset(fullMessage);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   651
        matcher.region(0,9);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   652
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   653
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   654
        matcher.reset(fullMessage);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   655
        matcher.region(0,6);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   656
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   657
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   658
        matcher.reset(fullMessage);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   659
        matcher.region(3,6);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   660
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   661
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   662
        matcher.useTransparentBounds(false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   663
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   664
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   665
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   666
        // Negative lookahead/lookbehind
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   667
        pattern = Pattern.compile("(?<!cat)dog(?!cat)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   668
        matcher = pattern.matcher("dogcat");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   669
        matcher.useTransparentBounds(true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   670
        matcher.region(0,3);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   671
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   672
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   673
        matcher.reset("catdog");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   674
        matcher.region(3,6);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   675
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   676
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   677
        matcher.useTransparentBounds(false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   678
        matcher.reset("dogcat");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   679
        matcher.region(0,3);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   680
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   681
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   682
        matcher.reset("catdog");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   683
        matcher.region(3,6);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   684
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   685
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   686
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   687
        report("Region bounds transparency");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   688
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   689
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   690
    // This test is for 4945394
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   691
    private static void findFromTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   692
        String message = "This is 40 $0 message.";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   693
        Pattern pat = Pattern.compile("\\$0");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   694
        Matcher match = pat.matcher(message);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   695
        if (!match.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   696
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   697
        if (match.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   698
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   699
        if (match.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   700
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   701
        report("Check for alternating find");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   702
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   703
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   704
    // This test is for 4872664 and 4892980
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   705
    private static void negatedCharClassTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   706
        Pattern pattern = Pattern.compile("[^>]");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   707
        Matcher matcher = pattern.matcher("\u203A");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   708
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   709
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   710
        pattern = Pattern.compile("[^fr]");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   711
        matcher = pattern.matcher("a");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   712
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   713
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   714
        matcher.reset("\u203A");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   715
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   716
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   717
        String s = "for";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   718
        String result[] = s.split("[^fr]");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   719
        if (!result[0].equals("f"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   720
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   721
        if (!result[1].equals("r"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   722
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   723
        s = "f\u203Ar";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   724
        result = s.split("[^fr]");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   725
        if (!result[0].equals("f"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   726
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   727
        if (!result[1].equals("r"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   728
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   729
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   730
        // Test adding to bits, subtracting a node, then adding to bits again
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   731
        pattern = Pattern.compile("[^f\u203Ar]");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   732
        matcher = pattern.matcher("a");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   733
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   734
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   735
        matcher.reset("f");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   736
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   737
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   738
        matcher.reset("\u203A");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   739
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   740
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   741
        matcher.reset("r");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   742
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   743
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   744
        matcher.reset("\u203B");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   745
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   746
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   747
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   748
        // Test subtracting a node, adding to bits, subtracting again
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   749
        pattern = Pattern.compile("[^\u203Ar\u203B]");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   750
        matcher = pattern.matcher("a");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   751
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   752
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   753
        matcher.reset("\u203A");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   754
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   755
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   756
        matcher.reset("r");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   757
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   758
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   759
        matcher.reset("\u203B");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   760
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   761
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   762
        matcher.reset("\u203C");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   763
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   764
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   765
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   766
        report("Negated Character Class");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   767
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   768
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   769
    // This test is for 4628291
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   770
    private static void toStringTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   771
        Pattern pattern = Pattern.compile("b+");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   772
        if (pattern.toString() != "b+")
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   773
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   774
        Matcher matcher = pattern.matcher("aaabbbccc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   775
        String matcherString = matcher.toString(); // unspecified
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   776
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   777
        matcherString = matcher.toString(); // unspecified
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   778
        matcher.region(0,3);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   779
        matcherString = matcher.toString(); // unspecified
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   780
        matcher.reset();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   781
        matcherString = matcher.toString(); // unspecified
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   782
        report("toString");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   783
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   784
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   785
    // This test is for 4808962
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   786
    private static void literalPatternTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   787
        int flags = Pattern.LITERAL;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   788
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   789
        Pattern pattern = Pattern.compile("abc\\t$^", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   790
        check(pattern, "abc\\t$^", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   791
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   792
        pattern = Pattern.compile(Pattern.quote("abc\\t$^"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   793
        check(pattern, "abc\\t$^", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   794
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   795
        pattern = Pattern.compile("\\Qa^$bcabc\\E", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   796
        check(pattern, "\\Qa^$bcabc\\E", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   797
        check(pattern, "a^$bcabc", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   798
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   799
        pattern = Pattern.compile("\\\\Q\\\\E");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   800
        check(pattern, "\\Q\\E", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   801
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   802
        pattern = Pattern.compile("\\Qabc\\Eefg\\\\Q\\\\Ehij");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   803
        check(pattern, "abcefg\\Q\\Ehij", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   804
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   805
        pattern = Pattern.compile("\\\\\\Q\\\\E");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   806
        check(pattern, "\\\\\\\\", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   807
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   808
        pattern = Pattern.compile(Pattern.quote("\\Qa^$bcabc\\E"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   809
        check(pattern, "\\Qa^$bcabc\\E", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   810
        check(pattern, "a^$bcabc", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   811
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   812
        pattern = Pattern.compile(Pattern.quote("\\Qabc\\Edef"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   813
        check(pattern, "\\Qabc\\Edef", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   814
        check(pattern, "abcdef", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   815
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   816
        pattern = Pattern.compile(Pattern.quote("abc\\Edef"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   817
        check(pattern, "abc\\Edef", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   818
        check(pattern, "abcdef", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   819
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   820
        pattern = Pattern.compile(Pattern.quote("\\E"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   821
        check(pattern, "\\E", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   822
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   823
        pattern = Pattern.compile("((((abc.+?:)", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   824
        check(pattern, "((((abc.+?:)", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   825
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   826
        flags |= Pattern.MULTILINE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   827
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   828
        pattern = Pattern.compile("^cat$", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   829
        check(pattern, "abc^cat$def", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   830
        check(pattern, "cat", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   831
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   832
        flags |= Pattern.CASE_INSENSITIVE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   833
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   834
        pattern = Pattern.compile("abcdef", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   835
        check(pattern, "ABCDEF", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   836
        check(pattern, "AbCdEf", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   837
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   838
        flags |= Pattern.DOTALL;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   839
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   840
        pattern = Pattern.compile("a...b", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   841
        check(pattern, "A...b", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   842
        check(pattern, "Axxxb", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   843
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   844
        flags |= Pattern.CANON_EQ;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   845
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   846
        Pattern p = Pattern.compile("testa\u030a", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   847
        check(pattern, "testa\u030a", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   848
        check(pattern, "test\u00e5", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   849
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   850
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   851
        flags = Pattern.LITERAL;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   852
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   853
        pattern = Pattern.compile(toSupplementaries("abc\\t$^"), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   854
        check(pattern, toSupplementaries("abc\\t$^"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   855
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   856
        pattern = Pattern.compile(Pattern.quote(toSupplementaries("abc\\t$^")));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   857
        check(pattern, toSupplementaries("abc\\t$^"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   858
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   859
        pattern = Pattern.compile(toSupplementaries("\\Qa^$bcabc\\E"), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   860
        check(pattern, toSupplementaries("\\Qa^$bcabc\\E"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   861
        check(pattern, toSupplementaries("a^$bcabc"), false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   862
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   863
        pattern = Pattern.compile(Pattern.quote(toSupplementaries("\\Qa^$bcabc\\E")));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   864
        check(pattern, toSupplementaries("\\Qa^$bcabc\\E"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   865
        check(pattern, toSupplementaries("a^$bcabc"), false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   866
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   867
        pattern = Pattern.compile(Pattern.quote(toSupplementaries("\\Qabc\\Edef")));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   868
        check(pattern, toSupplementaries("\\Qabc\\Edef"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   869
        check(pattern, toSupplementaries("abcdef"), false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   870
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   871
        pattern = Pattern.compile(Pattern.quote(toSupplementaries("abc\\Edef")));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   872
        check(pattern, toSupplementaries("abc\\Edef"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   873
        check(pattern, toSupplementaries("abcdef"), false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   874
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   875
        pattern = Pattern.compile(toSupplementaries("((((abc.+?:)"), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   876
        check(pattern, toSupplementaries("((((abc.+?:)"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   877
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   878
        flags |= Pattern.MULTILINE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   879
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   880
        pattern = Pattern.compile(toSupplementaries("^cat$"), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   881
        check(pattern, toSupplementaries("abc^cat$def"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   882
        check(pattern, toSupplementaries("cat"), false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   883
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   884
        flags |= Pattern.DOTALL;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   885
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   886
        // note: this is case-sensitive.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   887
        pattern = Pattern.compile(toSupplementaries("a...b"), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   888
        check(pattern, toSupplementaries("a...b"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   889
        check(pattern, toSupplementaries("axxxb"), false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   890
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   891
        flags |= Pattern.CANON_EQ;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   892
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   893
        String t = toSupplementaries("test");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   894
        p = Pattern.compile(t + "a\u030a", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   895
        check(pattern, t + "a\u030a", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   896
        check(pattern, t + "\u00e5", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   897
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   898
        report("Literal pattern");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   899
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   900
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   901
    // This test is for 4803179
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   902
    // This test is also for 4808962, replacement parts
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   903
    private static void literalReplacementTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   904
        int flags = Pattern.LITERAL;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   905
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   906
        Pattern pattern = Pattern.compile("abc", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   907
        Matcher matcher = pattern.matcher("zzzabczzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   908
        String replaceTest = "$0";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   909
        String result = matcher.replaceAll(replaceTest);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   910
        if (!result.equals("zzzabczzz"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   911
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   912
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   913
        matcher.reset();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   914
        String literalReplacement = matcher.quoteReplacement(replaceTest);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   915
        result = matcher.replaceAll(literalReplacement);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   916
        if (!result.equals("zzz$0zzz"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   917
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   918
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   919
        matcher.reset();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   920
        replaceTest = "\\t$\\$";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   921
        literalReplacement = matcher.quoteReplacement(replaceTest);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   922
        result = matcher.replaceAll(literalReplacement);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   923
        if (!result.equals("zzz\\t$\\$zzz"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   924
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   925
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   926
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   927
        pattern = Pattern.compile(toSupplementaries("abc"), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   928
        matcher = pattern.matcher(toSupplementaries("zzzabczzz"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   929
        replaceTest = "$0";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   930
        result = matcher.replaceAll(replaceTest);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   931
        if (!result.equals(toSupplementaries("zzzabczzz")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   932
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   933
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   934
        matcher.reset();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   935
        literalReplacement = matcher.quoteReplacement(replaceTest);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   936
        result = matcher.replaceAll(literalReplacement);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   937
        if (!result.equals(toSupplementaries("zzz$0zzz")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   938
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   939
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   940
        matcher.reset();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   941
        replaceTest = "\\t$\\$";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   942
        literalReplacement = matcher.quoteReplacement(replaceTest);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   943
        result = matcher.replaceAll(literalReplacement);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   944
        if (!result.equals(toSupplementaries("zzz\\t$\\$zzz")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   945
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   946
12432
748fcaa0e0c1 7067045: replaceAll("\u20ac", "$"); causses java.lang.StringIndexOutOfBoundsExceptio
sherman
parents: 11287
diff changeset
   947
        // IAE should be thrown if backslash or '$' is the last character
748fcaa0e0c1 7067045: replaceAll("\u20ac", "$"); causses java.lang.StringIndexOutOfBoundsExceptio
sherman
parents: 11287
diff changeset
   948
        // in replacement string
748fcaa0e0c1 7067045: replaceAll("\u20ac", "$"); causses java.lang.StringIndexOutOfBoundsExceptio
sherman
parents: 11287
diff changeset
   949
        try {
748fcaa0e0c1 7067045: replaceAll("\u20ac", "$"); causses java.lang.StringIndexOutOfBoundsExceptio
sherman
parents: 11287
diff changeset
   950
            "\uac00".replaceAll("\uac00", "$");
12675
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
   951
            failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
   952
        } catch (IllegalArgumentException iie) {
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
   953
        } catch (Exception e) {
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
   954
            failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
   955
        }
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
   956
        try {
12432
748fcaa0e0c1 7067045: replaceAll("\u20ac", "$"); causses java.lang.StringIndexOutOfBoundsExceptio
sherman
parents: 11287
diff changeset
   957
            "\uac00".replaceAll("\uac00", "\\");
748fcaa0e0c1 7067045: replaceAll("\u20ac", "$"); causses java.lang.StringIndexOutOfBoundsExceptio
sherman
parents: 11287
diff changeset
   958
            failCount++;
748fcaa0e0c1 7067045: replaceAll("\u20ac", "$"); causses java.lang.StringIndexOutOfBoundsExceptio
sherman
parents: 11287
diff changeset
   959
        } catch (IllegalArgumentException iie) {
748fcaa0e0c1 7067045: replaceAll("\u20ac", "$"); causses java.lang.StringIndexOutOfBoundsExceptio
sherman
parents: 11287
diff changeset
   960
        } catch (Exception e) {
748fcaa0e0c1 7067045: replaceAll("\u20ac", "$"); causses java.lang.StringIndexOutOfBoundsExceptio
sherman
parents: 11287
diff changeset
   961
            failCount++;
748fcaa0e0c1 7067045: replaceAll("\u20ac", "$"); causses java.lang.StringIndexOutOfBoundsExceptio
sherman
parents: 11287
diff changeset
   962
        }
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   963
        report("Literal replacement");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   964
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   965
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   966
    // This test is for 4757029
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   967
    private static void regionTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   968
        Pattern pattern = Pattern.compile("abc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   969
        Matcher matcher = pattern.matcher("abcdefabc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   970
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   971
        matcher.region(0,9);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   972
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   973
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   974
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   975
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   976
        matcher.region(0,3);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   977
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   978
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   979
        matcher.region(3,6);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   980
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   981
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   982
        matcher.region(0,2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   983
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   984
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   985
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   986
        expectRegionFail(matcher, 1, -1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   987
        expectRegionFail(matcher, -1, -1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   988
        expectRegionFail(matcher, -1, 1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   989
        expectRegionFail(matcher, 5, 3);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   990
        expectRegionFail(matcher, 5, 12);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   991
        expectRegionFail(matcher, 12, 12);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   992
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   993
        pattern = Pattern.compile("^abc$");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   994
        matcher = pattern.matcher("zzzabczzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   995
        matcher.region(0,9);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   996
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   997
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   998
        matcher.region(3,6);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
   999
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1000
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1001
        matcher.region(3,6);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1002
        matcher.useAnchoringBounds(false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1003
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1004
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1005
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1006
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1007
        pattern = Pattern.compile(toSupplementaries("abc"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1008
        matcher = pattern.matcher(toSupplementaries("abcdefabc"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1009
        matcher.region(0,9*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1010
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1011
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1012
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1013
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1014
        matcher.region(0,3*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1015
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1016
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1017
        matcher.region(1,3*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1018
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1019
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1020
        matcher.region(3*2,6*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1021
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1022
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1023
        matcher.region(0,2*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1024
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1025
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1026
        matcher.region(0,2*2+1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1027
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1028
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1029
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1030
        expectRegionFail(matcher, 1*2, -1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1031
        expectRegionFail(matcher, -1, -1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1032
        expectRegionFail(matcher, -1, 1*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1033
        expectRegionFail(matcher, 5*2, 3*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1034
        expectRegionFail(matcher, 5*2, 12*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1035
        expectRegionFail(matcher, 12*2, 12*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1036
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1037
        pattern = Pattern.compile(toSupplementaries("^abc$"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1038
        matcher = pattern.matcher(toSupplementaries("zzzabczzz"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1039
        matcher.region(0,9*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1040
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1041
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1042
        matcher.region(3*2,6*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1043
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1044
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1045
        matcher.region(3*2+1,6*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1046
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1047
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1048
        matcher.region(3*2,6*2-1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1049
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1050
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1051
        matcher.region(3*2,6*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1052
        matcher.useAnchoringBounds(false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1053
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1054
           failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1055
        report("Regions");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1056
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1057
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1058
    private static void expectRegionFail(Matcher matcher, int index1,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1059
                                         int index2)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1060
    {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1061
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1062
            matcher.region(index1, index2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1063
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1064
        } catch (IndexOutOfBoundsException ioobe) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1065
            // Correct result
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1066
        } catch (IllegalStateException ise) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1067
            // Correct result
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1068
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1069
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1071
    // This test is for 4803197
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1072
    private static void escapedSegmentTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1073
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1074
        Pattern pattern = Pattern.compile("\\Qdir1\\dir2\\E");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1075
        check(pattern, "dir1\\dir2", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1076
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1077
        pattern = Pattern.compile("\\Qdir1\\dir2\\\\E");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1078
        check(pattern, "dir1\\dir2\\", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1079
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1080
        pattern = Pattern.compile("(\\Qdir1\\dir2\\\\E)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1081
        check(pattern, "dir1\\dir2\\", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1082
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1083
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1084
        pattern = Pattern.compile(toSupplementaries("\\Qdir1\\dir2\\E"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1085
        check(pattern, toSupplementaries("dir1\\dir2"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1086
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1087
        pattern = Pattern.compile(toSupplementaries("\\Qdir1\\dir2")+"\\\\E");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1088
        check(pattern, toSupplementaries("dir1\\dir2\\"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1089
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1090
        pattern = Pattern.compile(toSupplementaries("(\\Qdir1\\dir2")+"\\\\E)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1091
        check(pattern, toSupplementaries("dir1\\dir2\\"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1092
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1093
        report("Escaped segment");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1094
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1095
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1096
    // This test is for 4792284
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1097
    private static void nonCaptureRepetitionTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1098
        String input = "abcdefgh;";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1099
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1100
        String[] patterns = new String[] {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1101
            "(?:\\w{4})+;",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1102
            "(?:\\w{8})*;",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1103
            "(?:\\w{2}){2,4};",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1104
            "(?:\\w{4}){2,};",   // only matches the
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1105
            ".*?(?:\\w{5})+;",   //     specified minimum
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1106
            ".*?(?:\\w{9})*;",   //     number of reps - OK
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1107
            "(?:\\w{4})+?;",     // lazy repetition - OK
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1108
            "(?:\\w{4})++;",     // possessive repetition - OK
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1109
            "(?:\\w{2,}?)+;",    // non-deterministic - OK
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1110
            "(\\w{4})+;",        // capturing group - OK
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1111
        };
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1112
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1113
        for (int i = 0; i < patterns.length; i++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1114
            // Check find()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1115
            check(patterns[i], 0, input, input, true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1116
            // Check matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1117
            Pattern p = Pattern.compile(patterns[i]);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1118
            Matcher m = p.matcher(input);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1119
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1120
            if (m.matches()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1121
                if (!m.group(0).equals(input))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1122
                    failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1123
            } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1124
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1125
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1126
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1127
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1128
        report("Non capturing repetition");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1129
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1130
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1131
    // This test is for 6358731
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1132
    private static void notCapturedGroupCurlyMatchTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1133
        Pattern pattern = Pattern.compile("(abc)+|(abcd)+");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1134
        Matcher matcher = pattern.matcher("abcd");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1135
        if (!matcher.matches() ||
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1136
             matcher.group(1) != null ||
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1137
             !matcher.group(2).equals("abcd")) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1138
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1139
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1140
        report("Not captured GroupCurly");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1141
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1142
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1143
    // This test is for 4706545
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1144
    private static void javaCharClassTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1145
        for (int i=0; i<1000; i++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1146
            char c = (char)generator.nextInt();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1147
            check("{javaLowerCase}", c, Character.isLowerCase(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1148
            check("{javaUpperCase}", c, Character.isUpperCase(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1149
            check("{javaUpperCase}+", c, Character.isUpperCase(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1150
            check("{javaTitleCase}", c, Character.isTitleCase(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1151
            check("{javaDigit}", c, Character.isDigit(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1152
            check("{javaDefined}", c, Character.isDefined(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1153
            check("{javaLetter}", c, Character.isLetter(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1154
            check("{javaLetterOrDigit}", c, Character.isLetterOrDigit(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1155
            check("{javaJavaIdentifierStart}", c,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1156
                  Character.isJavaIdentifierStart(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1157
            check("{javaJavaIdentifierPart}", c,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1158
                  Character.isJavaIdentifierPart(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1159
            check("{javaUnicodeIdentifierStart}", c,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1160
                  Character.isUnicodeIdentifierStart(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1161
            check("{javaUnicodeIdentifierPart}", c,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1162
                  Character.isUnicodeIdentifierPart(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1163
            check("{javaIdentifierIgnorable}", c,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1164
                  Character.isIdentifierIgnorable(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1165
            check("{javaSpaceChar}", c, Character.isSpaceChar(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1166
            check("{javaWhitespace}", c, Character.isWhitespace(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1167
            check("{javaISOControl}", c, Character.isISOControl(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1168
            check("{javaMirrored}", c, Character.isMirrored(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1169
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1170
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1171
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1172
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1173
        for (int i=0; i<1000; i++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1174
            int c = generator.nextInt(Character.MAX_CODE_POINT
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1175
                                      - Character.MIN_SUPPLEMENTARY_CODE_POINT)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1176
                        + Character.MIN_SUPPLEMENTARY_CODE_POINT;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1177
            check("{javaLowerCase}", c, Character.isLowerCase(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1178
            check("{javaUpperCase}", c, Character.isUpperCase(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1179
            check("{javaUpperCase}+", c, Character.isUpperCase(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1180
            check("{javaTitleCase}", c, Character.isTitleCase(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1181
            check("{javaDigit}", c, Character.isDigit(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1182
            check("{javaDefined}", c, Character.isDefined(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1183
            check("{javaLetter}", c, Character.isLetter(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1184
            check("{javaLetterOrDigit}", c, Character.isLetterOrDigit(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1185
            check("{javaJavaIdentifierStart}", c,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1186
                  Character.isJavaIdentifierStart(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1187
            check("{javaJavaIdentifierPart}", c,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1188
                  Character.isJavaIdentifierPart(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1189
            check("{javaUnicodeIdentifierStart}", c,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1190
                  Character.isUnicodeIdentifierStart(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1191
            check("{javaUnicodeIdentifierPart}", c,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1192
                  Character.isUnicodeIdentifierPart(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1193
            check("{javaIdentifierIgnorable}", c,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1194
                  Character.isIdentifierIgnorable(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1195
            check("{javaSpaceChar}", c, Character.isSpaceChar(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1196
            check("{javaWhitespace}", c, Character.isWhitespace(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1197
            check("{javaISOControl}", c, Character.isISOControl(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1198
            check("{javaMirrored}", c, Character.isMirrored(c));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1199
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1200
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1201
        report("Java character classes");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1202
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1203
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1204
    // This test is for 4523620
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1205
    /*
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1206
    private static void numOccurrencesTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1207
        Pattern pattern = Pattern.compile("aaa");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1208
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1209
        if (pattern.numOccurrences("aaaaaa", false) != 2)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1210
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1211
        if (pattern.numOccurrences("aaaaaa", true) != 4)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1212
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1213
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1214
        pattern = Pattern.compile("^");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1215
        if (pattern.numOccurrences("aaaaaa", false) != 1)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1216
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1217
        if (pattern.numOccurrences("aaaaaa", true) != 1)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1218
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1219
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1220
        report("Number of Occurrences");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1221
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1222
    */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1223
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1224
    // This test is for 4776374
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1225
    private static void caretBetweenTerminatorsTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1226
        int flags1 = Pattern.DOTALL;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1227
        int flags2 = Pattern.DOTALL | Pattern.UNIX_LINES;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1228
        int flags3 = Pattern.DOTALL | Pattern.UNIX_LINES | Pattern.MULTILINE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1229
        int flags4 = Pattern.DOTALL | Pattern.MULTILINE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1230
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1231
        check("^....", flags1, "test\ntest", "test", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1232
        check(".....^", flags1, "test\ntest", "test", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1233
        check(".....^", flags1, "test\n", "test", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1234
        check("....^", flags1, "test\r\n", "test", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1235
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1236
        check("^....", flags2, "test\ntest", "test", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1237
        check("....^", flags2, "test\ntest", "test", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1238
        check(".....^", flags2, "test\n", "test", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1239
        check("....^", flags2, "test\r\n", "test", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1240
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1241
        check("^....", flags3, "test\ntest", "test", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1242
        check(".....^", flags3, "test\ntest", "test\n", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1243
        check(".....^", flags3, "test\u0085test", "test\u0085", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1244
        check(".....^", flags3, "test\n", "test", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1245
        check(".....^", flags3, "test\r\n", "test", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1246
        check("......^", flags3, "test\r\ntest", "test\r\n", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1247
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1248
        check("^....", flags4, "test\ntest", "test", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1249
        check(".....^", flags3, "test\ntest", "test\n", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1250
        check(".....^", flags4, "test\u0085test", "test\u0085", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1251
        check(".....^", flags4, "test\n", "test\n", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1252
        check(".....^", flags4, "test\r\n", "test\r", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1253
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1254
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1255
        String t = toSupplementaries("test");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1256
        check("^....", flags1, t+"\n"+t, t, true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1257
        check(".....^", flags1, t+"\n"+t, t, false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1258
        check(".....^", flags1, t+"\n", t, false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1259
        check("....^", flags1, t+"\r\n", t, false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1260
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1261
        check("^....", flags2, t+"\n"+t, t, true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1262
        check("....^", flags2, t+"\n"+t, t, false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1263
        check(".....^", flags2, t+"\n", t, false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1264
        check("....^", flags2, t+"\r\n", t, false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1265
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1266
        check("^....", flags3, t+"\n"+t, t, true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1267
        check(".....^", flags3, t+"\n"+t, t+"\n", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1268
        check(".....^", flags3, t+"\u0085"+t, t+"\u0085", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1269
        check(".....^", flags3, t+"\n", t, false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1270
        check(".....^", flags3, t+"\r\n", t, false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1271
        check("......^", flags3, t+"\r\n"+t, t+"\r\n", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1272
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1273
        check("^....", flags4, t+"\n"+t, t, true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1274
        check(".....^", flags3, t+"\n"+t, t+"\n", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1275
        check(".....^", flags4, t+"\u0085"+t, t+"\u0085", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1276
        check(".....^", flags4, t+"\n", t+"\n", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1277
        check(".....^", flags4, t+"\r\n", t+"\r", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1278
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1279
        report("Caret between terminators");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1280
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1281
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1282
    // This test is for 4727935
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1283
    private static void dollarAtEndTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1284
        int flags1 = Pattern.DOTALL;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1285
        int flags2 = Pattern.DOTALL | Pattern.UNIX_LINES;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1286
        int flags3 = Pattern.DOTALL | Pattern.MULTILINE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1287
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1288
        check("....$", flags1, "test\n", "test", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1289
        check("....$", flags1, "test\r\n", "test", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1290
        check(".....$", flags1, "test\n", "test\n", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1291
        check(".....$", flags1, "test\u0085", "test\u0085", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1292
        check("....$", flags1, "test\u0085", "test", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1293
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1294
        check("....$", flags2, "test\n", "test", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1295
        check(".....$", flags2, "test\n", "test\n", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1296
        check(".....$", flags2, "test\u0085", "test\u0085", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1297
        check("....$", flags2, "test\u0085", "est\u0085", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1298
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1299
        check("....$.blah", flags3, "test\nblah", "test\nblah", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1300
        check(".....$.blah", flags3, "test\n\nblah", "test\n\nblah", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1301
        check("....$blah", flags3, "test\nblah", "!!!!", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1302
        check(".....$blah", flags3, "test\nblah", "!!!!", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1303
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1304
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1305
        String t = toSupplementaries("test");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1306
        String b = toSupplementaries("blah");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1307
        check("....$", flags1, t+"\n", t, true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1308
        check("....$", flags1, t+"\r\n", t, true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1309
        check(".....$", flags1, t+"\n", t+"\n", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1310
        check(".....$", flags1, t+"\u0085", t+"\u0085", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1311
        check("....$", flags1, t+"\u0085", t, true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1312
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1313
        check("....$", flags2, t+"\n", t, true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1314
        check(".....$", flags2, t+"\n", t+"\n", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1315
        check(".....$", flags2, t+"\u0085", t+"\u0085", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1316
        check("....$", flags2, t+"\u0085", toSupplementaries("est\u0085"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1317
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1318
        check("....$."+b, flags3, t+"\n"+b, t+"\n"+b, true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1319
        check(".....$."+b, flags3, t+"\n\n"+b, t+"\n\n"+b, true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1320
        check("....$"+b, flags3, t+"\n"+b, "!!!!", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1321
        check(".....$"+b, flags3, t+"\n"+b, "!!!!", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1322
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1323
        report("Dollar at End");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1324
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1325
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1326
    // This test is for 4711773
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1327
    private static void multilineDollarTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1328
        Pattern findCR = Pattern.compile("$", Pattern.MULTILINE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1329
        Matcher matcher = findCR.matcher("first bit\nsecond bit");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1330
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1331
        if (matcher.start(0) != 9)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1332
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1333
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1334
        if (matcher.start(0) != 20)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1335
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1336
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1337
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1338
        matcher = findCR.matcher(toSupplementaries("first  bit\n second  bit")); // double BMP chars
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1339
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1340
        if (matcher.start(0) != 9*2)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1341
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1342
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1343
        if (matcher.start(0) != 20*2)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1344
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1345
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1346
        report("Multiline Dollar");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1347
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1348
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1349
    private static void reluctantRepetitionTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1350
        Pattern p = Pattern.compile("1(\\s\\S+?){1,3}?[\\s,]2");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1351
        check(p, "1 word word word 2", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1352
        check(p, "1 wor wo w 2", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1353
        check(p, "1 word word 2", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1354
        check(p, "1 word 2", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1355
        check(p, "1 wo w w 2", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1356
        check(p, "1 wo w 2", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1357
        check(p, "1 wor w 2", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1358
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1359
        p = Pattern.compile("([a-z])+?c");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1360
        Matcher m = p.matcher("ababcdefdec");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1361
        check(m, "ababc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1362
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1363
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1364
        p = Pattern.compile(toSupplementaries("([a-z])+?c"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1365
        m = p.matcher(toSupplementaries("ababcdefdec"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1366
        check(m, toSupplementaries("ababc"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1367
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1368
        report("Reluctant Repetition");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1369
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1370
48491
7f11a1699ef6 8194667: Regex: Serialization doesn't work with match flags
sherman
parents: 47216
diff changeset
  1371
    private static Pattern serializedPattern(Pattern p) throws Exception {
7f11a1699ef6 8194667: Regex: Serialization doesn't work with match flags
sherman
parents: 47216
diff changeset
  1372
        ByteArrayOutputStream baos = new ByteArrayOutputStream();
7f11a1699ef6 8194667: Regex: Serialization doesn't work with match flags
sherman
parents: 47216
diff changeset
  1373
        ObjectOutputStream oos = new ObjectOutputStream(baos);
7f11a1699ef6 8194667: Regex: Serialization doesn't work with match flags
sherman
parents: 47216
diff changeset
  1374
        oos.writeObject(p);
7f11a1699ef6 8194667: Regex: Serialization doesn't work with match flags
sherman
parents: 47216
diff changeset
  1375
        oos.close();
7f11a1699ef6 8194667: Regex: Serialization doesn't work with match flags
sherman
parents: 47216
diff changeset
  1376
        try (ObjectInputStream ois = new ObjectInputStream(
7f11a1699ef6 8194667: Regex: Serialization doesn't work with match flags
sherman
parents: 47216
diff changeset
  1377
                new ByteArrayInputStream(baos.toByteArray()))) {
7f11a1699ef6 8194667: Regex: Serialization doesn't work with match flags
sherman
parents: 47216
diff changeset
  1378
            return (Pattern)ois.readObject();
7f11a1699ef6 8194667: Regex: Serialization doesn't work with match flags
sherman
parents: 47216
diff changeset
  1379
        }
7f11a1699ef6 8194667: Regex: Serialization doesn't work with match flags
sherman
parents: 47216
diff changeset
  1380
    }
7f11a1699ef6 8194667: Regex: Serialization doesn't work with match flags
sherman
parents: 47216
diff changeset
  1381
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1382
    private static void serializeTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1383
        String patternStr = "(b)";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1384
        String matchStr = "b";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1385
        Pattern pattern = Pattern.compile(patternStr);
48491
7f11a1699ef6 8194667: Regex: Serialization doesn't work with match flags
sherman
parents: 47216
diff changeset
  1386
        Pattern serializedPattern = serializedPattern(pattern);
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1387
        Matcher matcher = serializedPattern.matcher(matchStr);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1388
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1389
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1390
        if (matcher.groupCount() != 1)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1391
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1392
48491
7f11a1699ef6 8194667: Regex: Serialization doesn't work with match flags
sherman
parents: 47216
diff changeset
  1393
        pattern = Pattern.compile("a(?-i)b", Pattern.CASE_INSENSITIVE);
7f11a1699ef6 8194667: Regex: Serialization doesn't work with match flags
sherman
parents: 47216
diff changeset
  1394
        serializedPattern = serializedPattern(pattern);
7f11a1699ef6 8194667: Regex: Serialization doesn't work with match flags
sherman
parents: 47216
diff changeset
  1395
        if (!serializedPattern.matcher("Ab").matches())
7f11a1699ef6 8194667: Regex: Serialization doesn't work with match flags
sherman
parents: 47216
diff changeset
  1396
            failCount++;
7f11a1699ef6 8194667: Regex: Serialization doesn't work with match flags
sherman
parents: 47216
diff changeset
  1397
        if (serializedPattern.matcher("AB").matches())
7f11a1699ef6 8194667: Regex: Serialization doesn't work with match flags
sherman
parents: 47216
diff changeset
  1398
            failCount++;
7f11a1699ef6 8194667: Regex: Serialization doesn't work with match flags
sherman
parents: 47216
diff changeset
  1399
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1400
        report("Serialization");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1401
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1402
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1403
    private static void gTest() {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1404
        Pattern pattern = Pattern.compile("\\G\\w");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1405
        Matcher matcher = pattern.matcher("abc#x#x");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1406
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1407
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1408
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1409
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1410
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1411
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1412
        pattern = Pattern.compile("\\GA*");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1413
        matcher = pattern.matcher("1A2AA3");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1414
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1415
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1416
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1417
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1418
        pattern = Pattern.compile("\\GA*");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1419
        matcher = pattern.matcher("1A2AA3");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1420
        if (!matcher.find(1))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1421
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1422
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1423
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1424
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1425
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1426
        report("\\G");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1427
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1428
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1429
    private static void zTest() {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1430
        Pattern pattern = Pattern.compile("foo\\Z");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1431
        // Positives
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1432
        check(pattern, "foo\u0085", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1433
        check(pattern, "foo\u2028", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1434
        check(pattern, "foo\u2029", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1435
        check(pattern, "foo\n", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1436
        check(pattern, "foo\r", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1437
        check(pattern, "foo\r\n", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1438
        // Negatives
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1439
        check(pattern, "fooo", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1440
        check(pattern, "foo\n\r", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1441
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1442
        pattern = Pattern.compile("foo\\Z", Pattern.UNIX_LINES);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1443
        // Positives
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1444
        check(pattern, "foo", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1445
        check(pattern, "foo\n", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1446
        // Negatives
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1447
        check(pattern, "foo\r", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1448
        check(pattern, "foo\u0085", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1449
        check(pattern, "foo\u2028", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1450
        check(pattern, "foo\u2029", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1451
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1452
        report("\\Z");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1453
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1454
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1455
    private static void replaceFirstTest() {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1456
        Pattern pattern = Pattern.compile("(ab)(c*)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1457
        Matcher matcher = pattern.matcher("abccczzzabcczzzabccc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1458
        if (!matcher.replaceFirst("test").equals("testzzzabcczzzabccc"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1459
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1460
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1461
        matcher.reset("zzzabccczzzabcczzzabccczzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1462
        if (!matcher.replaceFirst("test").equals("zzztestzzzabcczzzabccczzz"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1463
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1464
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1465
        matcher.reset("zzzabccczzzabcczzzabccczzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1466
        String result = matcher.replaceFirst("$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1467
        if (!result.equals("zzzabzzzabcczzzabccczzz"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1468
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1469
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1470
        matcher.reset("zzzabccczzzabcczzzabccczzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1471
        result = matcher.replaceFirst("$2");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1472
        if (!result.equals("zzzccczzzabcczzzabccczzz"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1473
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1474
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1475
        pattern = Pattern.compile("a*");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1476
        matcher = pattern.matcher("aaaaaaaaaa");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1477
        if (!matcher.replaceFirst("test").equals("test"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1478
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1479
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1480
        pattern = Pattern.compile("a+");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1481
        matcher = pattern.matcher("zzzaaaaaaaaaa");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1482
        if (!matcher.replaceFirst("test").equals("zzztest"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1483
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1484
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1485
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1486
        pattern = Pattern.compile(toSupplementaries("(ab)(c*)"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1487
        matcher = pattern.matcher(toSupplementaries("abccczzzabcczzzabccc"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1488
        if (!matcher.replaceFirst(toSupplementaries("test"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1489
                .equals(toSupplementaries("testzzzabcczzzabccc")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1490
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1491
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1492
        matcher.reset(toSupplementaries("zzzabccczzzabcczzzabccczzz"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1493
        if (!matcher.replaceFirst(toSupplementaries("test")).
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1494
            equals(toSupplementaries("zzztestzzzabcczzzabccczzz")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1495
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1496
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1497
        matcher.reset(toSupplementaries("zzzabccczzzabcczzzabccczzz"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1498
        result = matcher.replaceFirst("$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1499
        if (!result.equals(toSupplementaries("zzzabzzzabcczzzabccczzz")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1500
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1501
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1502
        matcher.reset(toSupplementaries("zzzabccczzzabcczzzabccczzz"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1503
        result = matcher.replaceFirst("$2");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1504
        if (!result.equals(toSupplementaries("zzzccczzzabcczzzabccczzz")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1505
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1506
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1507
        pattern = Pattern.compile(toSupplementaries("a*"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1508
        matcher = pattern.matcher(toSupplementaries("aaaaaaaaaa"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1509
        if (!matcher.replaceFirst(toSupplementaries("test")).equals(toSupplementaries("test")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1510
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1511
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1512
        pattern = Pattern.compile(toSupplementaries("a+"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1513
        matcher = pattern.matcher(toSupplementaries("zzzaaaaaaaaaa"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1514
        if (!matcher.replaceFirst(toSupplementaries("test")).equals(toSupplementaries("zzztest")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1515
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1516
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1517
        report("Replace First");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1518
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1519
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1520
    private static void unixLinesTest() {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1521
        Pattern pattern = Pattern.compile(".*");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1522
        Matcher matcher = pattern.matcher("aa\u2028blah");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1523
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1524
        if (!matcher.group(0).equals("aa"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1525
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1526
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1527
        pattern = Pattern.compile(".*", Pattern.UNIX_LINES);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1528
        matcher = pattern.matcher("aa\u2028blah");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1529
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1530
        if (!matcher.group(0).equals("aa\u2028blah"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1531
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1532
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1533
        pattern = Pattern.compile("[az]$",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1534
                                  Pattern.MULTILINE | Pattern.UNIX_LINES);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1535
        matcher = pattern.matcher("aa\u2028zz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1536
        check(matcher, "a\u2028", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1537
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1538
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1539
        pattern = Pattern.compile(".*");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1540
        matcher = pattern.matcher(toSupplementaries("aa\u2028blah"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1541
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1542
        if (!matcher.group(0).equals(toSupplementaries("aa")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1543
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1544
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1545
        pattern = Pattern.compile(".*", Pattern.UNIX_LINES);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1546
        matcher = pattern.matcher(toSupplementaries("aa\u2028blah"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1547
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1548
        if (!matcher.group(0).equals(toSupplementaries("aa\u2028blah")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1549
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1550
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1551
        pattern = Pattern.compile(toSupplementaries("[az]$"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1552
                                  Pattern.MULTILINE | Pattern.UNIX_LINES);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1553
        matcher = pattern.matcher(toSupplementaries("aa\u2028zz"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1554
        check(matcher, toSupplementaries("a\u2028"), false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1555
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1556
        report("Unix Lines");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1557
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1558
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1559
    private static void commentsTest() {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1560
        int flags = Pattern.COMMENTS;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1561
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1562
        Pattern pattern = Pattern.compile("aa \\# aa", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1563
        Matcher matcher = pattern.matcher("aa#aa");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1564
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1565
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1566
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1567
        pattern = Pattern.compile("aa  # blah", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1568
        matcher = pattern.matcher("aa");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1569
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1570
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1571
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1572
        pattern = Pattern.compile("aa blah", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1573
        matcher = pattern.matcher("aablah");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1574
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1575
             failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1576
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1577
        pattern = Pattern.compile("aa  # blah blech  ", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1578
        matcher = pattern.matcher("aa");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1579
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1580
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1581
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1582
        pattern = Pattern.compile("aa  # blah\n  ", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1583
        matcher = pattern.matcher("aa");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1584
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1585
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1586
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1587
        pattern = Pattern.compile("aa  # blah\nbc # blech", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1588
        matcher = pattern.matcher("aabc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1589
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1590
             failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1591
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1592
        pattern = Pattern.compile("aa  # blah\nbc# blech", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1593
        matcher = pattern.matcher("aabc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1594
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1595
             failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1596
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1597
        pattern = Pattern.compile("aa  # blah\nbc\\# blech", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1598
        matcher = pattern.matcher("aabc#blech");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1599
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1600
             failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1601
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1602
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1603
        pattern = Pattern.compile(toSupplementaries("aa \\# aa"), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1604
        matcher = pattern.matcher(toSupplementaries("aa#aa"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1605
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1606
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1607
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1608
        pattern = Pattern.compile(toSupplementaries("aa  # blah"), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1609
        matcher = pattern.matcher(toSupplementaries("aa"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1610
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1611
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1612
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1613
        pattern = Pattern.compile(toSupplementaries("aa blah"), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1614
        matcher = pattern.matcher(toSupplementaries("aablah"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1615
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1616
             failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1617
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1618
        pattern = Pattern.compile(toSupplementaries("aa  # blah blech  "), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1619
        matcher = pattern.matcher(toSupplementaries("aa"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1620
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1621
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1622
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1623
        pattern = Pattern.compile(toSupplementaries("aa  # blah\n  "), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1624
        matcher = pattern.matcher(toSupplementaries("aa"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1625
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1626
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1627
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1628
        pattern = Pattern.compile(toSupplementaries("aa  # blah\nbc # blech"), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1629
        matcher = pattern.matcher(toSupplementaries("aabc"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1630
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1631
             failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1632
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1633
        pattern = Pattern.compile(toSupplementaries("aa  # blah\nbc# blech"), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1634
        matcher = pattern.matcher(toSupplementaries("aabc"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1635
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1636
             failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1637
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1638
        pattern = Pattern.compile(toSupplementaries("aa  # blah\nbc\\# blech"), flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1639
        matcher = pattern.matcher(toSupplementaries("aabc#blech"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1640
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1641
             failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1642
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1643
        report("Comments");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1644
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1645
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1646
    private static void caseFoldingTest() { // bug 4504687
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1647
        int flags = Pattern.CASE_INSENSITIVE | Pattern.UNICODE_CASE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1648
        Pattern pattern = Pattern.compile("aa", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1649
        Matcher matcher = pattern.matcher("ab");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1650
        if (matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1651
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1652
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1653
        pattern = Pattern.compile("aA", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1654
        matcher = pattern.matcher("ab");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1655
        if (matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1656
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1657
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1658
        pattern = Pattern.compile("aa", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1659
        matcher = pattern.matcher("aB");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1660
        if (matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1661
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1662
        matcher = pattern.matcher("Ab");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1663
        if (matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1664
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1665
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1666
        // ASCII               "a"
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1667
        // Latin-1 Supplement  "a" + grave
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1668
        // Cyrillic            "a"
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1669
        String[] patterns = new String[] {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1670
            //single
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1671
            "a", "\u00e0", "\u0430",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1672
            //slice
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1673
            "ab", "\u00e0\u00e1", "\u0430\u0431",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1674
            //class single
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1675
            "[a]", "[\u00e0]", "[\u0430]",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1676
            //class range
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1677
            "[a-b]", "[\u00e0-\u00e5]", "[\u0430-\u0431]",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1678
            //back reference
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1679
            "(a)\\1", "(\u00e0)\\1", "(\u0430)\\1"
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1680
        };
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1681
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1682
        String[] texts = new String[] {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1683
            "A", "\u00c0", "\u0410",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1684
            "AB", "\u00c0\u00c1", "\u0410\u0411",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1685
            "A", "\u00c0", "\u0410",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1686
            "B", "\u00c2", "\u0411",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1687
            "aA", "\u00e0\u00c0", "\u0430\u0410"
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1688
        };
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1689
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1690
        boolean[] expected = new boolean[] {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1691
            true, false, false,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1692
            true, false, false,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1693
            true, false, false,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1694
            true, false, false,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1695
            true, false, false
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1696
        };
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1697
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1698
        flags = Pattern.CASE_INSENSITIVE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1699
        for (int i = 0; i < patterns.length; i++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1700
            pattern = Pattern.compile(patterns[i], flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1701
            matcher = pattern.matcher(texts[i]);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1702
            if (matcher.matches() != expected[i]) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1703
                System.out.println("<1> Failed at " + i);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1704
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1705
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1706
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1707
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1708
        flags = Pattern.CASE_INSENSITIVE | Pattern.UNICODE_CASE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1709
        for (int i = 0; i < patterns.length; i++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1710
            pattern = Pattern.compile(patterns[i], flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1711
            matcher = pattern.matcher(texts[i]);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1712
            if (!matcher.matches()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1713
                System.out.println("<2> Failed at " + i);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1714
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1715
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1716
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1717
        // flag unicode_case alone should do nothing
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1718
        flags = Pattern.UNICODE_CASE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1719
        for (int i = 0; i < patterns.length; i++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1720
            pattern = Pattern.compile(patterns[i], flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1721
            matcher = pattern.matcher(texts[i]);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1722
            if (matcher.matches()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1723
                System.out.println("<3> Failed at " + i);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1724
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1725
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1726
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1727
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1728
        // Special cases: i, I, u+0131 and u+0130
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1729
        flags = Pattern.UNICODE_CASE | Pattern.CASE_INSENSITIVE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1730
        pattern = Pattern.compile("[h-j]+", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1731
        if (!pattern.matcher("\u0131\u0130").matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1732
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1733
        report("Case Folding");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1734
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1735
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1736
    private static void appendTest() {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1737
        Pattern pattern = Pattern.compile("(ab)(cd)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1738
        Matcher matcher = pattern.matcher("abcd");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1739
        String result = matcher.replaceAll("$2$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1740
        if (!result.equals("cdab"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1741
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1742
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1743
        String  s1 = "Swap all: first = 123, second = 456";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1744
        String  s2 = "Swap one: first = 123, second = 456";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1745
        String  r  = "$3$2$1";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1746
        pattern = Pattern.compile("([a-z]+)( *= *)([0-9]+)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1747
        matcher = pattern.matcher(s1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1748
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1749
        result = matcher.replaceAll(r);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1750
        if (!result.equals("Swap all: 123 = first, 456 = second"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1751
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1752
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1753
        matcher = pattern.matcher(s2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1754
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1755
        if (matcher.find()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1756
            StringBuffer sb = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1757
            matcher.appendReplacement(sb, r);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1758
            matcher.appendTail(sb);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1759
            result = sb.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1760
            if (!result.equals("Swap one: 123 = first, second = 456"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1761
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1762
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1763
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1764
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1765
        pattern = Pattern.compile(toSupplementaries("(ab)(cd)"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1766
        matcher = pattern.matcher(toSupplementaries("abcd"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1767
        result = matcher.replaceAll("$2$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1768
        if (!result.equals(toSupplementaries("cdab")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1769
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1770
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1771
        s1 = toSupplementaries("Swap all: first = 123, second = 456");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1772
        s2 = toSupplementaries("Swap one: first = 123, second = 456");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1773
        r  = toSupplementaries("$3$2$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1774
        pattern = Pattern.compile(toSupplementaries("([a-z]+)( *= *)([0-9]+)"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1775
        matcher = pattern.matcher(s1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1776
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1777
        result = matcher.replaceAll(r);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1778
        if (!result.equals(toSupplementaries("Swap all: 123 = first, 456 = second")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1779
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1780
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1781
        matcher = pattern.matcher(s2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1782
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1783
        if (matcher.find()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1784
            StringBuffer sb = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1785
            matcher.appendReplacement(sb, r);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1786
            matcher.appendTail(sb);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1787
            result = sb.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1788
            if (!result.equals(toSupplementaries("Swap one: 123 = first, second = 456")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1789
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1790
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1791
        report("Append");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1792
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1793
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1794
    private static void splitTest() {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1795
        Pattern pattern = Pattern.compile(":");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1796
        String[] result = pattern.split("foo:and:boo", 2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1797
        if (!result[0].equals("foo"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1798
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1799
        if (!result[1].equals("and:boo"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1800
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1801
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1802
        Pattern patternX = Pattern.compile(toSupplementaries("X"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1803
        result = patternX.split(toSupplementaries("fooXandXboo"), 2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1804
        if (!result[0].equals(toSupplementaries("foo")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1805
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1806
        if (!result[1].equals(toSupplementaries("andXboo")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1807
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1808
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1809
        CharBuffer cb = CharBuffer.allocate(100);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1810
        cb.put("foo:and:boo");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1811
        cb.flip();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1812
        result = pattern.split(cb);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1813
        if (!result[0].equals("foo"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1814
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1815
        if (!result[1].equals("and"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1816
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1817
        if (!result[2].equals("boo"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1818
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1819
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1820
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1821
        CharBuffer cbs = CharBuffer.allocate(100);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1822
        cbs.put(toSupplementaries("fooXandXboo"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1823
        cbs.flip();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1824
        result = patternX.split(cbs);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1825
        if (!result[0].equals(toSupplementaries("foo")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1826
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1827
        if (!result[1].equals(toSupplementaries("and")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1828
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1829
        if (!result[2].equals(toSupplementaries("boo")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1830
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1831
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1832
        String source = "0123456789";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1833
        for (int limit=-2; limit<3; limit++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1834
            for (int x=0; x<10; x++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1835
                result = source.split(Integer.toString(x), limit);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1836
                int expectedLength = limit < 1 ? 2 : limit;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1837
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1838
                if ((limit == 0) && (x == 9)) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1839
                    // expected dropping of ""
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1840
                    if (result.length != 1)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1841
                        failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1842
                    if (!result[0].equals("012345678")) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1843
                        failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1844
                    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1845
                } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1846
                    if (result.length != expectedLength) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1847
                        failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1848
                    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1849
                    if (!result[0].equals(source.substring(0,x))) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1850
                        if (limit != 1) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1851
                            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1852
                        } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1853
                            if (!result[0].equals(source.substring(0,10))) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1854
                                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1855
                            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1856
                        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1857
                    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1858
                    if (expectedLength > 1) { // Check segment 2
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1859
                        if (!result[1].equals(source.substring(x+1,10)))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1860
                            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1861
                    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1862
                }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1863
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1864
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1865
        // Check the case for no match found
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1866
        for (int limit=-2; limit<3; limit++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1867
            result = source.split("e", limit);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1868
            if (result.length != 1)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1869
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1870
            if (!result[0].equals(source))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1871
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1872
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1873
        // Check the case for limit == 0, source = "";
21668
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1874
        // split() now returns 0-length for empty source "" see #6559590
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1875
        source = "";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1876
        result = source.split("e", 0);
21670
ca3553133ede 8028321: Fix for String.split() empty input sequence/JDK-6559590 triggers regression
sherman
parents: 21668
diff changeset
  1877
        if (result.length != 1)
ca3553133ede 8028321: Fix for String.split() empty input sequence/JDK-6559590 triggers regression
sherman
parents: 21668
diff changeset
  1878
            failCount++;
ca3553133ede 8028321: Fix for String.split() empty input sequence/JDK-6559590 triggers regression
sherman
parents: 21668
diff changeset
  1879
        if (!result[0].equals(source))
21668
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1880
            failCount++;
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1881
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1882
        // Check both split() and splitAsStraem(), especially for zero-lenth
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1883
        // input and zero-lenth match cases
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1884
        String[][] input = new String[][] {
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1885
            { " ",           "Abc Efg Hij" },   // normal non-zero-match
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1886
            { " ",           " Abc Efg Hij" },  // leading empty str for non-zero-match
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1887
            { " ",           "Abc  Efg Hij" },  // non-zero-match in the middle
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1888
            { "(?=\\p{Lu})", "AbcEfgHij" },     // no leading empty str for zero-match
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1889
            { "(?=\\p{Lu})", "AbcEfg" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1890
            { "(?=\\p{Lu})", "Abc" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1891
            { " ",           "" },              // zero-length input
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1892
            { ".*",          "" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1893
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1894
            // some tests from PatternStreamTest.java
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1895
            { "4",       "awgqwefg1fefw4vssv1vvv1" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1896
            { "\u00a3a", "afbfq\u00a3abgwgb\u00a3awngnwggw\u00a3a\u00a3ahjrnhneerh" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1897
            { "1",       "awgqwefg1fefw4vssv1vvv1" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1898
            { "1",       "a\u4ebafg1fefw\u4eba4\u9f9cvssv\u9f9c1v\u672c\u672cvv" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1899
            { "\u56da",  "1\u56da23\u56da456\u56da7890" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1900
            { "\u56da",  "1\u56da23\u9f9c\u672c\u672c\u56da456\u56da\u9f9c\u672c7890" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1901
            { "\u56da",  "" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1902
            { "[ \t,:.]","This is,testing: with\tdifferent separators." }, //multiple septs
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1903
            { "o",       "boo:and:foo" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1904
            { "o",       "booooo:and:fooooo" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1905
            { "o",       "fooooo:" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1906
        };
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1907
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1908
        String[][] expected = new String[][] {
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1909
            { "Abc", "Efg", "Hij" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1910
            { "", "Abc", "Efg", "Hij" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1911
            { "Abc", "", "Efg", "Hij" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1912
            { "Abc", "Efg", "Hij" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1913
            { "Abc", "Efg" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1914
            { "Abc" },
21670
ca3553133ede 8028321: Fix for String.split() empty input sequence/JDK-6559590 triggers regression
sherman
parents: 21668
diff changeset
  1915
            { "" },
ca3553133ede 8028321: Fix for String.split() empty input sequence/JDK-6559590 triggers regression
sherman
parents: 21668
diff changeset
  1916
            { "" },
21668
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1917
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1918
            { "awgqwefg1fefw", "vssv1vvv1" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1919
            { "afbfq", "bgwgb", "wngnwggw", "", "hjrnhneerh" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1920
            { "awgqwefg", "fefw4vssv", "vvv" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1921
            { "a\u4ebafg", "fefw\u4eba4\u9f9cvssv\u9f9c", "v\u672c\u672cvv" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1922
            { "1", "23", "456", "7890" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1923
            { "1", "23\u9f9c\u672c\u672c", "456", "\u9f9c\u672c7890" },
21670
ca3553133ede 8028321: Fix for String.split() empty input sequence/JDK-6559590 triggers regression
sherman
parents: 21668
diff changeset
  1924
            { "" },
21668
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1925
            { "This", "is", "testing", "", "with", "different", "separators" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1926
            { "b", "", ":and:f" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1927
            { "b", "", "", "", "", ":and:f" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1928
            { "f", "", "", "", "", ":" },
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1929
        };
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1930
        for (int i = 0; i < input.length; i++) {
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1931
            pattern = Pattern.compile(input[i][0]);
21670
ca3553133ede 8028321: Fix for String.split() empty input sequence/JDK-6559590 triggers regression
sherman
parents: 21668
diff changeset
  1932
            if (!Arrays.equals(pattern.split(input[i][1]), expected[i])) {
21668
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1933
                failCount++;
21670
ca3553133ede 8028321: Fix for String.split() empty input sequence/JDK-6559590 triggers regression
sherman
parents: 21668
diff changeset
  1934
            }
ca3553133ede 8028321: Fix for String.split() empty input sequence/JDK-6559590 triggers regression
sherman
parents: 21668
diff changeset
  1935
            if (input[i][1].length() > 0 &&  // splitAsStream() return empty resulting
ca3553133ede 8028321: Fix for String.split() empty input sequence/JDK-6559590 triggers regression
sherman
parents: 21668
diff changeset
  1936
                                             // array for zero-length input for now
ca3553133ede 8028321: Fix for String.split() empty input sequence/JDK-6559590 triggers regression
sherman
parents: 21668
diff changeset
  1937
                !Arrays.equals(pattern.splitAsStream(input[i][1]).toArray(),
ca3553133ede 8028321: Fix for String.split() empty input sequence/JDK-6559590 triggers regression
sherman
parents: 21668
diff changeset
  1938
                               expected[i])) {
21668
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1939
                failCount++;
21670
ca3553133ede 8028321: Fix for String.split() empty input sequence/JDK-6559590 triggers regression
sherman
parents: 21668
diff changeset
  1940
            }
21668
b62ce4a9635f 8027645: Pattern.split() with positive lookahead
sherman
parents: 19604
diff changeset
  1941
        }
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1942
        report("Split");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1943
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1944
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1945
    private static void negationTest() {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1946
        Pattern pattern = Pattern.compile("[\\[@^]+");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1947
        Matcher matcher = pattern.matcher("@@@@[[[[^^^^");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1948
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1949
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1950
        if (!matcher.group(0).equals("@@@@[[[[^^^^"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1951
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1952
        pattern = Pattern.compile("[@\\[^]+");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1953
        matcher = pattern.matcher("@@@@[[[[^^^^");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1954
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1955
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1956
        if (!matcher.group(0).equals("@@@@[[[[^^^^"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1957
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1958
        pattern = Pattern.compile("[@\\[^@]+");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1959
        matcher = pattern.matcher("@@@@[[[[^^^^");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1960
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1961
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1962
        if (!matcher.group(0).equals("@@@@[[[[^^^^"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1963
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1964
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1965
        pattern = Pattern.compile("\\)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1966
        matcher = pattern.matcher("xxx)xxx");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1967
        if (!matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1968
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1969
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1970
        report("Negation");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1971
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1972
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1973
    private static void ampersandTest() {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1974
        Pattern pattern = Pattern.compile("[&@]+");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1975
        check(pattern, "@@@@&&&&", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1976
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1977
        pattern = Pattern.compile("[@&]+");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1978
        check(pattern, "@@@@&&&&", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1979
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1980
        pattern = Pattern.compile("[@\\&]+");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1981
        check(pattern, "@@@@&&&&", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1982
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1983
        report("Ampersand");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1984
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1985
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1986
    private static void octalTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1987
        Pattern pattern = Pattern.compile("\\u0007");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1988
        Matcher matcher = pattern.matcher("\u0007");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1989
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1990
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1991
        pattern = Pattern.compile("\\07");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1992
        matcher = pattern.matcher("\u0007");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1993
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1994
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1995
        pattern = Pattern.compile("\\007");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1996
        matcher = pattern.matcher("\u0007");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1997
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1998
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  1999
        pattern = Pattern.compile("\\0007");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2000
        matcher = pattern.matcher("\u0007");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2001
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2002
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2003
        pattern = Pattern.compile("\\040");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2004
        matcher = pattern.matcher("\u0020");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2005
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2006
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2007
        pattern = Pattern.compile("\\0403");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2008
        matcher = pattern.matcher("\u00203");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2009
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2010
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2011
        pattern = Pattern.compile("\\0103");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2012
        matcher = pattern.matcher("\u0043");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2013
        if (!matcher.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2014
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2015
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2016
        report("Octal");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2017
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2018
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2019
    private static void longPatternTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2020
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2021
            Pattern pattern = Pattern.compile(
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2022
                "a 32-character-long pattern xxxx");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2023
            pattern = Pattern.compile("a 33-character-long pattern xxxxx");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2024
            pattern = Pattern.compile("a thirty four character long regex");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2025
            StringBuffer patternToBe = new StringBuffer(101);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2026
            for (int i=0; i<100; i++)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2027
                patternToBe.append((char)(97 + i%26));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2028
            pattern = Pattern.compile(patternToBe.toString());
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2029
        } catch (PatternSyntaxException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2030
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2031
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2032
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2033
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2034
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2035
            Pattern pattern = Pattern.compile(
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2036
                toSupplementaries("a 32-character-long pattern xxxx"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2037
            pattern = Pattern.compile(toSupplementaries("a 33-character-long pattern xxxxx"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2038
            pattern = Pattern.compile(toSupplementaries("a thirty four character long regex"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2039
            StringBuffer patternToBe = new StringBuffer(101*2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2040
            for (int i=0; i<100; i++)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2041
                patternToBe.append(Character.toChars(Character.MIN_SUPPLEMENTARY_CODE_POINT
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2042
                                                     + 97 + i%26));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2043
            pattern = Pattern.compile(patternToBe.toString());
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2044
        } catch (PatternSyntaxException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2045
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2046
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2047
        report("LongPattern");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2048
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2049
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2050
    private static void group0Test() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2051
        Pattern pattern = Pattern.compile("(tes)ting");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2052
        Matcher matcher = pattern.matcher("testing");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2053
        check(matcher, "testing");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2054
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2055
        matcher.reset("testing");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2056
        if (matcher.lookingAt()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2057
            if (!matcher.group(0).equals("testing"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2058
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2059
        } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2060
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2061
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2062
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2063
        matcher.reset("testing");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2064
        if (matcher.matches()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2065
            if (!matcher.group(0).equals("testing"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2066
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2067
        } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2068
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2069
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2071
        pattern = Pattern.compile("(tes)ting");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2072
        matcher = pattern.matcher("testing");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2073
        if (matcher.lookingAt()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2074
            if (!matcher.group(0).equals("testing"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2075
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2076
        } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2077
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2078
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2079
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2080
        pattern = Pattern.compile("^(tes)ting");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2081
        matcher = pattern.matcher("testing");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2082
        if (matcher.matches()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2083
            if (!matcher.group(0).equals("testing"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2084
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2085
        } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2086
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2087
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2088
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2089
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2090
        pattern = Pattern.compile(toSupplementaries("(tes)ting"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2091
        matcher = pattern.matcher(toSupplementaries("testing"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2092
        check(matcher, toSupplementaries("testing"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2093
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2094
        matcher.reset(toSupplementaries("testing"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2095
        if (matcher.lookingAt()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2096
            if (!matcher.group(0).equals(toSupplementaries("testing")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2097
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2098
        } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2099
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2100
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2101
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2102
        matcher.reset(toSupplementaries("testing"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2103
        if (matcher.matches()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2104
            if (!matcher.group(0).equals(toSupplementaries("testing")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2105
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2106
        } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2107
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2108
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2109
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2110
        pattern = Pattern.compile(toSupplementaries("(tes)ting"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2111
        matcher = pattern.matcher(toSupplementaries("testing"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2112
        if (matcher.lookingAt()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2113
            if (!matcher.group(0).equals(toSupplementaries("testing")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2114
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2115
        } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2116
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2117
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2118
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2119
        pattern = Pattern.compile(toSupplementaries("^(tes)ting"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2120
        matcher = pattern.matcher(toSupplementaries("testing"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2121
        if (matcher.matches()) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2122
            if (!matcher.group(0).equals(toSupplementaries("testing")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2123
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2124
        } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2125
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2126
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2127
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2128
        report("Group0");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2129
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2130
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2131
    private static void findIntTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2132
        Pattern p = Pattern.compile("blah");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2133
        Matcher m = p.matcher("zzzzblahzzzzzblah");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2134
        boolean result = m.find(2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2135
        if (!result)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2136
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2137
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2138
        p = Pattern.compile("$");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2139
        m = p.matcher("1234567890");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2140
        result = m.find(10);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2141
        if (!result)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2142
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2143
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2144
            result = m.find(11);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2145
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2146
        } catch (IndexOutOfBoundsException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2147
            // correct result
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2148
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2149
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2150
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2151
        p = Pattern.compile(toSupplementaries("blah"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2152
        m = p.matcher(toSupplementaries("zzzzblahzzzzzblah"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2153
        result = m.find(2);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2154
        if (!result)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2155
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2156
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2157
        report("FindInt");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2158
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2159
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2160
    private static void emptyPatternTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2161
        Pattern p = Pattern.compile("");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2162
        Matcher m = p.matcher("foo");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2163
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2164
        // Should find empty pattern at beginning of input
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2165
        boolean result = m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2166
        if (result != true)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2167
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2168
        if (m.start() != 0)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2169
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2170
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2171
        // Should not match entire input if input is not empty
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2172
        m.reset();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2173
        result = m.matches();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2174
        if (result == true)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2175
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2176
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2177
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2178
            m.start(0);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2179
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2180
        } catch (IllegalStateException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2181
            // Correct result
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2182
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2183
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2184
        // Should match entire input if input is empty
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2185
        m.reset("");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2186
        result = m.matches();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2187
        if (result != true)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2188
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2189
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2190
        result = Pattern.matches("", "");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2191
        if (result != true)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2192
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2193
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2194
        result = Pattern.matches("", "foo");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2195
        if (result == true)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2196
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2197
        report("EmptyPattern");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2198
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2199
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2200
    private static void charClassTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2201
        Pattern pattern = Pattern.compile("blah[ab]]blech");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2202
        check(pattern, "blahb]blech", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2203
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2204
        pattern = Pattern.compile("[abc[def]]");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2205
        check(pattern, "b", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2206
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2207
        // Supplementary character tests
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2208
        pattern = Pattern.compile(toSupplementaries("blah[ab]]blech"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2209
        check(pattern, toSupplementaries("blahb]blech"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2210
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2211
        pattern = Pattern.compile(toSupplementaries("[abc[def]]"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2212
        check(pattern, toSupplementaries("b"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2213
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2214
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2215
            // u00ff when UNICODE_CASE
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2216
            pattern = Pattern.compile("[ab\u00ffcd]",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2217
                                      Pattern.CASE_INSENSITIVE|
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2218
                                      Pattern.UNICODE_CASE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2219
            check(pattern, "ab\u00ffcd", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2220
            check(pattern, "Ab\u0178Cd", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2221
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2222
            // u00b5 when UNICODE_CASE
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2223
            pattern = Pattern.compile("[ab\u00b5cd]",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2224
                                      Pattern.CASE_INSENSITIVE|
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2225
                                      Pattern.UNICODE_CASE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2226
            check(pattern, "ab\u00b5cd", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2227
            check(pattern, "Ab\u039cCd", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2228
        } catch (Exception e) { failCount++; }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2229
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2230
        /* Special cases
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2231
           (1)LatinSmallLetterLongS u+017f
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2232
           (2)LatinSmallLetterDotlessI u+0131
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2233
           (3)LatineCapitalLetterIWithDotAbove u+0130
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2234
           (4)KelvinSign u+212a
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2235
           (5)AngstromSign u+212b
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2236
        */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2237
        int flags = Pattern.UNICODE_CASE | Pattern.CASE_INSENSITIVE;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2238
        pattern = Pattern.compile("[sik\u00c5]+", flags);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2239
        if (!pattern.matcher("\u017f\u0130\u0131\u212a\u212b").matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2240
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2241
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2242
        report("CharClass");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2243
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2244
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2245
    private static void caretTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2246
        Pattern pattern = Pattern.compile("\\w*");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2247
        Matcher matcher = pattern.matcher("a#bc#def##g");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2248
        check(matcher, "a");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2249
        check(matcher, "");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2250
        check(matcher, "bc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2251
        check(matcher, "");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2252
        check(matcher, "def");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2253
        check(matcher, "");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2254
        check(matcher, "");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2255
        check(matcher, "g");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2256
        check(matcher, "");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2257
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2258
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2259
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2260
        pattern = Pattern.compile("^\\w*");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2261
        matcher = pattern.matcher("a#bc#def##g");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2262
        check(matcher, "a");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2263
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2264
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2265
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2266
        pattern = Pattern.compile("\\w");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2267
        matcher = pattern.matcher("abc##x");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2268
        check(matcher, "a");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2269
        check(matcher, "b");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2270
        check(matcher, "c");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2271
        check(matcher, "x");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2272
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2273
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2274
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2275
        pattern = Pattern.compile("^\\w");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2276
        matcher = pattern.matcher("abc##x");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2277
        check(matcher, "a");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2278
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2279
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2280
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2281
        pattern = Pattern.compile("\\A\\p{Alpha}{3}");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2282
        matcher = pattern.matcher("abcdef-ghi\njklmno");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2283
        check(matcher, "abc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2284
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2285
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2286
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2287
        pattern = Pattern.compile("^\\p{Alpha}{3}", Pattern.MULTILINE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2288
        matcher = pattern.matcher("abcdef-ghi\njklmno");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2289
        check(matcher, "abc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2290
        check(matcher, "jkl");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2291
        if (matcher.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2292
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2293
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2294
        pattern = Pattern.compile("^", Pattern.MULTILINE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2295
        matcher = pattern.matcher("this is some text");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2296
        String result = matcher.replaceAll("X");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2297
        if (!result.equals("Xthis is some text"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2298
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2299
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2300
        pattern = Pattern.compile("^");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2301
        matcher = pattern.matcher("this is some text");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2302
        result = matcher.replaceAll("X");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2303
        if (!result.equals("Xthis is some text"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2304
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2305
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2306
        pattern = Pattern.compile("^", Pattern.MULTILINE | Pattern.UNIX_LINES);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2307
        matcher = pattern.matcher("this is some text\n");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2308
        result = matcher.replaceAll("X");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2309
        if (!result.equals("Xthis is some text\n"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2310
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2311
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2312
        report("Caret");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2313
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2314
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2315
    private static void groupCaptureTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2316
        // Independent group
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2317
        Pattern pattern = Pattern.compile("x+(?>y+)z+");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2318
        Matcher matcher = pattern.matcher("xxxyyyzzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2319
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2320
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2321
            String blah = matcher.group(1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2322
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2323
        } catch (IndexOutOfBoundsException ioobe) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2324
            // Good result
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2325
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2326
        // Pure group
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2327
        pattern = Pattern.compile("x+(?:y+)z+");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2328
        matcher = pattern.matcher("xxxyyyzzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2329
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2330
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2331
            String blah = matcher.group(1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2332
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2333
        } catch (IndexOutOfBoundsException ioobe) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2334
            // Good result
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2335
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2336
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2337
        // Supplementary character tests
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2338
        // Independent group
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2339
        pattern = Pattern.compile(toSupplementaries("x+(?>y+)z+"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2340
        matcher = pattern.matcher(toSupplementaries("xxxyyyzzz"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2341
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2342
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2343
            String blah = matcher.group(1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2344
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2345
        } catch (IndexOutOfBoundsException ioobe) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2346
            // Good result
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2347
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2348
        // Pure group
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2349
        pattern = Pattern.compile(toSupplementaries("x+(?:y+)z+"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2350
        matcher = pattern.matcher(toSupplementaries("xxxyyyzzz"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2351
        matcher.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2352
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2353
            String blah = matcher.group(1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2354
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2355
        } catch (IndexOutOfBoundsException ioobe) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2356
            // Good result
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2357
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2358
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2359
        report("GroupCapture");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2360
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2361
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2362
    private static void backRefTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2363
        Pattern pattern = Pattern.compile("(a*)bc\\1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2364
        check(pattern, "zzzaabcazzz", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2365
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2366
        pattern = Pattern.compile("(a*)bc\\1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2367
        check(pattern, "zzzaabcaazzz", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2368
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2369
        pattern = Pattern.compile("(abc)(def)\\1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2370
        check(pattern, "abcdefabc", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2371
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2372
        pattern = Pattern.compile("(abc)(def)\\3");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2373
        check(pattern, "abcdefabc", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2374
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2375
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2376
            for (int i = 1; i < 10; i++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2377
                // Make sure backref 1-9 are always accepted
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2378
                pattern = Pattern.compile("abcdef\\" + i);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2379
                // and fail to match if the target group does not exit
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2380
                check(pattern, "abcdef", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2381
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2382
        } catch(PatternSyntaxException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2383
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2384
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2385
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2386
        pattern = Pattern.compile("(a)(b)(c)(d)(e)(f)(g)(h)(i)(j)\\11");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2387
        check(pattern, "abcdefghija", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2388
        check(pattern, "abcdefghija1", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2389
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2390
        pattern = Pattern.compile("(a)(b)(c)(d)(e)(f)(g)(h)(i)(j)(k)\\11");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2391
        check(pattern, "abcdefghijkk", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2392
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2393
        pattern = Pattern.compile("(a)bcdefghij\\11");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2394
        check(pattern, "abcdefghija1", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2395
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2396
        // Supplementary character tests
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2397
        pattern = Pattern.compile(toSupplementaries("(a*)bc\\1"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2398
        check(pattern, toSupplementaries("zzzaabcazzz"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2399
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2400
        pattern = Pattern.compile(toSupplementaries("(a*)bc\\1"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2401
        check(pattern, toSupplementaries("zzzaabcaazzz"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2402
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2403
        pattern = Pattern.compile(toSupplementaries("(abc)(def)\\1"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2404
        check(pattern, toSupplementaries("abcdefabc"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2405
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2406
        pattern = Pattern.compile(toSupplementaries("(abc)(def)\\3"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2407
        check(pattern, toSupplementaries("abcdefabc"), false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2408
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2409
        pattern = Pattern.compile(toSupplementaries("(a)(b)(c)(d)(e)(f)(g)(h)(i)(j)\\11"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2410
        check(pattern, toSupplementaries("abcdefghija"), false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2411
        check(pattern, toSupplementaries("abcdefghija1"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2412
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2413
        pattern = Pattern.compile(toSupplementaries("(a)(b)(c)(d)(e)(f)(g)(h)(i)(j)(k)\\11"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2414
        check(pattern, toSupplementaries("abcdefghijkk"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2415
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2416
        report("BackRef");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2417
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2418
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2419
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2420
     * Unicode Technical Report #18, section 2.6 End of Line
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2421
     * There is no empty line to be matched in the sequence \u000D\u000A
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2422
     * but there is an empty line in the sequence \u000A\u000D.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2423
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2424
    private static void anchorTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2425
        Pattern p = Pattern.compile("^.*$", Pattern.MULTILINE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2426
        Matcher m = p.matcher("blah1\r\nblah2");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2427
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2428
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2429
        if (!m.group().equals("blah2"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2430
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2431
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2432
        m.reset("blah1\n\rblah2");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2433
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2434
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2435
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2436
        if (!m.group().equals("blah2"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2437
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2438
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2439
        // Test behavior of $ with \r\n at end of input
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2440
        p = Pattern.compile(".+$");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2441
        m = p.matcher("blah1\r\n");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2442
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2443
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2444
       if (!m.group().equals("blah1"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2445
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2446
        if (m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2447
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2448
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2449
        // Test behavior of $ with \r\n at end of input in multiline
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2450
        p = Pattern.compile(".+$", Pattern.MULTILINE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2451
        m = p.matcher("blah1\r\n");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2452
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2453
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2454
        if (m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2455
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2456
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2457
        // Test for $ recognition of \u0085 for bug 4527731
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2458
        p = Pattern.compile(".+$", Pattern.MULTILINE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2459
        m = p.matcher("blah1\u0085");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2460
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2461
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2462
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2463
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2464
        p = Pattern.compile("^.*$", Pattern.MULTILINE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2465
        m = p.matcher(toSupplementaries("blah1\r\nblah2"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2466
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2467
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2468
        if (!m.group().equals(toSupplementaries("blah2")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2469
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2470
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2471
        m.reset(toSupplementaries("blah1\n\rblah2"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2472
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2473
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2474
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2475
        if (!m.group().equals(toSupplementaries("blah2")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2476
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2477
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2478
        // Test behavior of $ with \r\n at end of input
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2479
        p = Pattern.compile(".+$");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2480
        m = p.matcher(toSupplementaries("blah1\r\n"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2481
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2482
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2483
        if (!m.group().equals(toSupplementaries("blah1")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2484
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2485
        if (m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2486
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2487
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2488
        // Test behavior of $ with \r\n at end of input in multiline
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2489
        p = Pattern.compile(".+$", Pattern.MULTILINE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2490
        m = p.matcher(toSupplementaries("blah1\r\n"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2491
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2492
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2493
        if (m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2494
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2495
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2496
        // Test for $ recognition of \u0085 for bug 4527731
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2497
        p = Pattern.compile(".+$", Pattern.MULTILINE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2498
        m = p.matcher(toSupplementaries("blah1\u0085"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2499
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2500
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2501
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2502
        report("Anchors");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2503
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2504
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2505
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2506
     * A basic sanity test of Matcher.lookingAt().
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2507
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2508
    private static void lookingAtTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2509
        Pattern p = Pattern.compile("(ab)(c*)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2510
        Matcher m = p.matcher("abccczzzabcczzzabccc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2511
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2512
        if (!m.lookingAt())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2513
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2514
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2515
        if (!m.group().equals(m.group(0)))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2516
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2517
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2518
        m = p.matcher("zzzabccczzzabcczzzabccczzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2519
        if (m.lookingAt())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2520
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2521
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2522
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2523
        p = Pattern.compile(toSupplementaries("(ab)(c*)"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2524
        m = p.matcher(toSupplementaries("abccczzzabcczzzabccc"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2525
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2526
        if (!m.lookingAt())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2527
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2528
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2529
        if (!m.group().equals(m.group(0)))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2530
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2531
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2532
        m = p.matcher(toSupplementaries("zzzabccczzzabcczzzabccczzz"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2533
        if (m.lookingAt())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2534
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2535
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2536
        report("Looking At");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2537
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2538
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2539
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2540
     * A basic sanity test of Matcher.matches().
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2541
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2542
    private static void matchesTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2543
        // matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2544
        Pattern p = Pattern.compile("ulb(c*)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2545
        Matcher m = p.matcher("ulbcccccc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2546
        if (!m.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2547
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2548
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2549
        // find() but not matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2550
        m.reset("zzzulbcccccc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2551
        if (m.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2552
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2553
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2554
        // lookingAt() but not matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2555
        m.reset("ulbccccccdef");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2556
        if (m.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2557
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2558
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2559
        // matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2560
        p = Pattern.compile("a|ad");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2561
        m = p.matcher("ad");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2562
        if (!m.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2563
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2564
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2565
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2566
        // matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2567
        p = Pattern.compile(toSupplementaries("ulb(c*)"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2568
        m = p.matcher(toSupplementaries("ulbcccccc"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2569
        if (!m.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2570
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2571
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2572
        // find() but not matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2573
        m.reset(toSupplementaries("zzzulbcccccc"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2574
        if (m.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2575
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2576
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2577
        // lookingAt() but not matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2578
        m.reset(toSupplementaries("ulbccccccdef"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2579
        if (m.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2580
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2581
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2582
        // matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2583
        p = Pattern.compile(toSupplementaries("a|ad"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2584
        m = p.matcher(toSupplementaries("ad"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2585
        if (!m.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2586
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2587
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2588
        report("Matches");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2589
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2590
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2591
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2592
     * A basic sanity test of Pattern.matches().
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2593
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2594
    private static void patternMatchesTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2595
        // matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2596
        if (!Pattern.matches(toSupplementaries("ulb(c*)"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2597
                             toSupplementaries("ulbcccccc")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2598
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2599
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2600
        // find() but not matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2601
        if (Pattern.matches(toSupplementaries("ulb(c*)"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2602
                            toSupplementaries("zzzulbcccccc")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2603
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2604
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2605
        // lookingAt() but not matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2606
        if (Pattern.matches(toSupplementaries("ulb(c*)"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2607
                            toSupplementaries("ulbccccccdef")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2608
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2609
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2610
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2611
        // matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2612
        if (!Pattern.matches(toSupplementaries("ulb(c*)"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2613
                             toSupplementaries("ulbcccccc")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2614
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2615
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2616
        // find() but not matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2617
        if (Pattern.matches(toSupplementaries("ulb(c*)"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2618
                            toSupplementaries("zzzulbcccccc")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2619
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2620
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2621
        // lookingAt() but not matches()
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2622
        if (Pattern.matches(toSupplementaries("ulb(c*)"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2623
                            toSupplementaries("ulbccccccdef")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2624
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2625
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2626
        report("Pattern Matches");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2627
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2628
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2629
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2630
     * Canonical equivalence testing. Tests the ability of the engine
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2631
     * to match sequences that are not explicitly specified in the
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2632
     * pattern when they are considered equivalent by the Unicode Standard.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2633
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2634
    private static void ceTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2635
        // Decomposed char outside char classes
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2636
        Pattern p = Pattern.compile("testa\u030a", Pattern.CANON_EQ);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2637
        Matcher m = p.matcher("test\u00e5");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2638
        if (!m.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2639
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2640
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2641
        m.reset("testa\u030a");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2642
        if (!m.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2643
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2644
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2645
        // Composed char outside char classes
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2646
        p = Pattern.compile("test\u00e5", Pattern.CANON_EQ);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2647
        m = p.matcher("test\u00e5");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2648
        if (!m.matches())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2649
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2650
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2651
        m.reset("testa\u030a");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2652
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2653
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2654
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2655
        // Decomposed char inside a char class
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2656
        p = Pattern.compile("test[abca\u030a]", Pattern.CANON_EQ);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2657
        m = p.matcher("test\u00e5");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2658
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2659
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2660
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2661
        m.reset("testa\u030a");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2662
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2663
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2664
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2665
        // Composed char inside a char class
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2666
        p = Pattern.compile("test[abc\u00e5def\u00e0]", Pattern.CANON_EQ);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2667
        m = p.matcher("test\u00e5");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2668
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2669
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2670
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2671
        m.reset("testa\u0300");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2672
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2673
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2674
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2675
        m.reset("testa\u030a");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2676
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2677
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2678
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2679
        // Marks that cannot legally change order and be equivalent
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2680
        p = Pattern.compile("testa\u0308\u0300", Pattern.CANON_EQ);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2681
        check(p, "testa\u0308\u0300", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2682
        check(p, "testa\u0300\u0308", false);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2683
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2684
        // Marks that can legally change order and be equivalent
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2685
        p = Pattern.compile("testa\u0308\u0323", Pattern.CANON_EQ);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2686
        check(p, "testa\u0308\u0323", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2687
        check(p, "testa\u0323\u0308", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2688
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2689
        // Test all equivalences of the sequence a\u0308\u0323\u0300
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2690
        p = Pattern.compile("testa\u0308\u0323\u0300", Pattern.CANON_EQ);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2691
        check(p, "testa\u0308\u0323\u0300", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2692
        check(p, "testa\u0323\u0308\u0300", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2693
        check(p, "testa\u0308\u0300\u0323", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2694
        check(p, "test\u00e4\u0323\u0300", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2695
        check(p, "test\u00e4\u0300\u0323", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2696
37882
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2697
        Object[][] data = new Object[][] {
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2698
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2699
        // JDK-4867170
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2700
        { "[\u1f80-\u1f82]", "ab\u1f80cd",             "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2701
        { "[\u1f80-\u1f82]", "ab\u1f81cd",             "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2702
        { "[\u1f80-\u1f82]", "ab\u1f82cd",             "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2703
        { "[\u1f80-\u1f82]", "ab\u03b1\u0314\u0345cd", "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2704
        { "[\u1f80-\u1f82]", "ab\u03b1\u0345\u0314cd", "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2705
        { "[\u1f80-\u1f82]", "ab\u1f01\u0345cd",       "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2706
        { "[\u1f80-\u1f82]", "ab\u1f00\u0345cd",       "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2707
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2708
        { "\\p{IsGreek}",    "ab\u1f80cd",             "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2709
        { "\\p{IsGreek}",    "ab\u1f81cd",             "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2710
        { "\\p{IsGreek}",    "ab\u1f82cd",             "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2711
        { "\\p{IsGreek}",    "ab\u03b1\u0314\u0345cd", "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2712
        { "\\p{IsGreek}",    "ab\u1f01\u0345cd",       "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2713
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2714
        // backtracking, force to match "\u1f80", instead of \u1f82"
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2715
        { "ab\\p{IsGreek}\u0300cd", "ab\u03b1\u0313\u0345\u0300cd", "m", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2716
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2717
        { "[\\p{IsGreek}]",  "\u03b1\u0314\u0345",     "m", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2718
        { "\\p{IsGreek}",    "\u03b1\u0314\u0345",     "m", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2719
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2720
        { "[^\u1f80-\u1f82]","\u1f81",                 "m", false },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2721
        { "[^\u1f80-\u1f82]","\u03b1\u0314\u0345",     "m", false },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2722
        { "[^\u1f01\u0345]", "\u1f81",                 "f", false },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2723
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2724
        { "[^\u1f81]+",      "\u1f80\u1f82",           "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2725
        { "[\u1f80]",        "ab\u1f80cd",             "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2726
        { "\u1f80",          "ab\u1f80cd",             "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2727
        { "\u1f00\u0345\u0300",  "\u1f82", "m", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2728
        { "\u1f80",          "-\u1f00\u0345\u0300-",   "f", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2729
        { "\u1f82",          "\u1f00\u0345\u0300",     "m", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2730
        { "\u1f82",          "\u1f80\u0300",           "m", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2731
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2732
        // JDK-7080302       # compile failed
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2733
        { "a(\u0041\u0301\u0328)", "a\u0041\u0301\u0328", "m", true},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2734
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2735
        // JDK-6728861, same cause as above one
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2736
        { "\u00e9\u00e9n", "e\u0301e\u0301n", "m", true},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2737
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2738
        // JDK-6995635
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2739
        { "(\u00e9)", "e\u0301", "m", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2740
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2741
        // JDK-6736245
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2742
        // intereting special case, nfc(u2add+u0338) -> u2add+u0338) NOT u2adc
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2743
        { "\u2ADC", "\u2ADC", "m", true},          // NFC
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2744
        { "\u2ADC", "\u2ADD\u0338", "m", true},    // NFD
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2745
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2746
        //  4916384.
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2747
        // Decomposed hangul (jamos) works inside clazz
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2748
        { "[\u1100\u1161]", "\u1100\u1161", "m", true},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2749
        { "[\u1100\u1161]", "\uac00", "m", true},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2750
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2751
        { "[\uac00]", "\u1100\u1161", "m", true},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2752
        { "[\uac00]", "\uac00", "m", true},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2753
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2754
        // Decomposed hangul (jamos)
37882
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2755
        { "\u1100\u1161", "\u1100\u1161", "m", true},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2756
        { "\u1100\u1161", "\uac00", "m", true},
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2757
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2758
        // Composed hangul
37882
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2759
        { "\uac00",  "\u1100\u1161", "m", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2760
        { "\uac00",  "\uac00", "m", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2761
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2762
        /* Need a NFDSlice to nfd the source to solve this issue
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2763
           u+1d1c0 -> nfd: <u+1d1ba><u+1d165><u+1d16f>  -> nfc: <u+1d1ba><u+1d165><u+1d16f>
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2764
           u+1d1bc -> nfd: <u+1d1ba><u+1d165>           -> nfc: <u+1d1ba><u+1d165>
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2765
           <u+1d1bc><u+1d16f> -> nfd: <u+1d1ba><u+1d165><u+1d16f> -> nfc: <u+1d1ba><u+1d165><u+1d16f>
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2766
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2767
        // Decomposed supplementary outside char classes
37882
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2768
        // { "test\ud834\uddbc\ud834\udd6f", "test\ud834\uddc0", "m", true },
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2769
        // Composed supplementary outside char classes
37882
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2770
        // { "test\ud834\uddc0", "test\ud834\uddbc\ud834\udd6f", "m", true },
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2771
        */
37882
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2772
        { "test\ud834\uddbc\ud834\udd6f", "test\ud834\uddbc\ud834\udd6f", "m", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2773
        { "test\ud834\uddc0",             "test\ud834\uddbc\ud834\udd6f", "m", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2774
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2775
        { "test\ud834\uddc0",             "test\ud834\uddc0",             "m", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2776
        { "test\ud834\uddbc\ud834\udd6f", "test\ud834\uddc0",             "m", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2777
        };
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2778
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2779
        int failCount = 0;
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2780
        for (Object[] d : data) {
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2781
            String pn = (String)d[0];
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2782
            String tt = (String)d[1];
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2783
            boolean isFind = "f".equals(((String)d[2]));
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2784
            boolean expected = (boolean)d[3];
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2785
            boolean ret = isFind ? Pattern.compile(pn, Pattern.CANON_EQ).matcher(tt).find()
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2786
                                 : Pattern.compile(pn, Pattern.CANON_EQ).matcher(tt).matches();
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2787
            if (ret != expected) {
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2788
                failCount++;
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2789
                continue;
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2790
            }
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  2791
        }
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2792
        report("Canonical Equivalence");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2793
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2794
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2795
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2796
     * A basic sanity test of Matcher.replaceAll().
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2797
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2798
    private static void globalSubstitute() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2799
        // Global substitution with a literal
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2800
        Pattern p = Pattern.compile("(ab)(c*)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2801
        Matcher m = p.matcher("abccczzzabcczzzabccc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2802
        if (!m.replaceAll("test").equals("testzzztestzzztest"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2803
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2804
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2805
        m.reset("zzzabccczzzabcczzzabccczzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2806
        if (!m.replaceAll("test").equals("zzztestzzztestzzztestzzz"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2807
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2808
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2809
        // Global substitution with groups
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2810
        m.reset("zzzabccczzzabcczzzabccczzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2811
        String result = m.replaceAll("$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2812
        if (!result.equals("zzzabzzzabzzzabzzz"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2813
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2814
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2815
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2816
        // Global substitution with a literal
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2817
        p = Pattern.compile(toSupplementaries("(ab)(c*)"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2818
        m = p.matcher(toSupplementaries("abccczzzabcczzzabccc"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2819
        if (!m.replaceAll(toSupplementaries("test")).
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2820
            equals(toSupplementaries("testzzztestzzztest")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2821
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2822
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2823
        m.reset(toSupplementaries("zzzabccczzzabcczzzabccczzz"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2824
        if (!m.replaceAll(toSupplementaries("test")).
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2825
            equals(toSupplementaries("zzztestzzztestzzztestzzz")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2826
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2827
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2828
        // Global substitution with groups
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2829
        m.reset(toSupplementaries("zzzabccczzzabcczzzabccczzz"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2830
        result = m.replaceAll("$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2831
        if (!result.equals(toSupplementaries("zzzabzzzabzzzabzzz")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2832
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2833
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2834
        report("Global Substitution");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2835
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2836
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2837
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2838
     * Tests the usage of Matcher.appendReplacement() with literal
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2839
     * and group substitutions.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2840
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2841
    private static void stringbufferSubstitute() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2842
        // SB substitution with literal
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2843
        String blah = "zzzblahzzz";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2844
        Pattern p = Pattern.compile("blah");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2845
        Matcher m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2846
        StringBuffer result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2847
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2848
            m.appendReplacement(result, "blech");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2849
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2850
        } catch (IllegalStateException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2851
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2852
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2853
        m.appendReplacement(result, "blech");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2854
        if (!result.toString().equals("zzzblech"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2855
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2856
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2857
        m.appendTail(result);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2858
        if (!result.toString().equals("zzzblechzzz"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2859
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2860
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2861
        // SB substitution with groups
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2862
        blah = "zzzabcdzzz";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2863
        p = Pattern.compile("(ab)(cd)*");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2864
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2865
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2866
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2867
            m.appendReplacement(result, "$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2868
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2869
        } catch (IllegalStateException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2870
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2871
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2872
        m.appendReplacement(result, "$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2873
        if (!result.toString().equals("zzzab"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2874
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2875
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2876
        m.appendTail(result);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2877
        if (!result.toString().equals("zzzabzzz"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2878
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2879
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2880
        // SB substitution with 3 groups
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2881
        blah = "zzzabcdcdefzzz";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2882
        p = Pattern.compile("(ab)(cd)*(ef)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2883
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2884
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2885
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2886
            m.appendReplacement(result, "$1w$2w$3");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2887
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2888
        } catch (IllegalStateException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2889
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2890
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2891
        m.appendReplacement(result, "$1w$2w$3");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2892
        if (!result.toString().equals("zzzabwcdwef"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2893
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2894
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2895
        m.appendTail(result);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2896
        if (!result.toString().equals("zzzabwcdwefzzz"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2897
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2898
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2899
        // SB substitution with groups and three matches
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2900
        // skipping middle match
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2901
        blah = "zzzabcdzzzabcddzzzabcdzzz";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2902
        p = Pattern.compile("(ab)(cd*)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2903
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2904
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2905
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2906
            m.appendReplacement(result, "$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2907
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2908
        } catch (IllegalStateException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2909
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2910
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2911
        m.appendReplacement(result, "$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2912
        if (!result.toString().equals("zzzab"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2913
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2914
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2915
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2916
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2917
        m.appendReplacement(result, "$2");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2918
        if (!result.toString().equals("zzzabzzzabcddzzzcd"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2919
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2920
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2921
        m.appendTail(result);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2922
        if (!result.toString().equals("zzzabzzzabcddzzzcdzzz"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2923
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2924
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2925
        // Check to make sure escaped $ is ignored
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2926
        blah = "zzzabcdcdefzzz";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2927
        p = Pattern.compile("(ab)(cd)*(ef)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2928
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2929
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2930
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2931
        m.appendReplacement(result, "$1w\\$2w$3");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2932
        if (!result.toString().equals("zzzabw$2wef"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2933
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2934
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2935
        m.appendTail(result);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2936
        if (!result.toString().equals("zzzabw$2wefzzz"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2937
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2938
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2939
        // Check to make sure a reference to nonexistent group causes error
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2940
        blah = "zzzabcdcdefzzz";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2941
        p = Pattern.compile("(ab)(cd)*(ef)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2942
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2943
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2944
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2945
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2946
            m.appendReplacement(result, "$1w$5w$3");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2947
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2948
        } catch (IndexOutOfBoundsException ioobe) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2949
            // Correct result
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2950
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2951
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2952
        // Check double digit group references
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2953
        blah = "zzz123456789101112zzz";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2954
        p = Pattern.compile("(1)(2)(3)(4)(5)(6)(7)(8)(9)(10)(11)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2955
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2956
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2957
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2958
        m.appendReplacement(result, "$1w$11w$3");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2959
        if (!result.toString().equals("zzz1w11w3"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2960
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2961
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2962
        // Check to make sure it backs off $15 to $1 if only three groups
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2963
        blah = "zzzabcdcdefzzz";
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2964
        p = Pattern.compile("(ab)(cd)*(ef)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2965
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2966
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2967
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2968
        m.appendReplacement(result, "$1w$15w$3");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2969
        if (!result.toString().equals("zzzabwab5wef"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2970
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2971
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2972
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2973
        // Supplementary character test
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2974
        // SB substitution with literal
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2975
        blah = toSupplementaries("zzzblahzzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2976
        p = Pattern.compile(toSupplementaries("blah"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2977
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2978
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2979
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2980
            m.appendReplacement(result, toSupplementaries("blech"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2981
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2982
        } catch (IllegalStateException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2983
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2984
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2985
        m.appendReplacement(result, toSupplementaries("blech"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2986
        if (!result.toString().equals(toSupplementaries("zzzblech")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2987
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2988
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2989
        m.appendTail(result);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2990
        if (!result.toString().equals(toSupplementaries("zzzblechzzz")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2991
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2992
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2993
        // SB substitution with groups
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2994
        blah = toSupplementaries("zzzabcdzzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2995
        p = Pattern.compile(toSupplementaries("(ab)(cd)*"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2996
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2997
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2998
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  2999
            m.appendReplacement(result, "$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3000
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3001
        } catch (IllegalStateException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3002
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3003
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3004
        m.appendReplacement(result, "$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3005
        if (!result.toString().equals(toSupplementaries("zzzab")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3006
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3007
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3008
        m.appendTail(result);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3009
        if (!result.toString().equals(toSupplementaries("zzzabzzz")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3010
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3011
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3012
        // SB substitution with 3 groups
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3013
        blah = toSupplementaries("zzzabcdcdefzzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3014
        p = Pattern.compile(toSupplementaries("(ab)(cd)*(ef)"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3015
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3016
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3017
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3018
            m.appendReplacement(result, toSupplementaries("$1w$2w$3"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3019
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3020
        } catch (IllegalStateException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3021
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3022
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3023
        m.appendReplacement(result, toSupplementaries("$1w$2w$3"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3024
        if (!result.toString().equals(toSupplementaries("zzzabwcdwef")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3025
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3026
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3027
        m.appendTail(result);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3028
        if (!result.toString().equals(toSupplementaries("zzzabwcdwefzzz")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3029
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3030
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3031
        // SB substitution with groups and three matches
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3032
        // skipping middle match
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3033
        blah = toSupplementaries("zzzabcdzzzabcddzzzabcdzzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3034
        p = Pattern.compile(toSupplementaries("(ab)(cd*)"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3035
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3036
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3037
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3038
            m.appendReplacement(result, "$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3039
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3040
        } catch (IllegalStateException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3041
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3042
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3043
        m.appendReplacement(result, "$1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3044
        if (!result.toString().equals(toSupplementaries("zzzab")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3045
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3046
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3047
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3048
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3049
        m.appendReplacement(result, "$2");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3050
        if (!result.toString().equals(toSupplementaries("zzzabzzzabcddzzzcd")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3051
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3052
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3053
        m.appendTail(result);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3054
        if (!result.toString().equals(toSupplementaries("zzzabzzzabcddzzzcdzzz")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3055
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3056
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3057
        // Check to make sure escaped $ is ignored
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3058
        blah = toSupplementaries("zzzabcdcdefzzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3059
        p = Pattern.compile(toSupplementaries("(ab)(cd)*(ef)"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3060
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3061
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3062
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3063
        m.appendReplacement(result, toSupplementaries("$1w\\$2w$3"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3064
        if (!result.toString().equals(toSupplementaries("zzzabw$2wef")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3065
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3066
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3067
        m.appendTail(result);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3068
        if (!result.toString().equals(toSupplementaries("zzzabw$2wefzzz")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3069
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3071
        // Check to make sure a reference to nonexistent group causes error
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3072
        blah = toSupplementaries("zzzabcdcdefzzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3073
        p = Pattern.compile(toSupplementaries("(ab)(cd)*(ef)"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3074
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3075
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3076
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3077
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3078
            m.appendReplacement(result, toSupplementaries("$1w$5w$3"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3079
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3080
        } catch (IndexOutOfBoundsException ioobe) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3081
            // Correct result
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3082
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3083
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3084
        // Check double digit group references
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3085
        blah = toSupplementaries("zzz123456789101112zzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3086
        p = Pattern.compile("(1)(2)(3)(4)(5)(6)(7)(8)(9)(10)(11)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3087
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3088
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3089
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3090
        m.appendReplacement(result, toSupplementaries("$1w$11w$3"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3091
        if (!result.toString().equals(toSupplementaries("zzz1w11w3")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3092
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3093
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3094
        // Check to make sure it backs off $15 to $1 if only three groups
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3095
        blah = toSupplementaries("zzzabcdcdefzzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3096
        p = Pattern.compile(toSupplementaries("(ab)(cd)*(ef)"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3097
        m = p.matcher(blah);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3098
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3099
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3100
        m.appendReplacement(result, toSupplementaries("$1w$15w$3"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3101
        if (!result.toString().equals(toSupplementaries("zzzabwab5wef")))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3102
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3103
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3104
        // Check nothing has been appended into the output buffer if
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3105
        // the replacement string triggers IllegalArgumentException.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3106
        p = Pattern.compile("(abc)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3107
        m = p.matcher("abcd");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3108
        result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3109
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3110
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3111
            m.appendReplacement(result, ("xyz$g"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3112
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3113
        } catch (IllegalArgumentException iae) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3114
            if (result.length() != 0)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3115
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3116
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3117
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3118
        report("SB Substitution");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3119
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3120
23734
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3121
    /**
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3122
     * Tests the usage of Matcher.appendReplacement() with literal
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3123
     * and group substitutions.
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3124
     */
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3125
    private static void stringbuilderSubstitute() throws Exception {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3126
        // SB substitution with literal
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3127
        String blah = "zzzblahzzz";
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3128
        Pattern p = Pattern.compile("blah");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3129
        Matcher m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3130
        StringBuilder result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3131
        try {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3132
            m.appendReplacement(result, "blech");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3133
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3134
        } catch (IllegalStateException e) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3135
        }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3136
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3137
        m.appendReplacement(result, "blech");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3138
        if (!result.toString().equals("zzzblech"))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3139
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3140
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3141
        m.appendTail(result);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3142
        if (!result.toString().equals("zzzblechzzz"))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3143
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3144
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3145
        // SB substitution with groups
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3146
        blah = "zzzabcdzzz";
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3147
        p = Pattern.compile("(ab)(cd)*");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3148
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3149
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3150
        try {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3151
            m.appendReplacement(result, "$1");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3152
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3153
        } catch (IllegalStateException e) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3154
        }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3155
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3156
        m.appendReplacement(result, "$1");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3157
        if (!result.toString().equals("zzzab"))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3158
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3159
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3160
        m.appendTail(result);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3161
        if (!result.toString().equals("zzzabzzz"))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3162
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3163
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3164
        // SB substitution with 3 groups
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3165
        blah = "zzzabcdcdefzzz";
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3166
        p = Pattern.compile("(ab)(cd)*(ef)");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3167
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3168
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3169
        try {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3170
            m.appendReplacement(result, "$1w$2w$3");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3171
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3172
        } catch (IllegalStateException e) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3173
        }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3174
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3175
        m.appendReplacement(result, "$1w$2w$3");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3176
        if (!result.toString().equals("zzzabwcdwef"))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3177
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3178
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3179
        m.appendTail(result);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3180
        if (!result.toString().equals("zzzabwcdwefzzz"))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3181
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3182
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3183
        // SB substitution with groups and three matches
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3184
        // skipping middle match
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3185
        blah = "zzzabcdzzzabcddzzzabcdzzz";
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3186
        p = Pattern.compile("(ab)(cd*)");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3187
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3188
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3189
        try {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3190
            m.appendReplacement(result, "$1");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3191
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3192
        } catch (IllegalStateException e) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3193
        }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3194
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3195
        m.appendReplacement(result, "$1");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3196
        if (!result.toString().equals("zzzab"))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3197
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3198
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3199
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3200
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3201
        m.appendReplacement(result, "$2");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3202
        if (!result.toString().equals("zzzabzzzabcddzzzcd"))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3203
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3204
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3205
        m.appendTail(result);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3206
        if (!result.toString().equals("zzzabzzzabcddzzzcdzzz"))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3207
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3208
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3209
        // Check to make sure escaped $ is ignored
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3210
        blah = "zzzabcdcdefzzz";
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3211
        p = Pattern.compile("(ab)(cd)*(ef)");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3212
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3213
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3214
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3215
        m.appendReplacement(result, "$1w\\$2w$3");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3216
        if (!result.toString().equals("zzzabw$2wef"))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3217
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3218
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3219
        m.appendTail(result);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3220
        if (!result.toString().equals("zzzabw$2wefzzz"))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3221
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3222
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3223
        // Check to make sure a reference to nonexistent group causes error
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3224
        blah = "zzzabcdcdefzzz";
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3225
        p = Pattern.compile("(ab)(cd)*(ef)");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3226
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3227
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3228
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3229
        try {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3230
            m.appendReplacement(result, "$1w$5w$3");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3231
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3232
        } catch (IndexOutOfBoundsException ioobe) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3233
            // Correct result
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3234
        }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3235
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3236
        // Check double digit group references
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3237
        blah = "zzz123456789101112zzz";
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3238
        p = Pattern.compile("(1)(2)(3)(4)(5)(6)(7)(8)(9)(10)(11)");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3239
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3240
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3241
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3242
        m.appendReplacement(result, "$1w$11w$3");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3243
        if (!result.toString().equals("zzz1w11w3"))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3244
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3245
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3246
        // Check to make sure it backs off $15 to $1 if only three groups
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3247
        blah = "zzzabcdcdefzzz";
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3248
        p = Pattern.compile("(ab)(cd)*(ef)");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3249
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3250
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3251
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3252
        m.appendReplacement(result, "$1w$15w$3");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3253
        if (!result.toString().equals("zzzabwab5wef"))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3254
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3255
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3256
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3257
        // Supplementary character test
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3258
        // SB substitution with literal
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3259
        blah = toSupplementaries("zzzblahzzz");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3260
        p = Pattern.compile(toSupplementaries("blah"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3261
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3262
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3263
        try {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3264
            m.appendReplacement(result, toSupplementaries("blech"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3265
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3266
        } catch (IllegalStateException e) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3267
        }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3268
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3269
        m.appendReplacement(result, toSupplementaries("blech"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3270
        if (!result.toString().equals(toSupplementaries("zzzblech")))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3271
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3272
        m.appendTail(result);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3273
        if (!result.toString().equals(toSupplementaries("zzzblechzzz")))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3274
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3275
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3276
        // SB substitution with groups
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3277
        blah = toSupplementaries("zzzabcdzzz");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3278
        p = Pattern.compile(toSupplementaries("(ab)(cd)*"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3279
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3280
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3281
        try {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3282
            m.appendReplacement(result, "$1");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3283
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3284
        } catch (IllegalStateException e) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3285
        }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3286
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3287
        m.appendReplacement(result, "$1");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3288
        if (!result.toString().equals(toSupplementaries("zzzab")))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3289
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3290
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3291
        m.appendTail(result);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3292
        if (!result.toString().equals(toSupplementaries("zzzabzzz")))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3293
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3294
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3295
        // SB substitution with 3 groups
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3296
        blah = toSupplementaries("zzzabcdcdefzzz");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3297
        p = Pattern.compile(toSupplementaries("(ab)(cd)*(ef)"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3298
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3299
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3300
        try {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3301
            m.appendReplacement(result, toSupplementaries("$1w$2w$3"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3302
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3303
        } catch (IllegalStateException e) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3304
        }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3305
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3306
        m.appendReplacement(result, toSupplementaries("$1w$2w$3"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3307
        if (!result.toString().equals(toSupplementaries("zzzabwcdwef")))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3308
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3309
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3310
        m.appendTail(result);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3311
        if (!result.toString().equals(toSupplementaries("zzzabwcdwefzzz")))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3312
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3313
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3314
        // SB substitution with groups and three matches
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3315
        // skipping middle match
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3316
        blah = toSupplementaries("zzzabcdzzzabcddzzzabcdzzz");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3317
        p = Pattern.compile(toSupplementaries("(ab)(cd*)"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3318
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3319
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3320
        try {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3321
            m.appendReplacement(result, "$1");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3322
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3323
        } catch (IllegalStateException e) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3324
        }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3325
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3326
        m.appendReplacement(result, "$1");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3327
        if (!result.toString().equals(toSupplementaries("zzzab")))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3328
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3329
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3330
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3331
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3332
        m.appendReplacement(result, "$2");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3333
        if (!result.toString().equals(toSupplementaries("zzzabzzzabcddzzzcd")))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3334
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3335
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3336
        m.appendTail(result);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3337
        if (!result.toString().equals(toSupplementaries("zzzabzzzabcddzzzcdzzz")))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3338
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3339
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3340
        // Check to make sure escaped $ is ignored
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3341
        blah = toSupplementaries("zzzabcdcdefzzz");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3342
        p = Pattern.compile(toSupplementaries("(ab)(cd)*(ef)"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3343
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3344
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3345
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3346
        m.appendReplacement(result, toSupplementaries("$1w\\$2w$3"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3347
        if (!result.toString().equals(toSupplementaries("zzzabw$2wef")))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3348
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3349
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3350
        m.appendTail(result);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3351
        if (!result.toString().equals(toSupplementaries("zzzabw$2wefzzz")))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3352
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3353
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3354
        // Check to make sure a reference to nonexistent group causes error
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3355
        blah = toSupplementaries("zzzabcdcdefzzz");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3356
        p = Pattern.compile(toSupplementaries("(ab)(cd)*(ef)"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3357
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3358
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3359
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3360
        try {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3361
            m.appendReplacement(result, toSupplementaries("$1w$5w$3"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3362
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3363
        } catch (IndexOutOfBoundsException ioobe) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3364
            // Correct result
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3365
        }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3366
        // Check double digit group references
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3367
        blah = toSupplementaries("zzz123456789101112zzz");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3368
        p = Pattern.compile("(1)(2)(3)(4)(5)(6)(7)(8)(9)(10)(11)");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3369
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3370
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3371
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3372
        m.appendReplacement(result, toSupplementaries("$1w$11w$3"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3373
        if (!result.toString().equals(toSupplementaries("zzz1w11w3")))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3374
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3375
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3376
        // Check to make sure it backs off $15 to $1 if only three groups
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3377
        blah = toSupplementaries("zzzabcdcdefzzz");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3378
        p = Pattern.compile(toSupplementaries("(ab)(cd)*(ef)"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3379
        m = p.matcher(blah);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3380
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3381
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3382
        m.appendReplacement(result, toSupplementaries("$1w$15w$3"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3383
        if (!result.toString().equals(toSupplementaries("zzzabwab5wef")))
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3384
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3385
        // Check nothing has been appended into the output buffer if
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3386
        // the replacement string triggers IllegalArgumentException.
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3387
        p = Pattern.compile("(abc)");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3388
        m = p.matcher("abcd");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3389
        result = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3390
        m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3391
        try {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3392
            m.appendReplacement(result, ("xyz$g"));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3393
            failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3394
        } catch (IllegalArgumentException iae) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3395
            if (result.length() != 0)
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3396
                failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3397
        }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3398
        report("SB Substitution 2");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3399
    }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3400
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3401
    /*
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3402
     * 5 groups of characters are created to make a substitution string.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3403
     * A base string will be created including random lead chars, the
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3404
     * substitution string, and random trailing chars.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3405
     * A pattern containing the 5 groups is searched for and replaced with:
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3406
     * random group + random string + random group.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3407
     * The results are checked for correctness.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3408
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3409
    private static void substitutionBasher() {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3410
        for (int runs = 0; runs<1000; runs++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3411
            // Create a base string to work in
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3412
            int leadingChars = generator.nextInt(10);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3413
            StringBuffer baseBuffer = new StringBuffer(100);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3414
            String leadingString = getRandomAlphaString(leadingChars);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3415
            baseBuffer.append(leadingString);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3416
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3417
            // Create 5 groups of random number of random chars
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3418
            // Create the string to substitute
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3419
            // Create the pattern string to search for
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3420
            StringBuffer bufferToSub = new StringBuffer(25);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3421
            StringBuffer bufferToPat = new StringBuffer(50);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3422
            String[] groups = new String[5];
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3423
            for(int i=0; i<5; i++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3424
                int aGroupSize = generator.nextInt(5)+1;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3425
                groups[i] = getRandomAlphaString(aGroupSize);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3426
                bufferToSub.append(groups[i]);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3427
                bufferToPat.append('(');
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3428
                bufferToPat.append(groups[i]);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3429
                bufferToPat.append(')');
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3430
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3431
            String stringToSub = bufferToSub.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3432
            String pattern = bufferToPat.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3433
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3434
            // Place sub string into working string at random index
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3435
            baseBuffer.append(stringToSub);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3436
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3437
            // Append random chars to end
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3438
            int trailingChars = generator.nextInt(10);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3439
            String trailingString = getRandomAlphaString(trailingChars);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3440
            baseBuffer.append(trailingString);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3441
            String baseString = baseBuffer.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3442
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3443
            // Create test pattern and matcher
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3444
            Pattern p = Pattern.compile(pattern);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3445
            Matcher m = p.matcher(baseString);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3446
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3447
            // Reject candidate if pattern happens to start early
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3448
            m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3449
            if (m.start() < leadingChars)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3450
                continue;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3451
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3452
            // Reject candidate if more than one match
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3453
            if (m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3454
                continue;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3455
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3456
            // Construct a replacement string with :
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3457
            // random group + random string + random group
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3458
            StringBuffer bufferToRep = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3459
            int groupIndex1 = generator.nextInt(5);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3460
            bufferToRep.append("$" + (groupIndex1 + 1));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3461
            String randomMidString = getRandomAlphaString(5);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3462
            bufferToRep.append(randomMidString);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3463
            int groupIndex2 = generator.nextInt(5);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3464
            bufferToRep.append("$" + (groupIndex2 + 1));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3465
            String replacement = bufferToRep.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3466
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3467
            // Do the replacement
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3468
            String result = m.replaceAll(replacement);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3469
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3470
            // Construct expected result
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3471
            StringBuffer bufferToRes = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3472
            bufferToRes.append(leadingString);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3473
            bufferToRes.append(groups[groupIndex1]);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3474
            bufferToRes.append(randomMidString);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3475
            bufferToRes.append(groups[groupIndex2]);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3476
            bufferToRes.append(trailingString);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3477
            String expectedResult = bufferToRes.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3478
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3479
            // Check results
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3480
            if (!result.equals(expectedResult))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3481
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3482
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3483
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3484
        report("Substitution Basher");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3485
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3486
23734
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3487
    /*
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3488
     * 5 groups of characters are created to make a substitution string.
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3489
     * A base string will be created including random lead chars, the
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3490
     * substitution string, and random trailing chars.
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3491
     * A pattern containing the 5 groups is searched for and replaced with:
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3492
     * random group + random string + random group.
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3493
     * The results are checked for correctness.
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3494
     */
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3495
    private static void substitutionBasher2() {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3496
        for (int runs = 0; runs<1000; runs++) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3497
            // Create a base string to work in
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3498
            int leadingChars = generator.nextInt(10);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3499
            StringBuilder baseBuffer = new StringBuilder(100);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3500
            String leadingString = getRandomAlphaString(leadingChars);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3501
            baseBuffer.append(leadingString);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3502
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3503
            // Create 5 groups of random number of random chars
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3504
            // Create the string to substitute
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3505
            // Create the pattern string to search for
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3506
            StringBuilder bufferToSub = new StringBuilder(25);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3507
            StringBuilder bufferToPat = new StringBuilder(50);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3508
            String[] groups = new String[5];
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3509
            for(int i=0; i<5; i++) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3510
                int aGroupSize = generator.nextInt(5)+1;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3511
                groups[i] = getRandomAlphaString(aGroupSize);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3512
                bufferToSub.append(groups[i]);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3513
                bufferToPat.append('(');
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3514
                bufferToPat.append(groups[i]);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3515
                bufferToPat.append(')');
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3516
            }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3517
            String stringToSub = bufferToSub.toString();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3518
            String pattern = bufferToPat.toString();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3519
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3520
            // Place sub string into working string at random index
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3521
            baseBuffer.append(stringToSub);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3522
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3523
            // Append random chars to end
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3524
            int trailingChars = generator.nextInt(10);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3525
            String trailingString = getRandomAlphaString(trailingChars);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3526
            baseBuffer.append(trailingString);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3527
            String baseString = baseBuffer.toString();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3528
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3529
            // Create test pattern and matcher
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3530
            Pattern p = Pattern.compile(pattern);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3531
            Matcher m = p.matcher(baseString);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3532
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3533
            // Reject candidate if pattern happens to start early
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3534
            m.find();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3535
            if (m.start() < leadingChars)
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3536
                continue;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3537
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3538
            // Reject candidate if more than one match
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3539
            if (m.find())
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3540
                continue;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3541
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3542
            // Construct a replacement string with :
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3543
            // random group + random string + random group
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3544
            StringBuilder bufferToRep = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3545
            int groupIndex1 = generator.nextInt(5);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3546
            bufferToRep.append("$" + (groupIndex1 + 1));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3547
            String randomMidString = getRandomAlphaString(5);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3548
            bufferToRep.append(randomMidString);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3549
            int groupIndex2 = generator.nextInt(5);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3550
            bufferToRep.append("$" + (groupIndex2 + 1));
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3551
            String replacement = bufferToRep.toString();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3552
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3553
            // Do the replacement
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3554
            String result = m.replaceAll(replacement);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3555
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3556
            // Construct expected result
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3557
            StringBuilder bufferToRes = new StringBuilder();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3558
            bufferToRes.append(leadingString);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3559
            bufferToRes.append(groups[groupIndex1]);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3560
            bufferToRes.append(randomMidString);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3561
            bufferToRes.append(groups[groupIndex2]);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3562
            bufferToRes.append(trailingString);
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3563
            String expectedResult = bufferToRes.toString();
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3564
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3565
            // Check results
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3566
            if (!result.equals(expectedResult)) {
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3567
                failCount++;
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3568
            }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3569
        }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3570
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3571
        report("Substitution Basher 2");
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3572
    }
439905b27f94 8039124: j.u.regex.Matcher.appendReplace/Tail() should support StringBuilder variant
sherman
parents: 22997
diff changeset
  3573
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3574
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3575
     * Checks the handling of some escape sequences that the Pattern
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3576
     * class should process instead of the java compiler. These are
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3577
     * not in the file because the escapes should be be processed
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3578
     * by the Pattern class when the regex is compiled.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3579
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3580
    private static void escapes() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3581
        Pattern p = Pattern.compile("\\043");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3582
        Matcher m = p.matcher("#");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3583
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3584
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3585
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3586
        p = Pattern.compile("\\x23");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3587
        m = p.matcher("#");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3588
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3589
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3590
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3591
        p = Pattern.compile("\\u0023");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3592
        m = p.matcher("#");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3593
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3594
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3595
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3596
        report("Escape sequences");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3597
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3598
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3599
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3600
     * Checks the handling of blank input situations. These
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3601
     * tests are incompatible with my test file format.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3602
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3603
    private static void blankInput() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3604
        Pattern p = Pattern.compile("abc", Pattern.CASE_INSENSITIVE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3605
        Matcher m = p.matcher("");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3606
        if (m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3607
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3608
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3609
        p = Pattern.compile("a*", Pattern.CASE_INSENSITIVE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3610
        m = p.matcher("");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3611
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3612
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3613
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3614
        p = Pattern.compile("abc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3615
        m = p.matcher("");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3616
        if (m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3617
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3618
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3619
        p = Pattern.compile("a*");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3620
        m = p.matcher("");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3621
        if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3622
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3623
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3624
        report("Blank input");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3625
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3626
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3627
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3628
     * Tests the Boyer-Moore pattern matching of a character sequence
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3629
     * on randomly generated patterns.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3630
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3631
    private static void bm() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3632
        doBnM('a');
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3633
        report("Boyer Moore (ASCII)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3634
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3635
        doBnM(Character.MIN_SUPPLEMENTARY_CODE_POINT - 10);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3636
        report("Boyer Moore (Supplementary)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3637
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3638
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3639
    private static void doBnM(int baseCharacter) throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3640
        int achar=0;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3641
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3642
        for (int i=0; i<100; i++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3643
            // Create a short pattern to search for
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3644
            int patternLength = generator.nextInt(7) + 4;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3645
            StringBuffer patternBuffer = new StringBuffer(patternLength);
31645
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3646
            String pattern;
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3647
            retry: for (;;) {
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3648
                for (int x=0; x<patternLength; x++) {
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3649
                    int ch = baseCharacter + generator.nextInt(26);
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3650
                    if (Character.isSupplementaryCodePoint(ch)) {
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3651
                        patternBuffer.append(Character.toChars(ch));
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3652
                    } else {
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3653
                        patternBuffer.append((char)ch);
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3654
                    }
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3655
                }
31645
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3656
                pattern = patternBuffer.toString();
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3657
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3658
                // Avoid patterns that start and end with the same substring
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3659
                // See JDK-6854417
34436
33c20335507c 8143854: java/util/regex/RegExTest.java.RegExTest failed
sherman
parents: 31645
diff changeset
  3660
                for (int x=1; x < pattern.length(); x++) {
31645
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3661
                    if (pattern.startsWith(pattern.substring(x)))
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3662
                        continue retry;
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3663
                }
26db68d6758c 6854417: TESTBUG: java/util/regex/RegExTest.java fails intermittently
igerasim
parents: 30436
diff changeset
  3664
                break;
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3665
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3666
            Pattern p = Pattern.compile(pattern);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3667
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3668
            // Create a buffer with random ASCII chars that does
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3669
            // not match the sample
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3670
            String toSearch = null;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3671
            StringBuffer s = null;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3672
            Matcher m = p.matcher("");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3673
            do {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3674
                s = new StringBuffer(100);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3675
                for (int x=0; x<100; x++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3676
                    int ch = baseCharacter + generator.nextInt(26);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3677
                    if (Character.isSupplementaryCodePoint(ch)) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3678
                        s.append(Character.toChars(ch));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3679
                    } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3680
                        s.append((char)ch);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3681
                    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3682
                }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3683
                toSearch = s.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3684
                m.reset(toSearch);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3685
            } while (m.find());
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3686
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3687
            // Insert the pattern at a random spot
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3688
            int insertIndex = generator.nextInt(99);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3689
            if (Character.isLowSurrogate(s.charAt(insertIndex)))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3690
                insertIndex++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3691
            s = s.insert(insertIndex, pattern);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3692
            toSearch = s.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3693
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3694
            // Make sure that the pattern is found
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3695
            m.reset(toSearch);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3696
            if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3697
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3698
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3699
            // Make sure that the match text is the pattern
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3700
            if (!m.group().equals(pattern))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3701
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3702
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3703
            // Make sure match occured at insertion point
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3704
            if (m.start() != insertIndex)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3705
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3706
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3707
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3708
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3709
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3710
     * Tests the matching of slices on randomly generated patterns.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3711
     * The Boyer-Moore optimization is not done on these patterns
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3712
     * because it uses unicode case folding.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3713
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3714
    private static void slice() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3715
        doSlice(Character.MAX_VALUE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3716
        report("Slice");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3717
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3718
        doSlice(Character.MAX_CODE_POINT);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3719
        report("Slice (Supplementary)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3720
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3721
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3722
    private static void doSlice(int maxCharacter) throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3723
        Random generator = new Random();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3724
        int achar=0;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3725
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3726
        for (int i=0; i<100; i++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3727
            // Create a short pattern to search for
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3728
            int patternLength = generator.nextInt(7) + 4;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3729
            StringBuffer patternBuffer = new StringBuffer(patternLength);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3730
            for (int x=0; x<patternLength; x++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3731
                int randomChar = 0;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3732
                while (!Character.isLetterOrDigit(randomChar))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3733
                    randomChar = generator.nextInt(maxCharacter);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3734
                if (Character.isSupplementaryCodePoint(randomChar)) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3735
                    patternBuffer.append(Character.toChars(randomChar));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3736
                } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3737
                    patternBuffer.append((char) randomChar);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3738
                }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3739
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3740
            String pattern =  patternBuffer.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3741
            Pattern p = Pattern.compile(pattern, Pattern.UNICODE_CASE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3742
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3743
            // Create a buffer with random chars that does not match the sample
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3744
            String toSearch = null;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3745
            StringBuffer s = null;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3746
            Matcher m = p.matcher("");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3747
            do {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3748
                s = new StringBuffer(100);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3749
                for (int x=0; x<100; x++) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3750
                    int randomChar = 0;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3751
                    while (!Character.isLetterOrDigit(randomChar))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3752
                        randomChar = generator.nextInt(maxCharacter);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3753
                    if (Character.isSupplementaryCodePoint(randomChar)) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3754
                        s.append(Character.toChars(randomChar));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3755
                    } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3756
                        s.append((char) randomChar);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3757
                    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3758
                }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3759
                toSearch = s.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3760
                m.reset(toSearch);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3761
            } while (m.find());
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3762
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3763
            // Insert the pattern at a random spot
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3764
            int insertIndex = generator.nextInt(99);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3765
            if (Character.isLowSurrogate(s.charAt(insertIndex)))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3766
                insertIndex++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3767
            s = s.insert(insertIndex, pattern);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3768
            toSearch = s.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3769
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3770
            // Make sure that the pattern is found
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3771
            m.reset(toSearch);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3772
            if (!m.find())
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3773
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3774
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3775
            // Make sure that the match text is the pattern
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3776
            if (!m.group().equals(pattern))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3777
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3778
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3779
            // Make sure match occured at insertion point
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3780
            if (m.start() != insertIndex)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3781
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3782
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3783
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3784
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3785
    private static void explainFailure(String pattern, String data,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3786
                                       String expected, String actual) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3787
        System.err.println("----------------------------------------");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3788
        System.err.println("Pattern = "+pattern);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3789
        System.err.println("Data = "+data);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3790
        System.err.println("Expected = " + expected);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3791
        System.err.println("Actual   = " + actual);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3792
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3793
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3794
    private static void explainFailure(String pattern, String data,
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3795
                                       Throwable t) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3796
        System.err.println("----------------------------------------");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3797
        System.err.println("Pattern = "+pattern);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3798
        System.err.println("Data = "+data);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3799
        t.printStackTrace(System.err);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3800
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3801
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3802
    // Testing examples from a file
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3803
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3804
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3805
     * Goes through the file "TestCases.txt" and creates many patterns
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3806
     * described in the file, matching the patterns against input lines in
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3807
     * the file, and comparing the results against the correct results
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3808
     * also found in the file. The file format is described in comments
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3809
     * at the head of the file.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3810
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3811
    private static void processFile(String fileName) throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3812
        File testCases = new File(System.getProperty("test.src", "."),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3813
                                  fileName);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3814
        FileInputStream in = new FileInputStream(testCases);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3815
        BufferedReader r = new BufferedReader(new InputStreamReader(in));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3816
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3817
        // Process next test case.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3818
        String aLine;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3819
        while((aLine = r.readLine()) != null) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3820
            // Read a line for pattern
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3821
            String patternString = grabLine(r);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3822
            Pattern p = null;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3823
            try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3824
                p = compileTestPattern(patternString);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3825
            } catch (PatternSyntaxException e) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3826
                String dataString = grabLine(r);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3827
                String expectedResult = grabLine(r);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3828
                if (expectedResult.startsWith("error"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3829
                    continue;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3830
                explainFailure(patternString, dataString, e);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3831
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3832
                continue;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3833
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3834
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3835
            // Read a line for input string
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3836
            String dataString = grabLine(r);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3837
            Matcher m = p.matcher(dataString);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3838
            StringBuffer result = new StringBuffer();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3839
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3840
            // Check for IllegalStateExceptions before a match
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3841
            failCount += preMatchInvariants(m);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3842
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3843
            boolean found = m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3844
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3845
            if (found)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3846
                failCount += postTrueMatchInvariants(m);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3847
            else
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3848
                failCount += postFalseMatchInvariants(m);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3849
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3850
            if (found) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3851
                result.append("true ");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3852
                result.append(m.group(0) + " ");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3853
            } else {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3854
                result.append("false ");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3855
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3856
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3857
            result.append(m.groupCount());
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3858
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3859
            if (found) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3860
                for (int i=1; i<m.groupCount()+1; i++)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3861
                    if (m.group(i) != null)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3862
                        result.append(" " +m.group(i));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3863
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3864
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3865
            // Read a line for the expected result
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3866
            String expectedResult = grabLine(r);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3867
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3868
            if (!result.toString().equals(expectedResult)) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3869
                explainFailure(patternString, dataString, expectedResult, result.toString());
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3870
                failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3871
            }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3872
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3873
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3874
        report(fileName);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3875
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3876
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3877
    private static int preMatchInvariants(Matcher m) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3878
        int failCount = 0;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3879
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3880
            m.start();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3881
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3882
        } catch (IllegalStateException ise) {}
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3883
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3884
            m.end();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3885
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3886
        } catch (IllegalStateException ise) {}
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3887
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3888
            m.group();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3889
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3890
        } catch (IllegalStateException ise) {}
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3891
        return failCount;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3892
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3893
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3894
    private static int postFalseMatchInvariants(Matcher m) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3895
        int failCount = 0;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3896
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3897
            m.group();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3898
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3899
        } catch (IllegalStateException ise) {}
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3900
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3901
            m.start();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3902
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3903
        } catch (IllegalStateException ise) {}
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3904
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3905
            m.end();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3906
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3907
        } catch (IllegalStateException ise) {}
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3908
        return failCount;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3909
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3910
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3911
    private static int postTrueMatchInvariants(Matcher m) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3912
        int failCount = 0;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3913
        //assert(m.start() = m.start(0);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3914
        if (m.start() != m.start(0))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3915
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3916
        //assert(m.end() = m.end(0);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3917
        if (m.start() != m.start(0))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3918
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3919
        //assert(m.group() = m.group(0);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3920
        if (!m.group().equals(m.group(0)))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3921
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3922
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3923
            m.group(50);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3924
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3925
        } catch (IndexOutOfBoundsException ise) {}
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3926
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3927
        return failCount;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3928
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3929
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3930
    private static Pattern compileTestPattern(String patternString) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3931
        if (!patternString.startsWith("'")) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3932
            return Pattern.compile(patternString);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3933
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3934
        int break1 = patternString.lastIndexOf("'");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3935
        String flagString = patternString.substring(
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3936
                                          break1+1, patternString.length());
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3937
        patternString = patternString.substring(1, break1);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3938
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3939
        if (flagString.equals("i"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3940
            return Pattern.compile(patternString, Pattern.CASE_INSENSITIVE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3941
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3942
        if (flagString.equals("m"))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3943
            return Pattern.compile(patternString, Pattern.MULTILINE);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3944
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3945
        return Pattern.compile(patternString);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3946
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3947
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3948
    /**
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3949
     * Reads a line from the input file. Keeps reading lines until a non
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3950
     * empty non comment line is read. If the line contains a \n then
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3951
     * these two characters are replaced by a newline char. If a \\uxxxx
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3952
     * sequence is read then the sequence is replaced by the unicode char.
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3953
     */
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3954
    private static String grabLine(BufferedReader r) throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3955
        int index = 0;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3956
        String line = r.readLine();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3957
        while (line.startsWith("//") || line.length() < 1)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3958
            line = r.readLine();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3959
        while ((index = line.indexOf("\\n")) != -1) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3960
            StringBuffer temp = new StringBuffer(line);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3961
            temp.replace(index, index+2, "\n");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3962
            line = temp.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3963
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3964
        while ((index = line.indexOf("\\u")) != -1) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3965
            StringBuffer temp = new StringBuffer(line);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3966
            String value = temp.substring(index+2, index+6);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3967
            char aChar = (char)Integer.parseInt(value, 16);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3968
            String unicodeChar = "" + aChar;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3969
            temp.replace(index, index+6, unicodeChar);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3970
            line = temp.toString();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3971
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3972
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3973
        return line;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3974
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3975
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3976
    private static void check(Pattern p, String s, String g, String expected) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3977
        Matcher m = p.matcher(s);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3978
        m.find();
17434
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  3979
        if (!m.group(g).equals(expected) ||
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  3980
            s.charAt(m.start(g)) != expected.charAt(0) ||
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  3981
            s.charAt(m.end(g) - 1) != expected.charAt(expected.length() - 1))
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3982
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3983
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3984
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3985
    private static void checkReplaceFirst(String p, String s, String r, String expected)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3986
    {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3987
        if (!expected.equals(Pattern.compile(p)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3988
                                    .matcher(s)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3989
                                    .replaceFirst(r)))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3990
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3991
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3992
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3993
    private static void checkReplaceAll(String p, String s, String r, String expected)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3994
    {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3995
        if (!expected.equals(Pattern.compile(p)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3996
                                    .matcher(s)
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3997
                                    .replaceAll(r)))
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3998
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  3999
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4000
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4001
    private static void checkExpectedFail(String p) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4002
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4003
            Pattern.compile(p);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4004
        } catch (PatternSyntaxException pse) {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4005
            //pse.printStackTrace();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4006
            return;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4007
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4008
        failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4009
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4010
17434
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4011
    private static void checkExpectedIAE(Matcher m, String g) {
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4012
        m.find();
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4013
        try {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4014
            m.group(g);
17434
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4015
        } catch (IllegalArgumentException x) {
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4016
            //iae.printStackTrace();
17434
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4017
            try {
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4018
                m.start(g);
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4019
            } catch (IllegalArgumentException xx) {
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4020
                try {
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4021
                    m.start(g);
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4022
                } catch (IllegalArgumentException xxx) {
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4023
                    return;
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4024
                }
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4025
            }
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4026
        }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4027
        failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4028
    }
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4029
17434
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4030
    private static void checkExpectedNPE(Matcher m) {
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4031
        m.find();
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4032
        try {
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4033
            m.group(null);
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4034
        } catch (NullPointerException x) {
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4035
            try {
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4036
                m.start(null);
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4037
            } catch (NullPointerException xx) {
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4038
                try {
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4039
                    m.end(null);
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4040
                } catch (NullPointerException xxx) {
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4041
                    return;
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4042
                }
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4043
            }
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4044
        }
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4045
        failCount++;
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4046
    }
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4047
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4048
    private static void namedGroupCaptureTest() throws Exception {
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4049
        check(Pattern.compile("x+(?<gname>y+)z+"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4050
              "xxxyyyzzz",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4051
              "gname",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4052
              "yyy");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4053
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4054
        check(Pattern.compile("x+(?<gname8>y+)z+"),
2290
3a3bde061968 6817475: named-capturing group name started with digit causes PSE exception
sherman
parents: 2070
diff changeset
  4055
              "xxxyyyzzz",
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4056
              "gname8",
2290
3a3bde061968 6817475: named-capturing group name started with digit causes PSE exception
sherman
parents: 2070
diff changeset
  4057
              "yyy");
3a3bde061968 6817475: named-capturing group name started with digit causes PSE exception
sherman
parents: 2070
diff changeset
  4058
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4059
        //backref
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4060
        Pattern pattern = Pattern.compile("(a*)bc\\1");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4061
        check(pattern, "zzzaabcazzz", true);  // found "abca"
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4062
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4063
        check(Pattern.compile("(?<gname>a*)bc\\k<gname>"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4064
              "zzzaabcaazzz", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4065
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4066
        check(Pattern.compile("(?<gname>abc)(def)\\k<gname>"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4067
              "abcdefabc", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4068
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4069
        check(Pattern.compile("(a)(b)(c)(d)(e)(f)(g)(h)(i)(j)(?<gname>k)\\k<gname>"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4070
              "abcdefghijkk", true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4071
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4072
        // Supplementary character tests
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4073
        check(Pattern.compile("(?<gname>" + toSupplementaries("a*)bc") + "\\k<gname>"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4074
              toSupplementaries("zzzaabcazzz"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4075
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4076
        check(Pattern.compile("(?<gname>" + toSupplementaries("a*)bc") + "\\k<gname>"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4077
              toSupplementaries("zzzaabcaazzz"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4078
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4079
        check(Pattern.compile("(?<gname>" + toSupplementaries("abc)(def)") + "\\k<gname>"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4080
              toSupplementaries("abcdefabc"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4081
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4082
        check(Pattern.compile(toSupplementaries("(a)(b)(c)(d)(e)(f)(g)(h)(i)(j)") +
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4083
                              "(?<gname>" +
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4084
                              toSupplementaries("k)") + "\\k<gname>"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4085
              toSupplementaries("abcdefghijkk"), true);
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4086
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4087
        check(Pattern.compile("x+(?<gname>y+)z+\\k<gname>"),
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4088
              "xxxyyyzzzyyy",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4089
              "gname",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4090
              "yyy");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4091
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4092
        //replaceFirst/All
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4093
        checkReplaceFirst("(?<gn>ab)(c*)",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4094
                          "abccczzzabcczzzabccc",
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4095
                          "${gn}",
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4096
                          "abzzzabcczzzabccc");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4097
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4098
        checkReplaceAll("(?<gn>ab)(c*)",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4099
                        "abccczzzabcczzzabccc",
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4100
                        "${gn}",
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4101
                        "abzzzabzzzab");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4102
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4103
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4104
        checkReplaceFirst("(?<gn>ab)(c*)",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4105
                          "zzzabccczzzabcczzzabccczzz",
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4106
                          "${gn}",
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4107
                          "zzzabzzzabcczzzabccczzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4108
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4109
        checkReplaceAll("(?<gn>ab)(c*)",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4110
                        "zzzabccczzzabcczzzabccczzz",
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4111
                        "${gn}",
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4112
                        "zzzabzzzabzzzabzzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4113
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4114
        checkReplaceFirst("(?<gn1>ab)(?<gn2>c*)",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4115
                          "zzzabccczzzabcczzzabccczzz",
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4116
                          "${gn2}",
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4117
                          "zzzccczzzabcczzzabccczzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4118
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4119
        checkReplaceAll("(?<gn1>ab)(?<gn2>c*)",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4120
                        "zzzabccczzzabcczzzabccczzz",
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4121
                        "${gn2}",
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4122
                        "zzzccczzzcczzzccczzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4123
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4124
        //toSupplementaries("(ab)(c*)"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4125
        checkReplaceFirst("(?<gn1>" + toSupplementaries("ab") +
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4126
                           ")(?<gn2>" + toSupplementaries("c") + "*)",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4127
                          toSupplementaries("abccczzzabcczzzabccc"),
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4128
                          "${gn1}",
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4129
                          toSupplementaries("abzzzabcczzzabccc"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4130
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4131
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4132
        checkReplaceAll("(?<gn1>" + toSupplementaries("ab") +
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4133
                        ")(?<gn2>" + toSupplementaries("c") + "*)",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4134
                        toSupplementaries("abccczzzabcczzzabccc"),
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4135
                        "${gn1}",
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4136
                        toSupplementaries("abzzzabzzzab"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4137
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4138
        checkReplaceFirst("(?<gn1>" + toSupplementaries("ab") +
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4139
                           ")(?<gn2>" + toSupplementaries("c") + "*)",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4140
                          toSupplementaries("abccczzzabcczzzabccc"),
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4141
                          "${gn2}",
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4142
                          toSupplementaries("ccczzzabcczzzabccc"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4143
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4144
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4145
        checkReplaceAll("(?<gn1>" + toSupplementaries("ab") +
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4146
                        ")(?<gn2>" + toSupplementaries("c") + "*)",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4147
                        toSupplementaries("abccczzzabcczzzabccc"),
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4148
                        "${gn2}",
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4149
                        toSupplementaries("ccczzzcczzzccc"));
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4150
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4151
        checkReplaceFirst("(?<dog>Dog)AndCat",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4152
                          "zzzDogAndCatzzzDogAndCatzzz",
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4153
                          "${dog}",
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4154
                          "zzzDogzzzDogAndCatzzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4155
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4156
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4157
        checkReplaceAll("(?<dog>Dog)AndCat",
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4158
                          "zzzDogAndCatzzzDogAndCatzzz",
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4159
                          "${dog}",
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4160
                          "zzzDogzzzDogzzz");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4161
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4162
        // backref in Matcher & String
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4163
        if (!"abcdefghij".replaceFirst("cd(?<gn>ef)gh", "${gn}").equals("abefij") ||
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4164
            !"abbbcbdbefgh".replaceAll("(?<gn>[a-e])b", "${gn}").equals("abcdefgh"))
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4165
            failCount++;
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4166
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4167
        // negative
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4168
        checkExpectedFail("(?<groupnamehasnoascii.in>abc)(def)");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4169
        checkExpectedFail("(?<groupnamehasnoascii_in>abc)(def)");
4161
679d00486dc6 6878475: Better syntax for the named capture group in regex
sherman
parents: 2290
diff changeset
  4170
        checkExpectedFail("(?<6groupnamestartswithdigit>abc)(def)");
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4171
        checkExpectedFail("(?<gname>abc)(def)\\k<gnameX>");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4172
        checkExpectedFail("(?<gname>abc)(?<gname>def)\\k<gnameX>");
17434
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4173
        checkExpectedIAE(Pattern.compile("(?<gname>abc)(def)").matcher("abcdef"),
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4174
                         "gnameX");
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4175
        checkExpectedNPE(Pattern.compile("(?<gname>abc)(def)").matcher("abcdef"));
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4176
        report("NamedGroupCapture");
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4177
    }
4820
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4178
37882
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4179
    // This is for bug 6919132
4820
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4180
    private static void nonBmpClassComplementTest() throws Exception {
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4181
        Pattern p = Pattern.compile("\\P{Lu}");
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4182
        Matcher m = p.matcher(new String(new int[] {0x1d400}, 0, 1));
37882
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4183
4820
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4184
        if (m.find() && m.start() == 1)
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4185
            failCount++;
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4186
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4187
        // from a unicode category
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4188
        p = Pattern.compile("\\P{Lu}");
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4189
        m = p.matcher(new String(new int[] {0x1d400}, 0, 1));
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4190
        if (m.find())
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4191
            failCount++;
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4192
        if (!m.hitEnd())
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4193
            failCount++;
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4194
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4195
        // block
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4196
        p = Pattern.compile("\\P{InMathematicalAlphanumericSymbols}");
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4197
        m = p.matcher(new String(new int[] {0x1d400}, 0, 1));
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4198
        if (m.find() && m.start() == 1)
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4199
            failCount++;
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4200
37882
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4201
        p = Pattern.compile("\\P{sc=GRANTHA}");
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4202
        m = p.matcher(new String(new int[] {0x11350}, 0, 1));
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4203
        if (m.find() && m.start() == 1)
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4204
            failCount++;
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4205
4820
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4206
        report("NonBmpClassComplement");
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4207
    }
e32f5d2ba062 6919132: Regex \P{Lu} selects half of a surrogate pari
sherman
parents: 4161
diff changeset
  4208
5610
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4209
    private static void unicodePropertiesTest() throws Exception {
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4210
        // different forms
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4211
        if (!Pattern.compile("\\p{IsLu}").matcher("A").matches() ||
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4212
            !Pattern.compile("\\p{Lu}").matcher("A").matches() ||
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4213
            !Pattern.compile("\\p{gc=Lu}").matcher("A").matches() ||
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4214
            !Pattern.compile("\\p{general_category=Lu}").matcher("A").matches() ||
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4215
            !Pattern.compile("\\p{IsLatin}").matcher("B").matches() ||
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4216
            !Pattern.compile("\\p{sc=Latin}").matcher("B").matches() ||
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4217
            !Pattern.compile("\\p{script=Latin}").matcher("B").matches() ||
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4218
            !Pattern.compile("\\p{InBasicLatin}").matcher("c").matches() ||
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4219
            !Pattern.compile("\\p{blk=BasicLatin}").matcher("c").matches() ||
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4220
            !Pattern.compile("\\p{block=BasicLatin}").matcher("c").matches())
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4221
            failCount++;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4222
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4223
        Matcher common  = Pattern.compile("\\p{script=Common}").matcher("");
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4224
        Matcher unknown = Pattern.compile("\\p{IsUnknown}").matcher("");
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4225
        Matcher lastSM  = common;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4226
        Character.UnicodeScript lastScript = Character.UnicodeScript.of(0);
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4227
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4228
        Matcher latin  = Pattern.compile("\\p{block=basic_latin}").matcher("");
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4229
        Matcher greek  = Pattern.compile("\\p{InGreek}").matcher("");
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4230
        Matcher lastBM = latin;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4231
        Character.UnicodeBlock lastBlock = Character.UnicodeBlock.of(0);
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4232
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4233
        for (int cp = 1; cp < Character.MAX_CODE_POINT; cp++) {
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4234
            if (cp >= 0x30000 && (cp & 0x70) == 0){
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4235
                continue;  // only pick couple code points, they are the same
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4236
            }
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4237
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4238
            // Unicode Script
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4239
            Character.UnicodeScript script = Character.UnicodeScript.of(cp);
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4240
            Matcher m;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4241
            String str = new String(Character.toChars(cp));
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4242
            if (script == lastScript) {
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4243
                 m = lastSM;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4244
                 m.reset(str);
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4245
            } else {
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4246
                 m  = Pattern.compile("\\p{Is" + script.name() + "}").matcher(str);
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4247
            }
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4248
            if (!m.matches()) {
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4249
                failCount++;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4250
            }
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4251
            Matcher other = (script == Character.UnicodeScript.COMMON)? unknown : common;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4252
            other.reset(str);
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4253
            if (other.matches()) {
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4254
                failCount++;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4255
            }
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4256
            lastSM = m;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4257
            lastScript = script;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4258
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4259
            // Unicode Block
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4260
            Character.UnicodeBlock block = Character.UnicodeBlock.of(cp);
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4261
            if (block == null) {
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4262
                //System.out.printf("Not a Block: cp=%x%n", cp);
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4263
                continue;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4264
            }
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4265
            if (block == lastBlock) {
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4266
                 m = lastBM;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4267
                 m.reset(str);
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4268
            } else {
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4269
                 m  = Pattern.compile("\\p{block=" + block.toString() + "}").matcher(str);
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4270
            }
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4271
            if (!m.matches()) {
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4272
                failCount++;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4273
            }
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4274
            other = (block == Character.UnicodeBlock.BASIC_LATIN)? greek : latin;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4275
            other.reset(str);
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4276
            if (other.matches()) {
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4277
                failCount++;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4278
            }
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4279
            lastBM = m;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4280
            lastBlock = block;
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4281
        }
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4282
        report("unicodeProperties");
fd2427610c7f 6945564: Unicode script support in Character class
sherman
parents: 5295
diff changeset
  4283
    }
8173
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4284
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4285
    private static void unicodeHexNotationTest() throws Exception {
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4286
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4287
        // negative
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4288
        checkExpectedFail("\\x{-23}");
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4289
        checkExpectedFail("\\x{110000}");
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4290
        checkExpectedFail("\\x{}");
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4291
        checkExpectedFail("\\x{AB[ef]");
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4292
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4293
        // codepoint
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4294
        check("^\\x{1033c}$",              "\uD800\uDF3C", true);
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4295
        check("^\\xF0\\x90\\x8C\\xBC$",    "\uD800\uDF3C", false);
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4296
        check("^\\x{D800}\\x{DF3c}+$",     "\uD800\uDF3C", false);
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4297
        check("^\\xF0\\x90\\x8C\\xBC$",    "\uD800\uDF3C", false);
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4298
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4299
        // in class
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4300
        check("^[\\x{D800}\\x{DF3c}]+$",   "\uD800\uDF3C", false);
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4301
        check("^[\\xF0\\x90\\x8C\\xBC]+$", "\uD800\uDF3C", false);
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4302
        check("^[\\x{D800}\\x{DF3C}]+$",   "\uD800\uDF3C", false);
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4303
        check("^[\\x{DF3C}\\x{D800}]+$",   "\uD800\uDF3C", false);
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4304
        check("^[\\x{D800}\\x{DF3C}]+$",   "\uDF3C\uD800", true);
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4305
        check("^[\\x{DF3C}\\x{D800}]+$",   "\uDF3C\uD800", true);
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4306
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4307
        for (int cp = 0; cp <= 0x10FFFF; cp++) {
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4308
             String s = "A" + new String(Character.toChars(cp)) + "B";
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4309
             String hexUTF16 = (cp <= 0xFFFF)? String.format("\\u%04x", cp)
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4310
                                             : String.format("\\u%04x\\u%04x",
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4311
                                               (int) Character.toChars(cp)[0],
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4312
                                               (int) Character.toChars(cp)[1]);
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4313
             String hexCodePoint = "\\x{" + Integer.toHexString(cp) + "}";
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4314
             if (!Pattern.matches("A" + hexUTF16 + "B", s))
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4315
                 failCount++;
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4316
             if (!Pattern.matches("A[" + hexUTF16 + "]B", s))
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4317
                 failCount++;
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4318
             if (!Pattern.matches("A" + hexCodePoint + "B", s))
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4319
                 failCount++;
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4320
             if (!Pattern.matches("A[" + hexCodePoint + "]B", s))
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4321
                 failCount++;
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4322
         }
a3a39b98e05a 7014645: Support perl style Unicode hex notation \x{...}
sherman
parents: 7668
diff changeset
  4323
         report("unicodeHexNotation");
9536
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4324
    }
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4325
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4326
    private static void unicodeClassesTest() throws Exception {
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4327
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4328
        Matcher lower  = Pattern.compile("\\p{Lower}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4329
        Matcher upper  = Pattern.compile("\\p{Upper}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4330
        Matcher ASCII  = Pattern.compile("\\p{ASCII}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4331
        Matcher alpha  = Pattern.compile("\\p{Alpha}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4332
        Matcher digit  = Pattern.compile("\\p{Digit}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4333
        Matcher alnum  = Pattern.compile("\\p{Alnum}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4334
        Matcher punct  = Pattern.compile("\\p{Punct}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4335
        Matcher graph  = Pattern.compile("\\p{Graph}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4336
        Matcher print  = Pattern.compile("\\p{Print}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4337
        Matcher blank  = Pattern.compile("\\p{Blank}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4338
        Matcher cntrl  = Pattern.compile("\\p{Cntrl}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4339
        Matcher xdigit = Pattern.compile("\\p{XDigit}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4340
        Matcher space  = Pattern.compile("\\p{Space}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4341
        Matcher bound  = Pattern.compile("\\b").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4342
        Matcher word   = Pattern.compile("\\w++").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4343
        // UNICODE_CHARACTER_CLASS
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4344
        Matcher lowerU  = Pattern.compile("\\p{Lower}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4345
        Matcher upperU  = Pattern.compile("\\p{Upper}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4346
        Matcher ASCIIU  = Pattern.compile("\\p{ASCII}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4347
        Matcher alphaU  = Pattern.compile("\\p{Alpha}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4348
        Matcher digitU  = Pattern.compile("\\p{Digit}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4349
        Matcher alnumU  = Pattern.compile("\\p{Alnum}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4350
        Matcher punctU  = Pattern.compile("\\p{Punct}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4351
        Matcher graphU  = Pattern.compile("\\p{Graph}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4352
        Matcher printU  = Pattern.compile("\\p{Print}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4353
        Matcher blankU  = Pattern.compile("\\p{Blank}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4354
        Matcher cntrlU  = Pattern.compile("\\p{Cntrl}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4355
        Matcher xdigitU = Pattern.compile("\\p{XDigit}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4356
        Matcher spaceU  = Pattern.compile("\\p{Space}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4357
        Matcher boundU  = Pattern.compile("\\b", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4358
        Matcher wordU   = Pattern.compile("\\w", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4359
        // embedded flag (?U)
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4360
        Matcher lowerEU  = Pattern.compile("(?U)\\p{Lower}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4361
        Matcher graphEU  = Pattern.compile("(?U)\\p{Graph}", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4362
        Matcher wordEU   = Pattern.compile("(?U)\\w", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4363
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4364
        Matcher bwb    = Pattern.compile("\\b\\w\\b").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4365
        Matcher bwbU   = Pattern.compile("\\b\\w++\\b", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4366
        Matcher bwbEU  = Pattern.compile("(?U)\\b\\w++\\b", Pattern.UNICODE_CHARACTER_CLASS).matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4367
        // properties
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4368
        Matcher lowerP  = Pattern.compile("\\p{IsLowerCase}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4369
        Matcher upperP  = Pattern.compile("\\p{IsUpperCase}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4370
        Matcher titleP  = Pattern.compile("\\p{IsTitleCase}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4371
        Matcher letterP = Pattern.compile("\\p{IsLetter}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4372
        Matcher alphaP  = Pattern.compile("\\p{IsAlphabetic}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4373
        Matcher ideogP  = Pattern.compile("\\p{IsIdeographic}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4374
        Matcher cntrlP  = Pattern.compile("\\p{IsControl}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4375
        Matcher spaceP  = Pattern.compile("\\p{IsWhiteSpace}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4376
        Matcher definedP = Pattern.compile("\\p{IsAssigned}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4377
        Matcher nonCCPP = Pattern.compile("\\p{IsNoncharacterCodePoint}").matcher("");
17434
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4378
        Matcher joinCrtl = Pattern.compile("\\p{IsJoinControl}").matcher("");
9536
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4379
        // javaMethod
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4380
        Matcher lowerJ  = Pattern.compile("\\p{javaLowerCase}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4381
        Matcher upperJ  = Pattern.compile("\\p{javaUpperCase}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4382
        Matcher alphaJ  = Pattern.compile("\\p{javaAlphabetic}").matcher("");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4383
        Matcher ideogJ  = Pattern.compile("\\p{javaIdeographic}").matcher("");
38450
516990ff3a4c 8143282: \p{Cn} unassigned code points should be included in \p{C}
sherman
parents: 37882
diff changeset
  4384
        // GC/C
516990ff3a4c 8143282: \p{Cn} unassigned code points should be included in \p{C}
sherman
parents: 37882
diff changeset
  4385
        Matcher gcC  = Pattern.compile("\\p{C}").matcher("");
9536
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4386
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4387
        for (int cp = 1; cp < 0x30000; cp++) {
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4388
            String str = new String(Character.toChars(cp));
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4389
            int type = Character.getType(cp);
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4390
            if (// lower
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4391
                POSIX_ASCII.isLower(cp)   != lower.reset(str).matches()  ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4392
                Character.isLowerCase(cp) != lowerU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4393
                Character.isLowerCase(cp) != lowerP.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4394
                Character.isLowerCase(cp) != lowerEU.reset(str).matches()||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4395
                Character.isLowerCase(cp) != lowerJ.reset(str).matches()||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4396
                // upper
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4397
                POSIX_ASCII.isUpper(cp)   != upper.reset(str).matches()  ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4398
                POSIX_Unicode.isUpper(cp) != upperU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4399
                Character.isUpperCase(cp) != upperP.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4400
                Character.isUpperCase(cp) != upperJ.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4401
                // alpha
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4402
                POSIX_ASCII.isAlpha(cp)   != alpha.reset(str).matches()  ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4403
                POSIX_Unicode.isAlpha(cp) != alphaU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4404
                Character.isAlphabetic(cp)!= alphaP.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4405
                Character.isAlphabetic(cp)!= alphaJ.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4406
                // digit
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4407
                POSIX_ASCII.isDigit(cp)   != digit.reset(str).matches()  ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4408
                Character.isDigit(cp)     != digitU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4409
                // alnum
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4410
                POSIX_ASCII.isAlnum(cp)   != alnum.reset(str).matches()  ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4411
                POSIX_Unicode.isAlnum(cp) != alnumU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4412
                // punct
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4413
                POSIX_ASCII.isPunct(cp)   != punct.reset(str).matches()  ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4414
                POSIX_Unicode.isPunct(cp) != punctU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4415
                // graph
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4416
                POSIX_ASCII.isGraph(cp)   != graph.reset(str).matches()  ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4417
                POSIX_Unicode.isGraph(cp) != graphU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4418
                POSIX_Unicode.isGraph(cp) != graphEU.reset(str).matches()||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4419
                // blank
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4420
                POSIX_ASCII.isType(cp, POSIX_ASCII.BLANK)
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4421
                                          != blank.reset(str).matches()  ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4422
                POSIX_Unicode.isBlank(cp) != blankU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4423
                // print
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4424
                POSIX_ASCII.isPrint(cp)   != print.reset(str).matches()  ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4425
                POSIX_Unicode.isPrint(cp) != printU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4426
                // cntrl
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4427
                POSIX_ASCII.isCntrl(cp)   != cntrl.reset(str).matches()  ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4428
                POSIX_Unicode.isCntrl(cp) != cntrlU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4429
                (Character.CONTROL == type) != cntrlP.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4430
                // hexdigit
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4431
                POSIX_ASCII.isHexDigit(cp)   != xdigit.reset(str).matches()  ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4432
                POSIX_Unicode.isHexDigit(cp) != xdigitU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4433
                // space
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4434
                POSIX_ASCII.isSpace(cp)   != space.reset(str).matches()  ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4435
                POSIX_Unicode.isSpace(cp) != spaceU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4436
                POSIX_Unicode.isSpace(cp) != spaceP.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4437
                // word
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4438
                POSIX_ASCII.isWord(cp)   != word.reset(str).matches()  ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4439
                POSIX_Unicode.isWord(cp) != wordU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4440
                POSIX_Unicode.isWord(cp) != wordEU.reset(str).matches()||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4441
                // bwordb
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4442
                POSIX_ASCII.isWord(cp) != bwb.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4443
                POSIX_Unicode.isWord(cp) != bwbU.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4444
                // properties
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4445
                Character.isTitleCase(cp) != titleP.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4446
                Character.isLetter(cp)    != letterP.reset(str).matches()||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4447
                Character.isIdeographic(cp) != ideogP.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4448
                Character.isIdeographic(cp) != ideogJ.reset(str).matches() ||
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4449
                (Character.UNASSIGNED == type) == definedP.reset(str).matches() ||
17434
4a04d7127e80 8013252: Regex Matcher .start and .end should be accessible by group name
sherman
parents: 17183
diff changeset
  4450
                POSIX_Unicode.isNoncharacterCodePoint(cp) != nonCCPP.reset(str).matches() ||
38450
516990ff3a4c 8143282: \p{Cn} unassigned code points should be included in \p{C}
sherman
parents: 37882
diff changeset
  4451
                POSIX_Unicode.isJoinControl(cp) != joinCrtl.reset(str).matches() ||
516990ff3a4c 8143282: \p{Cn} unassigned code points should be included in \p{C}
sherman
parents: 37882
diff changeset
  4452
                // gc_C
516990ff3a4c 8143282: \p{Cn} unassigned code points should be included in \p{C}
sherman
parents: 37882
diff changeset
  4453
                (Character.CONTROL == type || Character.FORMAT == type ||
516990ff3a4c 8143282: \p{Cn} unassigned code points should be included in \p{C}
sherman
parents: 37882
diff changeset
  4454
                 Character.PRIVATE_USE == type || Character.SURROGATE == type ||
516990ff3a4c 8143282: \p{Cn} unassigned code points should be included in \p{C}
sherman
parents: 37882
diff changeset
  4455
                 Character.UNASSIGNED == type)
516990ff3a4c 8143282: \p{Cn} unassigned code points should be included in \p{C}
sherman
parents: 37882
diff changeset
  4456
                != gcC.reset(str).matches()) {
9536
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4457
                failCount++;
38450
516990ff3a4c 8143282: \p{Cn} unassigned code points should be included in \p{C}
sherman
parents: 37882
diff changeset
  4458
            }
9536
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4459
        }
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4460
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4461
        // bounds/word align
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4462
        twoFindIndexes(" \u0180sherman\u0400 ", bound, 1, 10);
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4463
        if (!bwbU.reset("\u0180sherman\u0400").matches())
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4464
            failCount++;
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4465
        twoFindIndexes(" \u0180sh\u0345erman\u0400 ", bound, 1, 11);
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4466
        if (!bwbU.reset("\u0180sh\u0345erman\u0400").matches())
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4467
            failCount++;
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4468
        twoFindIndexes(" \u0724\u0739\u0724 ", bound, 1, 4);
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4469
        if (!bwbU.reset("\u0724\u0739\u0724").matches())
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4470
            failCount++;
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4471
        if (!bwbEU.reset("\u0724\u0739\u0724").matches())
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4472
            failCount++;
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4473
        report("unicodePredefinedClasses");
648c9add2a74 7039066: j.u.rgex does not match TR18 RL1.4 Simple Word Boundaries and RL1.2 Properties
sherman
parents: 9035
diff changeset
  4474
    }
12675
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4475
35783
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4476
    private static void unicodeCharacterNameTest() throws Exception {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4477
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4478
        for (int cp = 0; cp < Character.MAX_CODE_POINT; cp++) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4479
            if (!Character.isValidCodePoint(cp) ||
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4480
                Character.getType(cp) == Character.UNASSIGNED)
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4481
                continue;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4482
            String str = new String(Character.toChars(cp));
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4483
            // single
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4484
            String p = "\\N{" + Character.getName(cp) + "}";
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4485
            if (!Pattern.compile(p).matcher(str).matches()) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4486
                failCount++;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4487
            }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4488
            // class[c]
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4489
            p = "[\\N{" + Character.getName(cp) + "}]";
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4490
            if (!Pattern.compile(p).matcher(str).matches()) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4491
                failCount++;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4492
            }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4493
        }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4494
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4495
        // range
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4496
        for (int i = 0; i < 10; i++) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4497
            int start = generator.nextInt(20);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4498
            int end = start + generator.nextInt(200);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4499
            String p = "[\\N{" + Character.getName(start) + "}-\\N{" + Character.getName(end) + "}]";
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4500
            String str;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4501
            for (int cp = start; cp < end; cp++) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4502
                str = new String(Character.toChars(cp));
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4503
                if (!Pattern.compile(p).matcher(str).matches()) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4504
                    failCount++;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4505
                }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4506
            }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4507
            str = new String(Character.toChars(end + 10));
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4508
            if (Pattern.compile(p).matcher(str).matches()) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4509
                failCount++;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4510
            }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4511
        }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4512
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4513
        // slice
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4514
        for (int i = 0; i < 10; i++) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4515
            int n = generator.nextInt(256);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4516
            int[] buf = new int[n];
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4517
            StringBuffer sb = new StringBuffer(1024);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4518
            for (int j = 0; j < n; j++) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4519
                int cp = generator.nextInt(1000);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4520
                if (!Character.isValidCodePoint(cp) ||
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4521
                    Character.getType(cp) == Character.UNASSIGNED)
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4522
                    cp = 0x4e00;    // just use 4e00
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4523
                sb.append("\\N{" + Character.getName(cp) + "}");
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4524
                buf[j] = cp;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4525
            }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4526
            String p = sb.toString();
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4527
            String str = new String(buf, 0, buf.length);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4528
            if (!Pattern.compile(p).matcher(str).matches()) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4529
                failCount++;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4530
            }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4531
        }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4532
        report("unicodeCharacterName");
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4533
    }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4534
12675
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4535
    private static void horizontalAndVerticalWSTest() throws Exception {
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4536
        String hws = new String (new char[] {
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4537
                                     0x09, 0x20, 0xa0, 0x1680, 0x180e,
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4538
                                     0x2000, 0x2001, 0x2002, 0x2003, 0x2004, 0x2005,
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4539
                                     0x2006, 0x2007, 0x2008, 0x2009, 0x200a,
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4540
                                     0x202f, 0x205f, 0x3000 });
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4541
        String vws = new String (new char[] {
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4542
                                     0x0a, 0x0b, 0x0c, 0x0d, 0x85, 0x2028, 0x2029 });
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4543
        if (!Pattern.compile("\\h+").matcher(hws).matches() ||
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4544
            !Pattern.compile("[\\h]+").matcher(hws).matches())
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4545
            failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4546
        if (Pattern.compile("\\H").matcher(hws).find() ||
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4547
            Pattern.compile("[\\H]").matcher(hws).find())
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4548
            failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4549
        if (!Pattern.compile("\\v+").matcher(vws).matches() ||
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4550
            !Pattern.compile("[\\v]+").matcher(vws).matches())
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4551
            failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4552
        if (Pattern.compile("\\V").matcher(vws).find() ||
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4553
            Pattern.compile("[\\V]").matcher(vws).find())
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4554
            failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4555
        String prefix = "abcd";
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4556
        String suffix = "efgh";
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4557
        String ng = "A";
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4558
        for (int i = 0; i < hws.length(); i++) {
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4559
            String c = String.valueOf(hws.charAt(i));
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4560
            Matcher m = Pattern.compile("\\h").matcher(prefix + c + suffix);
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4561
            if (!m.find() || !c.equals(m.group()))
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4562
                failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4563
            m = Pattern.compile("[\\h]").matcher(prefix + c + suffix);
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4564
            if (!m.find() || !c.equals(m.group()))
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4565
                failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4566
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4567
            m = Pattern.compile("\\H").matcher(hws.substring(0, i) + ng + hws.substring(i));
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4568
            if (!m.find() || !ng.equals(m.group()))
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4569
                failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4570
            m = Pattern.compile("[\\H]").matcher(hws.substring(0, i) + ng + hws.substring(i));
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4571
            if (!m.find() || !ng.equals(m.group()))
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4572
                failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4573
        }
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4574
        for (int i = 0; i < vws.length(); i++) {
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4575
            String c = String.valueOf(vws.charAt(i));
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4576
            Matcher m = Pattern.compile("\\v").matcher(prefix + c + suffix);
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4577
            if (!m.find() || !c.equals(m.group()))
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4578
                failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4579
            m = Pattern.compile("[\\v]").matcher(prefix + c + suffix);
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4580
            if (!m.find() || !c.equals(m.group()))
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4581
                failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4582
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4583
            m = Pattern.compile("\\V").matcher(vws.substring(0, i) + ng + vws.substring(i));
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4584
            if (!m.find() || !ng.equals(m.group()))
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4585
                failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4586
            m = Pattern.compile("[\\V]").matcher(vws.substring(0, i) + ng + vws.substring(i));
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4587
            if (!m.find() || !ng.equals(m.group()))
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4588
                failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4589
        }
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4590
        // \v in range is interpreted as 0x0B. This is the undocumented behavior
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4591
        if (!Pattern.compile("[\\v-\\v]").matcher(String.valueOf((char)0x0B)).matches())
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4592
            failCount++;
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4593
        report("horizontalAndVerticalWSTest");
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4594
    }
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4595
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4596
    private static void linebreakTest() throws Exception {
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4597
        String linebreaks = new String (new char[] {
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4598
            0x0A, 0x0B, 0x0C, 0x0D, 0x85, 0x2028, 0x2029 });
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4599
        String crnl = "\r\n";
44122
65a14579a2ae 8176029: Linebreak matcher is not equivalent to the pattern as stated in javadoc
sherman
parents: 38777
diff changeset
  4600
        if (!(Pattern.compile("\\R+").matcher(linebreaks).matches() &&
65a14579a2ae 8176029: Linebreak matcher is not equivalent to the pattern as stated in javadoc
sherman
parents: 38777
diff changeset
  4601
              Pattern.compile("\\R").matcher(crnl).matches() &&
65a14579a2ae 8176029: Linebreak matcher is not equivalent to the pattern as stated in javadoc
sherman
parents: 38777
diff changeset
  4602
              Pattern.compile("\\Rabc").matcher(crnl + "abc").matches() &&
65a14579a2ae 8176029: Linebreak matcher is not equivalent to the pattern as stated in javadoc
sherman
parents: 38777
diff changeset
  4603
              Pattern.compile("\\Rabc").matcher("\rabc").matches() &&
65a14579a2ae 8176029: Linebreak matcher is not equivalent to the pattern as stated in javadoc
sherman
parents: 38777
diff changeset
  4604
              Pattern.compile("\\R\\R").matcher(crnl).matches() &&  // backtracking
65a14579a2ae 8176029: Linebreak matcher is not equivalent to the pattern as stated in javadoc
sherman
parents: 38777
diff changeset
  4605
              Pattern.compile("\\R\\n").matcher(crnl).matches()) && // backtracking
65a14579a2ae 8176029: Linebreak matcher is not equivalent to the pattern as stated in javadoc
sherman
parents: 38777
diff changeset
  4606
              !Pattern.compile("((?<!\\R)\\s)*").matcher(crnl).matches()) { // #8176029
65a14579a2ae 8176029: Linebreak matcher is not equivalent to the pattern as stated in javadoc
sherman
parents: 38777
diff changeset
  4607
            failCount++;
65a14579a2ae 8176029: Linebreak matcher is not equivalent to the pattern as stated in javadoc
sherman
parents: 38777
diff changeset
  4608
        }
12675
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4609
        report("linebreakTest");
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4610
    }
3b7d71495649 7014640: To add a metachar \R for line ending and character classes for vertical/horizontal ws \v \V \h \H
sherman
parents: 12432
diff changeset
  4611
13554
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4612
    // #7189363
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4613
    private static void branchTest() throws Exception {
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4614
        if (!Pattern.compile("(a)?bc|d").matcher("d").find() ||     // greedy
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4615
            !Pattern.compile("(a)+bc|d").matcher("d").find() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4616
            !Pattern.compile("(a)*bc|d").matcher("d").find() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4617
            !Pattern.compile("(a)??bc|d").matcher("d").find() ||    // reluctant
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4618
            !Pattern.compile("(a)+?bc|d").matcher("d").find() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4619
            !Pattern.compile("(a)*?bc|d").matcher("d").find() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4620
            !Pattern.compile("(a)?+bc|d").matcher("d").find() ||    // possessive
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4621
            !Pattern.compile("(a)++bc|d").matcher("d").find() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4622
            !Pattern.compile("(a)*+bc|d").matcher("d").find() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4623
            !Pattern.compile("(a)?bc|d").matcher("d").matches() ||  // greedy
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4624
            !Pattern.compile("(a)+bc|d").matcher("d").matches() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4625
            !Pattern.compile("(a)*bc|d").matcher("d").matches() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4626
            !Pattern.compile("(a)??bc|d").matcher("d").matches() || // reluctant
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4627
            !Pattern.compile("(a)+?bc|d").matcher("d").matches() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4628
            !Pattern.compile("(a)*?bc|d").matcher("d").matches() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4629
            !Pattern.compile("(a)?+bc|d").matcher("d").matches() || // possessive
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4630
            !Pattern.compile("(a)++bc|d").matcher("d").matches() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4631
            !Pattern.compile("(a)*+bc|d").matcher("d").matches() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4632
            !Pattern.compile("(a)?bc|de").matcher("de").find() ||   // others
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4633
            !Pattern.compile("(a)??bc|de").matcher("de").find() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4634
            !Pattern.compile("(a)?bc|de").matcher("de").matches() ||
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4635
            !Pattern.compile("(a)??bc|de").matcher("de").matches())
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4636
            failCount++;
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4637
        report("branchTest");
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4638
    }
ad737436c54a 7189363: Regex Pattern compilation buggy for special sequences
sherman
parents: 12675
diff changeset
  4639
17183
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4640
    // This test is for 8007395
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4641
    private static void groupCurlyNotFoundSuppTest() throws Exception {
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4642
        String input = "test this as \ud83d\ude0d";
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4643
        for (String pStr : new String[] { "test(.)+(@[a-zA-Z.]+)",
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4644
                                          "test(.)*(@[a-zA-Z.]+)",
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4645
                                          "test([^B])+(@[a-zA-Z.]+)",
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4646
                                          "test([^B])*(@[a-zA-Z.]+)",
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4647
                                          "test(\\P{IsControl})+(@[a-zA-Z.]+)",
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4648
                                          "test(\\P{IsControl})*(@[a-zA-Z.]+)",
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4649
                                        }) {
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4650
            Matcher m = Pattern.compile(pStr, Pattern.CASE_INSENSITIVE)
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4651
                               .matcher(input);
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4652
            try {
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4653
                if (m.find()) {
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4654
                    failCount++;
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4655
                }
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4656
            } catch (Exception x) {
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4657
                failCount++;
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4658
            }
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4659
        }
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4660
        report("GroupCurly NotFoundSupp");
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4661
    }
1e21e0bc10e7 8007395: StringIndexOutofBoundsException in Match.find() when input String contains surrogate UTF-16 characters
sherman
parents: 14342
diff changeset
  4662
19604
f96e3aef2081 8023647: "abc1c".matches("(\\w)+1\\1")) returns false
sherman
parents: 17447
diff changeset
  4663
    // This test is for 8023647
f96e3aef2081 8023647: "abc1c".matches("(\\w)+1\\1")) returns false
sherman
parents: 17447
diff changeset
  4664
    private static void groupCurlyBackoffTest() throws Exception {
f96e3aef2081 8023647: "abc1c".matches("(\\w)+1\\1")) returns false
sherman
parents: 17447
diff changeset
  4665
        if (!"abc1c".matches("(\\w)+1\\1") ||
f96e3aef2081 8023647: "abc1c".matches("(\\w)+1\\1")) returns false
sherman
parents: 17447
diff changeset
  4666
            "abc11".matches("(\\w)+1\\1")) {
f96e3aef2081 8023647: "abc1c".matches("(\\w)+1\\1")) returns false
sherman
parents: 17447
diff changeset
  4667
            failCount++;
f96e3aef2081 8023647: "abc1c".matches("(\\w)+1\\1")) returns false
sherman
parents: 17447
diff changeset
  4668
        }
f96e3aef2081 8023647: "abc1c".matches("(\\w)+1\\1")) returns false
sherman
parents: 17447
diff changeset
  4669
        report("GroupCurly backoff");
f96e3aef2081 8023647: "abc1c".matches("(\\w)+1\\1")) returns false
sherman
parents: 17447
diff changeset
  4670
    }
f96e3aef2081 8023647: "abc1c".matches("(\\w)+1\\1")) returns false
sherman
parents: 17447
diff changeset
  4671
17447
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4672
    // This test is for 8012646
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4673
    private static void patternAsPredicate() throws Exception {
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4674
        Predicate<String> p = Pattern.compile("[a-z]+").asPredicate();
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4675
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4676
        if (p.test("")) {
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4677
            failCount++;
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4678
        }
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4679
        if (!p.test("word")) {
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4680
            failCount++;
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4681
        }
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4682
        if (p.test("1234")) {
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4683
            failCount++;
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4684
        }
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4685
        report("Pattern.asPredicate");
3031deba3fbe 8012646: Pattern.splitAsStream
psandoz
parents: 17434
diff changeset
  4686
    }
25523
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4687
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4688
    // This test is for 8035975
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4689
    private static void invalidFlags() throws Exception {
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4690
        for (int flag = 1; flag != 0; flag <<= 1) {
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4691
            switch (flag) {
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4692
            case Pattern.CASE_INSENSITIVE:
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4693
            case Pattern.MULTILINE:
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4694
            case Pattern.DOTALL:
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4695
            case Pattern.UNICODE_CASE:
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4696
            case Pattern.CANON_EQ:
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4697
            case Pattern.UNIX_LINES:
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4698
            case Pattern.LITERAL:
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4699
            case Pattern.UNICODE_CHARACTER_CLASS:
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4700
            case Pattern.COMMENTS:
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4701
                // valid flag, continue
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4702
                break;
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4703
            default:
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4704
                try {
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4705
                    Pattern.compile(".", flag);
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4706
                    failCount++;
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4707
                } catch (IllegalArgumentException expected) {
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4708
                }
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4709
            }
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4710
        }
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4711
        report("Invalid compile flags");
c751d1010164 8035975: Pattern.compile(String, int) fails to throw IllegalArgumentException
igerasim
parents: 23734
diff changeset
  4712
    }
35783
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4713
38777
826eb7091523 8158482: regex UNICODE_CHARACTER_CLASS flag cannot be disabled with an embedded flag expression
sherman
parents: 38450
diff changeset
  4714
    // This test is for 8158482
826eb7091523 8158482: regex UNICODE_CHARACTER_CLASS flag cannot be disabled with an embedded flag expression
sherman
parents: 38450
diff changeset
  4715
    private static void embeddedFlags() throws Exception {
826eb7091523 8158482: regex UNICODE_CHARACTER_CLASS flag cannot be disabled with an embedded flag expression
sherman
parents: 38450
diff changeset
  4716
        try {
826eb7091523 8158482: regex UNICODE_CHARACTER_CLASS flag cannot be disabled with an embedded flag expression
sherman
parents: 38450
diff changeset
  4717
            Pattern.compile("(?i).(?-i).");
826eb7091523 8158482: regex UNICODE_CHARACTER_CLASS flag cannot be disabled with an embedded flag expression
sherman
parents: 38450
diff changeset
  4718
            Pattern.compile("(?m).(?-m).");
826eb7091523 8158482: regex UNICODE_CHARACTER_CLASS flag cannot be disabled with an embedded flag expression
sherman
parents: 38450
diff changeset
  4719
            Pattern.compile("(?s).(?-s).");
826eb7091523 8158482: regex UNICODE_CHARACTER_CLASS flag cannot be disabled with an embedded flag expression
sherman
parents: 38450
diff changeset
  4720
            Pattern.compile("(?d).(?-d).");
826eb7091523 8158482: regex UNICODE_CHARACTER_CLASS flag cannot be disabled with an embedded flag expression
sherman
parents: 38450
diff changeset
  4721
            Pattern.compile("(?u).(?-u).");
826eb7091523 8158482: regex UNICODE_CHARACTER_CLASS flag cannot be disabled with an embedded flag expression
sherman
parents: 38450
diff changeset
  4722
            Pattern.compile("(?c).(?-c).");
826eb7091523 8158482: regex UNICODE_CHARACTER_CLASS flag cannot be disabled with an embedded flag expression
sherman
parents: 38450
diff changeset
  4723
            Pattern.compile("(?x).(?-x).");
826eb7091523 8158482: regex UNICODE_CHARACTER_CLASS flag cannot be disabled with an embedded flag expression
sherman
parents: 38450
diff changeset
  4724
            Pattern.compile("(?U).(?-U).");
826eb7091523 8158482: regex UNICODE_CHARACTER_CLASS flag cannot be disabled with an embedded flag expression
sherman
parents: 38450
diff changeset
  4725
            Pattern.compile("(?imsducxU).(?-imsducxU).");
826eb7091523 8158482: regex UNICODE_CHARACTER_CLASS flag cannot be disabled with an embedded flag expression
sherman
parents: 38450
diff changeset
  4726
        } catch (PatternSyntaxException x) {
826eb7091523 8158482: regex UNICODE_CHARACTER_CLASS flag cannot be disabled with an embedded flag expression
sherman
parents: 38450
diff changeset
  4727
            failCount++;
826eb7091523 8158482: regex UNICODE_CHARACTER_CLASS flag cannot be disabled with an embedded flag expression
sherman
parents: 38450
diff changeset
  4728
        }
826eb7091523 8158482: regex UNICODE_CHARACTER_CLASS flag cannot be disabled with an embedded flag expression
sherman
parents: 38450
diff changeset
  4729
        report("Embedded flags");
826eb7091523 8158482: regex UNICODE_CHARACTER_CLASS flag cannot be disabled with an embedded flag expression
sherman
parents: 38450
diff changeset
  4730
    }
826eb7091523 8158482: regex UNICODE_CHARACTER_CLASS flag cannot be disabled with an embedded flag expression
sherman
parents: 38450
diff changeset
  4731
35783
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4732
    private static void grapheme() throws Exception {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4733
        Files.lines(Paths.get(System.getProperty("test.src", "."),
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4734
                              "GraphemeBreakTest.txt"))
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4735
            .filter( ln -> ln.length() != 0 && !ln.startsWith("#") )
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4736
            .forEach( ln -> {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4737
                    ln = ln.replaceAll("\\s+|\\([a-zA-Z]+\\)|\\[[a-zA-Z]]+\\]|#.*", "");
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4738
                    // System.out.println(str);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4739
                    String[] strs = ln.split("\u00f7|\u00d7");
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4740
                    StringBuilder src = new StringBuilder();
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4741
                    ArrayList<String> graphemes = new ArrayList<>();
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4742
                    StringBuilder buf = new StringBuilder();
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4743
                    int offBk = 0;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4744
                    for (String str : strs) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4745
                        if (str.length() == 0)  // first empty str
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4746
                            continue;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4747
                        int cp = Integer.parseInt(str, 16);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4748
                        src.appendCodePoint(cp);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4749
                        buf.appendCodePoint(cp);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4750
                        offBk += (str.length() + 1);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4751
                        if (ln.charAt(offBk) == '\u00f7') {    // DIV
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4752
                            graphemes.add(buf.toString());
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4753
                            buf = new StringBuilder();
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4754
                        }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4755
                    }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4756
                    Pattern p = Pattern.compile("\\X");
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4757
                    Matcher m = p.matcher(src.toString());
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4758
                    Scanner s = new Scanner(src.toString()).useDelimiter("\\b{g}");
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4759
                    for (String g : graphemes) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4760
                        // System.out.printf("     grapheme:=[%s]%n", g);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4761
                        // (1) test \\X directly
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4762
                        if (!m.find() || !m.group().equals(g)) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4763
                            System.out.println("Failed \\X [" + ln + "] : " + g);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4764
                            failCount++;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4765
                        }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4766
                        // (2) test \\b{g} + \\X  via Scanner
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4767
                        boolean hasNext = s.hasNext(p);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4768
                        // if (!s.hasNext() || !s.next().equals(next)) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4769
                        if (!s.hasNext(p) || !s.next(p).equals(g)) {
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4770
                            System.out.println("Failed b{g} [" + ln + "] : " + g);
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4771
                            failCount++;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4772
                        }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4773
                    }
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4774
                });
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4775
        // some sanity checks
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4776
        if (!Pattern.compile("\\X{10}").matcher("abcdefghij").matches() ||
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4777
            !Pattern.compile("\\b{g}(?:\\X\\b{g}){5}\\b{g}").matcher("abcde").matches() ||
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4778
            !Pattern.compile("(?:\\X\\b{g}){2}").matcher("\ud800\udc00\ud801\udc02").matches())
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4779
            failCount++;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4780
        // make sure "\b{n}" still works
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4781
        if (!Pattern.compile("\\b{1}hello\\b{1} \\b{1}world\\b{1}").matcher("hello world").matches())
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4782
            failCount++;
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4783
        report("Unicode extended grapheme cluster");
2690535d72cc 7071819: To support Extended Grapheme Clusters in Regex
sherman
parents: 34436
diff changeset
  4784
    }
37882
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4785
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4786
    // hangup/timeout if go into exponential backtracking
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4787
    private static void expoBacktracking() throws Exception {
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4788
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4789
        Object[][] patternMatchers = {
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4790
            // 6328855
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4791
            { "(.*\n*)*",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4792
              "this little fine string lets\r\njava.lang.String.matches\r\ncrash\r\n(We don't know why but adding \r* to the regex makes it work again)",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4793
              false },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4794
            // 6192895
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4795
            { " *([a-zA-Z0-9/\\-\\?:\\(\\)\\.,'\\+\\{\\}]+ *)+",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4796
              "Hello World this is a test this is a test this is a test A",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4797
              true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4798
            { " *([a-zA-Z0-9/\\-\\?:\\(\\)\\.,'\\+\\{\\}]+ *)+",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4799
              "Hello World this is a test this is a test this is a test \u4e00 ",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4800
              false },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4801
            { " *([a-z0-9]+ *)+",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4802
              "hello world this is a test this is a test this is a test A",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4803
              false },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4804
            // 4771934 [FIXED] #5013651?
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4805
            { "^(\\w+([\\.-]?\\w+)*@\\w+([\\.-]?\\w+)*(\\.\\w{2,4})+[,;]?)+$",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4806
              "abc@efg.abc,efg@abc.abc,abc@xyz.mno;abc@sdfsd.com",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4807
              true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4808
            // 4866249 [FIXED]
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4809
            { "<\\s*" + "(meta|META)" + "(\\s|[^>])+" + "(CHARSET|charset)=" + "(\\s|[^>])+>",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4810
              "<META http-equiv=\"Content-Type\" content=\"text/html; charset=ISO-8859-5\">",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4811
              true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4812
            { "^(\\w+([\\.-]?\\w+)*@\\w+([\\.-]?\\w+)*(\\.\\w{2,4})+[,;]?)+$",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4813
              "abc@efg.abc,efg@abc.abc,abc@xyz.mno;sdfsd.com",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4814
              false },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4815
            // 6345469
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4816
            { "((<[^>]+>)?(((\\s)?)*(\\&nbsp;)?)*((\\s)?)*)+",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4817
              "&nbsp;&nbsp; < br/> &nbsp; < / p> <p> <html> <adfasfdasdf>&nbsp; </p>",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4818
              true }, // --> matched
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4819
            { "((<[^>]+>)?(((\\s)?)*(\\&nbsp;)?)*((\\s)?)*)+",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4820
              "&nbsp;&nbsp; < br/> &nbsp; < / p> <p> <html> <adfasfdasdf>&nbsp; p </p>",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4821
              false },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4822
            // 5026912
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4823
            { "^\\s*" + "(\\w|\\d|[\\xC0-\\xFF]|/)+" + "\\s+|$",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4824
              "156580451111112225588087755221111111566969655555555",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4825
              false},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4826
            // 6988218
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4827
            { "^([+-]?((0[xX](\\p{XDigit}+))|(((\\p{Digit}+)(\\.)?((\\p{Digit}+)?)([eE][+-]?(\\p{Digit}+))?)|(\\.((\\p{Digit}+))([eE][+-]?(\\p{Digit}+))?)))|[n|N]?'([^']*(?:'')*[^']*)*')",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4828
              "'%)) order by ANGEBOT.ID",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4829
              false},    // find
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4830
            // 6693451
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4831
            { "^(\\s*foo\\s*)*$",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4832
              "foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4833
              true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4834
            { "^(\\s*foo\\s*)*$",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4835
              "foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo foo fo",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4836
              false
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4837
            },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4838
            // 7006761
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4839
            { "(([0-9A-Z]+)([_]?+)*)*", "FOOOOO_BAAAR_FOOOOOOOOO_BA_", true},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4840
            { "(([0-9A-Z]+)([_]?+)*)*", "FOOOOO_BAAAR_FOOOOOOOOO_BA_ ", false},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4841
            // 8140212
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4842
            { "(?<before>.*)\\{(?<reflection>\\w+):(?<innerMethod>\\w+(\\.?\\w+(\\(((?<args>(('[^']*')|((/|\\w)+))(,(('[^']*')|((/|\\w)+)))*))?\\))?)*)\\}(?<after>.*)",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4843
              "{CeGlobal:getSodCutoff.getGui.getAmqp.getSimpleModeEnabled()",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4844
              false
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4845
            },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4846
            { "^(a+)+$", "aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa", true},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4847
            { "^(a+)+$", "aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa!", false},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4848
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4849
            { "(x+)*y",  "xxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxy", true },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4850
            { "(x+)*y",  "xxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxz", false},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4851
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4852
            { "(x+x+)+y", "xxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxy", true},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4853
            { "(x+x+)+y", "xxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxz", false},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4854
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4855
            { "(([0-9A-Z]+)([_]?+)*)*", "--------------------------------------", false},
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4856
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4857
            /* not fixed
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4858
            //8132141   --->    second level exponential backtracking
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4859
            { "(h|h|ih(((i|a|c|c|a|i|i|j|b|a|i|b|a|a|j))+h)ahbfhba|c|i)*",
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4860
              "hchcchicihcchciiicichhcichcihcchiihichiciiiihhcchicchhcihchcihiihciichhccciccichcichiihcchcihhicchcciicchcccihiiihhihihihichicihhcciccchihhhcchichchciihiicihciihcccciciccicciiiiiiiiicihhhiiiihchccchchhhhiiihchihcccchhhiiiiiiiicicichicihcciciihichhhhchihciiihhiccccccciciihhichiccchhicchicihihccichicciihcichccihhiciccccccccichhhhihihhcchchihihiihhihihihicichihiiiihhhhihhhchhichiicihhiiiiihchccccchichci" },
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4861
            */
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4862
        };
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4863
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4864
        for (Object[] pm : patternMatchers) {
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4865
            String p = (String)pm[0];
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4866
            String s = (String)pm[1];
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4867
            boolean r = (Boolean)pm[2];
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4868
            if (r != Pattern.compile(p).matcher(s).matches()) {
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4869
                failCount++;
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4870
            }
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4871
        }
e7f3cf12e739 6328855: String: Matches hangs at short and easy Strings containing \r \n
sherman
parents: 35783
diff changeset
  4872
    }
2070
6e9972fbd965 6350801: Add support for named (instead of numbered) capture groups in regular expression
sherman
parents:
diff changeset
  4873
}