test/jdk/java/lang/String/SpecialCasingTest.java
author jlaskey
Fri, 18 May 2018 08:43:49 -0300
changeset 50175 589ed2770141
parent 50045 d9d55f64d136
child 55013 8dae495a59e7
permissions -rw-r--r--
8200436: String::isBlank Reviewed-by: sundar
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
50045
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
     1
/*
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
     2
 * Copyright (c) 2018, Oracle and/or its affiliates. All rights reserved.
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
     3
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
     4
 *
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
     5
 * This code is free software; you can redistribute it and/or modify it
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
     6
 * under the terms of the GNU General Public License version 2 only, as
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
     7
 * published by the Free Software Foundation.  Oracle designates this
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
     8
 * particular file as subject to the "Classpath" exception as provided
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
     9
 * by Oracle in the LICENSE file that accompanied this code.
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    10
 *
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    11
 * This code is distributed in the hope that it will be useful, but WITHOUT
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    12
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    13
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    14
 * version 2 for more details (a copy is included in the LICENSE file that
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    15
 * accompanied this code).
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    16
 *
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    17
 * You should have received a copy of the GNU General Public License version
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    18
 * 2 along with this work; if not, write to the Free Software Foundation,
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    19
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    20
 *
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    21
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    22
 * or visit www.oracle.com if you need additional information or have any
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    23
 * questions.
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    24
 */
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    25
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    26
/*
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    27
 * @test
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    28
 * @bug 4397357 6565620 6959267 7070436 7198195 8041791 8032446 8072600
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    29
 * @summary Confirm special case mappings are handled correctly.
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    30
 */
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    31
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    32
import java.io.BufferedReader;
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    33
import java.io.IOException;
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    34
import java.nio.file.Files;
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    35
import java.nio.file.Paths;
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    36
import java.util.ArrayList;
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    37
import java.util.List;
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    38
import java.util.Locale;
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    39
import java.util.StringTokenizer;
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    40
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    41
public class SpecialCasingTest {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    42
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    43
    private static boolean err = false;
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    44
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    45
    // Locales which are used for testing
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    46
    private static List<Locale> locales = new ArrayList<>();
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    47
    static {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    48
        locales.add(new Locale("az", ""));
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    49
        locales.addAll(java.util.Arrays.asList(Locale.getAvailableLocales()));
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    50
    }
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    51
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    52
    // Default locale
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    53
    private static String defaultLang;
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    54
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    55
    // True if the default language is az, lt, or tr which has locale-specific
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    56
    // mappings.
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    57
    private static boolean specificLocale;
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    58
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    59
    // Additional test cases
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    60
    //   Pseudo-locales which are used here:
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    61
    //     L1: locales other than lt
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    62
    //     L2: locales other than az and tr
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    63
    //     L3: locales other than az, lt and tr
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    64
    private static final String[] additionalTestData = {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    65
        // Format:
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    66
        //   <code>; <lower>; <title>; <upper>; (<condition_list>)
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    67
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    68
        // Counterpart of Final_Sigma test case
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    69
        //   03A3; 03C2; 03A3; 03A3; Final_Sigma
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    70
            "03A3; 03C3; 03A3; 03A3; SunSpecific_Not_Final_Sigma1",
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    71
            "03A3; 03C3; 03A3; 03A3; SunSpecific_Not_Final_Sigma2",
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    72
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    73
        // Counterpart of After_Soft_Dotted test case
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    74
        //   0307; 0307;     ;     ; lt After_Soft_Dotted
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    75
            "0307; 0307; 0307; 0307; L1 After_Soft_Dotted",
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    76
            "0307; 0307; 0307; 0307; lt SunSpecific_Not_After_Soft_Dotted",
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    77
            "0307; 0307; 0307; 0307; L1 SunSpecific_Not_After_Soft_Dotted",
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    78
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    79
        // Counterpart of More_Above test cases
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    80
        //   0049; 0069 0307; 0049; 0049; lt More_Above
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    81
            "0049; 0131     ; 0049; 0049; az More_Above",
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    82
            "0049; 0131     ; 0049; 0049; tr More_Above",
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    83
            "0049; 0069     ; 0049; 0049; L3 More_Above",
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    84
            "0049; 0069     ; 0049; 0049; lt SunSpecific_Not_More_Above",
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    85
            "0049; 0131     ; 0049; 0049; az SunSpecific_Not_More_Above",
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    86
            "0049; 0131     ; 0049; 0049; tr SunSpecific_Not_More_Above",
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    87
            "0049; 0069     ; 0049; 0049; L3 SunSpecific_Not_More_Above",
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    88
        //   004A; 006A 0307; 004A; 004A; lt More_Above
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    89
            "004A; 006A     ; 004A; 004A; L1 More_Above",
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    90
            "004A; 006A     ; 004A; 004A; lt SunSpecific_Not_More_Above",
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    91
            "004A; 006A     ; 004A; 004A; L1 SunSpecific_Not_More_Above",
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    92
        //   012E; 012F 0307; 012E; 012E; lt More_Above
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    93
            "012E; 012F     ; 012E; 012E; L1 More_Above",
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    94
            "012E; 012F     ; 012E; 012E; lt SunSpecific_Not_More_Above",
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    95
            "012E; 012F     ; 012E; 012E; L1 SunSpecific_Not_More_Above",
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    96
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    97
        // Counterpart of After_I test cases
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    98
        //   0307;          ; 0307; 0307; tr After_I
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
    99
        //   0307;          ; 0307; 0307; az After_I
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   100
            "0307; 0307 0307; 0307; 0307; lt After_I",
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   101
            "0307; 0307     ; 0307; 0307; L3 After_I",
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   102
            "0307; 0307     ; 0307; 0307; tr SunSpecific_Not_After_I",
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   103
            "0307; 0307     ; 0307; 0307; az SunSpecific_Not_After_I",
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   104
            "0307; 0307     ; 0307; 0307; L2 SunSpecific_Not_After_I",
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   105
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   106
        // Counterpart of Not_Before_Dot test cases
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   107
        //   0049; 0131          ; 0049; 0049; tr Not_Before_Dot
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   108
        //   0049; 0131          ; 0049; 0049; az Not_Before_Dot
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   109
            "0049; 0069          ; 0049; 0049; L2 Not_Before_Dot",
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   110
            "0049; 0069          ; 0049; 0049; tr SunSpecific_Before_Dot",
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   111
            "0049; 0069          ; 0049; 0049; az SunSpecific_Before_Dot",
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   112
            "0049; 0069 0307 0307; 0049; 0049; lt SunSpecific_Before_Dot",
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   113
            "0049; 0069 0307     ; 0049; 0049; L3 SunSpecific_Before_Dot",
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   114
    };
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   115
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   116
    public static void main (String[] args) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   117
        SpecialCasingTest specialCasingTest = new SpecialCasingTest();
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   118
        specialCasingTest.test();
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   119
    }
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   120
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   121
    private void test ()  {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   122
        Locale defaultLocale = Locale.getDefault();
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   123
        BufferedReader in = null;
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   124
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   125
        try {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   126
            int locale_num = locales.size();
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   127
            for (int l = 0; l < locale_num; l++) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   128
                Locale locale = locales.get(l);
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   129
                Locale.setDefault(locale);
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   130
                System.out.println("Testing on " + locale + " locale....");
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   131
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   132
                defaultLang = locale.getLanguage();
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   133
                if (defaultLang.equals("az") ||
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   134
                    defaultLang.equals("lt") ||
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   135
                    defaultLang.equals("tr")) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   136
                    specificLocale = true;
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   137
                } else {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   138
                    specificLocale = false;
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   139
                }
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   140
                in = Files.newBufferedReader(Paths.get(System.getProperty("test.src.path"), "..", "/Character/SpecialCasing.txt")
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   141
                     .toRealPath());
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   142
                String line;
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   143
                while ((line = in.readLine()) != null) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   144
                    if (line.length() == 0 || line.charAt(0) == '#') {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   145
                        continue;
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   146
                    }
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   147
                    test(line);
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   148
                }
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   149
                in.close();
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   150
                in = null;
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   151
                System.out.println("Testing with Sun original data....");
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   152
                for (String additionalTestData1 : additionalTestData) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   153
                    test(additionalTestData1);
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   154
                }
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   155
            }
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   156
        }
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   157
        catch (IOException e) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   158
            err = true;
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   159
            e.printStackTrace();
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   160
        }
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   161
        finally {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   162
            if (in != null) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   163
                try {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   164
                    in.close();
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   165
                }
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   166
                catch (IOException e) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   167
                }
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   168
            }
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   169
            Locale.setDefault(defaultLocale);
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   170
            if (err) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   171
                throw new RuntimeException("SpecialCasingTest failed.");
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   172
            } else {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   173
                System.out.println("*** SpecialCasingTest passed.");
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   174
            }
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   175
        }
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   176
    }
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   177
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   178
    private void test(String line) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   179
        int index = line.indexOf('#');
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   180
        if (index != -1) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   181
            line = line.substring(0, index);
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   182
        }
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   183
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   184
        String lang = null;
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   185
        String condition = null;
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   186
        String[] fields = line.split("; ");
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   187
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   188
        for (int i = 0; i < 4; i++) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   189
            if (fields[i].length() != 0) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   190
                fields[i] = convert(fields[i]);
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   191
            }
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   192
        }
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   193
        if (fields.length != 4) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   194
            StringTokenizer st = new StringTokenizer(fields[4]);
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   195
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   196
            while (st.hasMoreTokens()) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   197
                String token = st.nextToken();
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   198
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   199
                if (token.equals("Final_Sigma")) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   200
                    condition = "Final Sigma";
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   201
                    fields[0] = "Abc" + fields[0];
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   202
                    fields[1] = "abc" + fields[1];
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   203
                    fields[3] = "ABC" + fields[3];
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   204
                } else if (token.equals("SunSpecific_Not_Final_Sigma1")) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   205
                    condition = "*Sun Specific* Not Final Sigma 1";
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   206
                    fields[0] = "Abc" + fields[0] + "xyz";
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   207
                    fields[1] = "abc" + fields[1] + "xyz";
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   208
                    fields[3] = "ABC" + fields[3] + "XYZ";
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   209
                } else if (token.equals("SunSpecific_Not_Final_Sigma2")) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   210
                    condition = "*Sun Specific* Not Final Sigma 2";
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   211
                } else if (token.equals("After_Soft_Dotted")) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   212
                    condition = "After Soft-Dotted";
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   213
                    fields[0] = "\u1E2D" + fields[0];
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   214
                    fields[1] = "\u1E2D" + fields[1];
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   215
                    fields[3] = "\u1E2C" + fields[3];
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   216
                } else if (token.equals("SunSpecific_Not_After_Soft_Dotted")) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   217
                    condition = "*Sun Specific* Not After Soft-Dotted";
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   218
                    fields[0] = "Dot" + fields[0];
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   219
                    fields[1] = "dot" + fields[1];
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   220
                    fields[3] = "DOT" + fields[3];
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   221
                } else if (token.equals("More_Above")) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   222
                    condition = "More Above";
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   223
                    fields[0] = fields[0] + "\u0306";
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   224
                    fields[1] = fields[1] + "\u0306";
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   225
                    fields[3] = fields[3] + "\u0306";
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   226
                } else if (token.equals("SunSpecific_Not_More_Above")) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   227
                    condition = "*Sun Specific* Not More Above";
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   228
                    fields[0] = fields[0] + "breve";
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   229
                    fields[1] = fields[1] + "breve";
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   230
                    fields[3] = fields[3] + "BREVE";
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   231
                } else if (token.equals("After_I")) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   232
                    condition = "After I";
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   233
                    fields[0] = "I" + fields[0];
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   234
                    fields[1] = "i" + fields[1];
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   235
                    fields[3] = "I" + fields[3];
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   236
                } else if (token.equals("SunSpecific_Not_After_I")) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   237
                    condition = "*Sun Specific* Not After I";
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   238
                    fields[0] = "A" + fields[0];
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   239
                    fields[1] = "a" + fields[1];
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   240
                    fields[3] = "A" + fields[3];
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   241
                } else if (token.equals("Not_Before_Dot")) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   242
                    condition = "Not Before Dot";
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   243
                    fields[0] = fields[0] + "Z";
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   244
                    fields[1] = fields[1] + "z";
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   245
                    fields[3] = fields[3] + "Z";
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   246
                } else if (token.equals("SunSpecific_Before_Dot")) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   247
                    condition = "*Sun Specific* Before Dot";
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   248
                    fields[0] = fields[0] + "\u0307";
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   249
                    fields[3] = fields[3] + "\u0307";
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   250
                } else if (token.length() == 2) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   251
                    lang = token;
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   252
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   253
                    if (lang.equals("L1")) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   254
                        if (defaultLang.equals("lt")) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   255
                            lang = "en";
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   256
                        } else {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   257
                            lang = defaultLang;
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   258
                        }
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   259
                    } else if (lang.equals("L2")) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   260
                        if (defaultLang.equals("az") ||
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   261
                            defaultLang.equals("tr")) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   262
                            lang = "en";
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   263
                        } else {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   264
                            lang = defaultLang;
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   265
                        }
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   266
                    } else if (lang.equals("L3")) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   267
                        if (defaultLang.equals("az") ||
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   268
                            defaultLang.equals("lt") ||
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   269
                            defaultLang.equals("tr")) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   270
                            lang = "en";
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   271
                        } else {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   272
                            lang = defaultLang;
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   273
                        }
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   274
                    // I want to have another test case here for double-check.
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   275
                    // Current implementation for Character and String considers
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   276
                    // only az, lt, and tr locales. I want to detect if other
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   277
                    // locales are specified.
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   278
                    } else if (!lang.equals("az") &&
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   279
                               !lang.equals("lt") &&
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   280
                               !lang.equals("tr")) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   281
                        throw new RuntimeException("Unsupported locale: " +
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   282
                            lang + ". It may need to be considered in ConditionalSpecialCasing.java. Please confirm.");
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   283
                    }
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   284
                } else {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   285
                    throw new RuntimeException("Unknown condition: " + token);
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   286
                }
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   287
            }
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   288
        } else if (fields[0].equals("\u0130")) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   289
            // special case for \u0130
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   290
            if (defaultLang.equals("az") ||
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   291
                defaultLang.equals("tr")) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   292
                lang = "en";
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   293
            } else {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   294
                lang = defaultLang;
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   295
            }
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   296
        }
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   297
        testLowerCase(fields[0], fields[1], lang, condition);
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   298
        testUpperCase(fields[0], fields[3], lang, condition);
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   299
    }
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   300
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   301
    private void testLowerCase(String orig, String expected,
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   302
                               String lang, String condition) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   303
        String got = (lang == null) ?
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   304
            orig.toLowerCase() : orig.toLowerCase(new Locale(lang, ""));
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   305
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   306
        if (!expected.equals(got)) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   307
            err = true;
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   308
            System.err.println("toLowerCase(lang=" + lang +
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   309
                ") failed.\n\tOriginal: " + toString(orig) +
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   310
                "\n\tGot:      " + toString(got) +
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   311
                "\n\tExpected: " + toString(expected) +
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   312
                ((condition == null) ? "" : ("\n    under condition(" +
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   313
                condition + ")")));
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   314
        }
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   315
    }
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   316
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   317
    private void testUpperCase(String orig, String expected,
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   318
                               String lang, String condition) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   319
        String got = (lang == null) ?
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   320
            orig.toUpperCase() : orig.toUpperCase(new Locale(lang, ""));
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   321
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   322
        if (!expected.equals(got)) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   323
            err = true;
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   324
            System.err.println("toUpperCase(lang=" + lang +
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   325
                ") failed.\n\tOriginal: " + toString(orig) +
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   326
                "\n\tGot:      " + toString(got) +
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   327
                "\n\tExpected: " + toString(expected) +
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   328
                ((condition == null) ? "" : ("\n    under condition(" +
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   329
                condition + ")")));
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   330
        }
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   331
    }
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   332
    StringBuilder sb = new StringBuilder();
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   333
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   334
    private String convert(String str) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   335
        sb.setLength(0);
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   336
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   337
        String[] tokens = str.split(" ");
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   338
        for (String token : tokens) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   339
            sb.append((char) Integer.parseInt(token, 16));
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   340
        }
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   341
        return sb.toString();
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   342
    }
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   343
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   344
    private String toString(String str) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   345
        sb.setLength(0);
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   346
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   347
        int len = str.length();
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   348
        for (int i = 0; i < len; i++) {
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   349
            sb.append("0x").append(Integer.toHexString(str.charAt(i)).toUpperCase()).append(" ");
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   350
        }
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   351
        return sb.toString();
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   352
    }
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   353
d9d55f64d136 8191410: Unicode 10
rgoel
parents:
diff changeset
   354
}