jdk/src/share/classes/sun/text/resources/CollationData_th.java
author yhuang
Mon, 31 Oct 2011 21:30:11 -0700
changeset 10836 d9ac699afc2a
parent 5506 202f599c92aa
permissions -rw-r--r--
6755060: Collator.compare() does not compare correctly for the Thai locale Reviewed-by: naoto

/*
 * Copyright (c) 2011, Oracle and/or its affiliates. All rights reserved.
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
 *
 * This code is free software; you can redistribute it and/or modify it
 * under the terms of the GNU General Public License version 2 only, as
 * published by the Free Software Foundation.  Oracle designates this
 * particular file as subject to the "Classpath" exception as provided
 * by Oracle in the LICENSE file that accompanied this code.
 *
 * This code is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
 * version 2 for more details (a copy is included in the LICENSE file that
 * accompanied this code).
 *
 * You should have received a copy of the GNU General Public License version
 * 2 along with this work; if not, write to the Free Software Foundation,
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
 *
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
 * or visit www.oracle.com if you need additional information or have any
 * questions.
 */

/*
 */

/*
 * (C) Copyright Taligent, Inc. 1996, 1997 - All Rights Reserved
 * (C) Copyright IBM Corp. 1996 - 1998 - All Rights Reserved
 *
 * The original version of this source code and documentation
 * is copyrighted and owned by Taligent, Inc., a wholly-owned
 * subsidiary of IBM. These materials are provided under terms
 * of a License Agreement between Taligent and Sun. This technology
 * is protected by multiple US and International patents.
 *
 * This notice and attribution to Taligent may not be removed.
 * Taligent is a registered trademark of Taligent, Inc.
 *
 */

package sun.text.resources;

import java.util.ListResourceBundle;

public class CollationData_th extends ListResourceBundle {

    protected final Object[][] getContents() {
        return new Object[][] {
            { "Rule",
                "! "                            // First turn on the SE Asian Vowel/Consonant
                                                // swapping rule
                + "& Z "                        // Put in all of the consonants, after Z
                + "< \u0E01 "                   //  KO KAI
                + "< \u0E02 "                   //  KHO KHAI
                + "< \u0E03 "                   //  KHO KHUAT
                + "< \u0E04 "                   //  KHO KHWAI
                + "< \u0E05 "                   //  KHO KHON
                + "< \u0E06 "                   //  KHO RAKHANG
                + "< \u0E07 "                   //  NGO NGU
                + "< \u0E08 "                   //  CHO CHAN
                + "< \u0E09 "                   //  CHO CHING
                + "< \u0E0A "                   //  CHO CHANG
                + "< \u0E0B "                   //  SO SO
                + "< \u0E0C "                   //  CHO CHOE
                + "< \u0E0D "                   //  YO YING
                + "< \u0E0E "                   //  DO CHADA
                + "< \u0E0F "                   //  TO PATAK
                + "< \u0E10 "                   //  THO THAN
                + "< \u0E11 "                   //  THO NANGMONTHO
                + "< \u0E12 "                   //  THO PHUTHAO
                + "< \u0E13 "                   //  NO NEN
                + "< \u0E14 "                   //  DO DEK
                + "< \u0E15 "                   //  TO TAO
                + "< \u0E16 "                   //  THO THUNG
                + "< \u0E17 "                   //  THO THAHAN
                + "< \u0E18 "                   //  THO THONG
                + "< \u0E19 "                   //  NO NU
                + "< \u0E1A "                   //  BO BAIMAI
                + "< \u0E1B "                   //  PO PLA
                + "< \u0E1C "                   //  PHO PHUNG
                + "< \u0E1D "                   //  FO FA
                + "< \u0E1E "                   //  PHO PHAN
                + "< \u0E1F "                   //  FO FAN
                + "< \u0E20 "                   //  PHO SAMPHAO
                + "< \u0E21 "                   //  MO MA
                + "< \u0E22 "                   //  YO YAK
                + "< \u0E23 "                   //  RO RUA
                + "< \u0E24 "                   //  RU
                + "< \u0E25 "                   //  LO LING
                + "< \u0E26 "                   //  LU
                + "< \u0E27 "                   //  WO WAEN
                + "< \u0E28 "                   //  SO SALA
                + "< \u0E29 "                   //  SO RUSI
                + "< \u0E2A "                   //  SO SUA
                + "< \u0E2B "                   //  HO HIP
                + "< \u0E2C "                   //  LO CHULA
                + "< \u0E2D "                   //  O ANG
                + "< \u0E2E "                   //  HO NOKHUK

                //
                // Normal vowels
                //
                + "< \u0E4D "                   //  NIKHAHIT
                + "< \u0E30 "                   //  SARA A
                + "< \u0E31 "                   //  MAI HAN-AKAT
                + "< \u0E32 "                   //  SARA AA

                // Normalizer will decompose this character to \u0e4d\u0e32.
                + "< \u0E33 = \u0E4D\u0E32 "                   //  SARA AM

                + "< \u0E34 "                   //  SARA I

                + "< \u0E35 "                   //  SARA II
                + "< \u0E36 "                   //  SARA UE
                + "< \u0E37 "                   //  SARA UEE
                + "< \u0E38 "                   //  SARA U
                + "< \u0E39 "                   //  SARA UU

                //
                // Preceding vowels
                //
                + "< \u0E40 "                   //  SARA E
                + "< \u0E41 "                   //  SARA AE
                + "< \u0E42 "                   //  SARA O
                + "< \u0E43 "                   //  SARA AI MAIMUAN
                + "< \u0E44 "                   //  SARA AI MAIMALAI


                //according to CLDR, it's after 0e44
                + "< \u0E3A "                   //  PHINTHU



                // This rare symbol comes after all characters.
                + "< \u0E45 "                   //  LAKKHANGYAO
                + "& \u0E32 , \0E45 "           // According to CLDR, 0E45 is after 0E32 in tertiary level




                // Below are thai puntuation marks and Tonal(Accent) marks. According to CLDR 1.9 and
                // ISO/IEC 14651, Annex C, C.2.1 Thai ordering principles, 0E2F to 0E5B are punctuaion marks that need to be ignored
                // in the first three leveles.  0E4E to 0E4B are tonal marks to be compared in secondary level.
                // In real implmentation, set puncutation marks in tertiary as there is no fourth level in Java.
                // Set all these special marks after \u0301, the accute accent.
                + "& \u0301 "   // acute accent

                //puncutation marks
                + ", \u0E2F "                   //  PAIYANNOI      (ellipsis, abbreviation)
                + ", \u0E46 "                   //  MAIYAMOK
                + ", \u0E4F "                   //  FONGMAN
                + ", \u0E5A "                   //  ANGKHANKHU
                + ", \u0E5B "                   //  KHOMUT

                //tonal marks
                + "; \u0E4E "                   //  YAMAKKAN
                + "; \u0E4C "                   //  THANTHAKHAT
                + "; \u0E47 "                   //  MAITAIKHU
                + "; \u0E48 "                   //  MAI EK
                + "; \u0E49 "                   //  MAI THO
                + "; \u0E4A "                   //  MAI TRI
                + "; \u0E4B "                   //  MAI CHATTAWA

                //
                // Digits are equal to their corresponding Arabic digits in the first level
                //
                + "& 0 = \u0E50 "                   //  DIGIT ZERO
                + "& 1 = \u0E51 "                   //  DIGIT ONE
                + "& 2 = \u0E52 "                   //  DIGIT TWO
                + "& 3 = \u0E53 "                   //  DIGIT THREE
                + "& 4 = \u0E54 "                   //  DIGIT FOUR
                + "& 5 = \u0E55 "                   //  DIGIT FIVE
                + "& 6 = \u0E56 "                   //  DIGIT SIX
                + "& 7 = \u0E57 "                   //  DIGIT SEVEN
                + "& 8 = \u0E58 "                   //  DIGIT EIGHT
                + "& 9 = \u0E59 "                   //  DIGIT NINE


            }
        };
    }
}