jdk/src/share/classes/sun/text/resources/CollationData_th.java
changeset 2 90ce3da70b43
child 5506 202f599c92aa
equal deleted inserted replaced
0:fd16c54261b3 2:90ce3da70b43
       
     1 /*
       
     2  * Portions Copyright 2005 Sun Microsystems, Inc.  All Rights Reserved.
       
     3  * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
       
     4  *
       
     5  * This code is free software; you can redistribute it and/or modify it
       
     6  * under the terms of the GNU General Public License version 2 only, as
       
     7  * published by the Free Software Foundation.  Sun designates this
       
     8  * particular file as subject to the "Classpath" exception as provided
       
     9  * by Sun in the LICENSE file that accompanied this code.
       
    10  *
       
    11  * This code is distributed in the hope that it will be useful, but WITHOUT
       
    12  * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
       
    13  * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
       
    14  * version 2 for more details (a copy is included in the LICENSE file that
       
    15  * accompanied this code).
       
    16  *
       
    17  * You should have received a copy of the GNU General Public License version
       
    18  * 2 along with this work; if not, write to the Free Software Foundation,
       
    19  * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
       
    20  *
       
    21  * Please contact Sun Microsystems, Inc., 4150 Network Circle, Santa Clara,
       
    22  * CA 95054 USA or visit www.sun.com if you need additional information or
       
    23  * have any questions.
       
    24  */
       
    25 
       
    26 /*
       
    27  */
       
    28 
       
    29 /*
       
    30  * (C) Copyright Taligent, Inc. 1996, 1997 - All Rights Reserved
       
    31  * (C) Copyright IBM Corp. 1996 - 1998 - All Rights Reserved
       
    32  *
       
    33  * The original version of this source code and documentation
       
    34  * is copyrighted and owned by Taligent, Inc., a wholly-owned
       
    35  * subsidiary of IBM. These materials are provided under terms
       
    36  * of a License Agreement between Taligent and Sun. This technology
       
    37  * is protected by multiple US and International patents.
       
    38  *
       
    39  * This notice and attribution to Taligent may not be removed.
       
    40  * Taligent is a registered trademark of Taligent, Inc.
       
    41  *
       
    42  */
       
    43 
       
    44 package sun.text.resources;
       
    45 
       
    46 import java.util.ListResourceBundle;
       
    47 
       
    /**
     * Collation rule data for Thai.
     *
     * <p>The bundle exposes a single entry keyed {@code "Rule"} whose value is a
     * rule string using the {@code !}, {@code &}, {@code <}, {@code ;} and
     * {@code =} operators (the tailoring syntax documented by
     * {@link java.text.RuleBasedCollator}).  NOTE(review): the consumer of the
     * {@code "Rule"} key is not visible in this file; presumably the collator
     * provider appends it to the default rules -- confirm against the caller.
     *
     * <p>The rule string is laid out in this order:
     * <ol>
     *   <li>{@code !} -- turns on the SE Asian vowel/consonant swapping rule;</li>
     *   <li>consonants, ordered after Latin {@code Z};</li>
     *   <li>normal vowels, preceding vowels, Thai digits and NIKHAHIT;</li>
     *   <li>Thai symbols, ordered after the right brace;</li>
     *   <li>YAMAKKAN and LAKKHANGYAO, plus the RU/LU + LAKKHANGYAO
     *       combinations treated as separate letters;</li>
     *   <li>tonal marks, as secondary differences after the acute accent;</li>
     *   <li>characters that are to be ignored, made equal to U+0001.</li>
     * </ol>
     */
    public class CollationData_th extends ListResourceBundle {

        /**
         * Returns the bundle contents: one {@code { "Rule", <rule string> }} pair.
         *
         * @return a newly allocated two-dimensional array holding the single
         *         key/value pair
         */
        @Override
        protected final Object[][] getContents() {
            return new Object[][] {
                { "Rule",
                    "! "                            // First turn on the SE Asian Vowel/Consonant
                                                    // swapping rule
                    + "& Z "                        // Put in all of the consonants, after Z
                    + "< \u0E01 "                   //  KO KAI
                    + "< \u0E02 "                   //  KHO KHAI
                    + "< \u0E03 "                   //  KHO KHUAT
                    + "< \u0E04 "                   //  KHO KHWAI
                    + "< \u0E05 "                   //  KHO KHON
                    + "< \u0E06 "                   //  KHO RAKHANG
                    + "< \u0E07 "                   //  NGO NGU
                    + "< \u0E08 "                   //  CHO CHAN
                    + "< \u0E09 "                   //  CHO CHING
                    + "< \u0E0A "                   //  CHO CHANG
                    + "< \u0E0B "                   //  SO SO
                    + "< \u0E0C "                   //  CHO CHOE
                    + "< \u0E0D "                   //  YO YING
                    + "< \u0E0E "                   //  DO CHADA
                    + "< \u0E0F "                   //  TO PATAK
                    + "< \u0E10 "                   //  THO THAN
                    + "< \u0E11 "                   //  THO NANGMONTHO
                    + "< \u0E12 "                   //  THO PHUTHAO
                    + "< \u0E13 "                   //  NO NEN
                    + "< \u0E14 "                   //  DO DEK
                    + "< \u0E15 "                   //  TO TAO
                    + "< \u0E16 "                   //  THO THUNG
                    + "< \u0E17 "                   //  THO THAHAN
                    + "< \u0E18 "                   //  THO THONG
                    + "< \u0E19 "                   //  NO NU
                    + "< \u0E1A "                   //  BO BAIMAI
                    + "< \u0E1B "                   //  PO PLA
                    + "< \u0E1C "                   //  PHO PHUNG
                    + "< \u0E1D "                   //  FO FA
                    + "< \u0E1E "                   //  PHO PHAN
                    + "< \u0E1F "                   //  FO FAN
                    + "< \u0E20 "                   //  PHO SAMPHAO
                    + "< \u0E21 "                   //  MO MA
                    + "< \u0E22 "                   //  YO YAK
                    + "< \u0E23 "                   //  RO RUA
                    + "< \u0E24 "                   //  RU
                    + "< \u0E25 "                   //  LO LING
                    + "< \u0E26 "                   //  LU
                    + "< \u0E27 "                   //  WO WAEN
                    + "< \u0E28 "                   //  SO SALA
                    + "< \u0E29 "                   //  SO RUSI
                    + "< \u0E2A "                   //  SO SUA
                    + "< \u0E2B "                   //  HO HIP
                    + "< \u0E2C "                   //  LO CHULA
                    + "< \u0E2D "                   //  O ANG
                    + "< \u0E2E "                   //  HO NOKHUK

                    //
                    // Normal vowels
                    //
                    + "< \u0E30 "                   //  SARA A
                    + "< \u0E31 "                   //  MAI HAN-AKAT
                    + "< \u0E32 "                   //  SARA AA

                    // Normalizer will decompose SARA AM to U+0E4D U+0E32.  This is
                    // a Bad Thing, because we want the separate characters to sort
                    // differently than this individual one.  Since there's no public
                    // way to set the decomposition to be used when creating a
                    // collator, there's no way around this right now.
                    // It's best to go ahead and leave the character in, because it
                    // occurs this way a lot more often than it occurs as separate
                    // characters.
                    + "< \u0E33 "                   //  SARA AM

                    + "< \u0E34 "                   //  SARA I

                    + "< \u0E35 "                   //  SARA II
                    + "< \u0E36 "                   //  SARA UE
                    + "< \u0E37 "                   //  SARA UEE
                    + "< \u0E38 "                   //  SARA U
                    + "< \u0E39 "                   //  SARA UU

                    //
                    // Preceding vowels
                    //
                    + "< \u0E40 "                   //  SARA E
                    + "< \u0E41 "                   //  SARA AE
                    + "< \u0E42 "                   //  SARA O
                    + "< \u0E43 "                   //  SARA AI MAIMUAN
                    + "< \u0E44 "                   //  SARA AI MAIMALAI

                    //
                    // Digits
                    //
                    + "< \u0E50 "                   //  DIGIT ZERO
                    + "< \u0E51 "                   //  DIGIT ONE
                    + "< \u0E52 "                   //  DIGIT TWO
                    + "< \u0E53 "                   //  DIGIT THREE
                    + "< \u0E54 "                   //  DIGIT FOUR
                    + "< \u0E55 "                   //  DIGIT FIVE
                    + "< \u0E56 "                   //  DIGIT SIX
                    + "< \u0E57 "                   //  DIGIT SEVEN
                    + "< \u0E58 "                   //  DIGIT EIGHT
                    + "< \u0E59 "                   //  DIGIT NINE

                    // Sort of a tonal mark, but maybe not really
                    + "< \u0E4D "                   //  NIKHAHIT

                    //
                    // Thai symbols are supposed to sort "after white space".
                    // This is treated as making them sort just after the normal
                    // Latin-1 symbols, which are in turn after the white space.
                    //
                    + "&'\u007d'"                   //  right-brace (quoted in the rule)
                    + "< \u0E2F "                   //  PAIYANNOI      (ellipsis, abbreviation)
                    + "< \u0E46 "                   //  MAIYAMOK
                    + "< \u0E4F "                   //  FONGMAN
                    + "< \u0E5A "                   //  ANGKHANKHU
                    + "< \u0E5B "                   //  KHOMUT
                    + "< \u0E3F "                   //  CURRENCY SYMBOL BAHT

                    // These symbols are supposed to be "after all characters"
                    + "< \u0E4E "                   //  YAMAKKAN

                    // This rare symbol also comes after all characters.  But when it
                    // is used in combination with RU and LU, the combination is
                    // treated as a separate letter, like "CH" sorting after "C" in
                    // traditional Spanish.
                    + "< \u0E45 "                   //  LAKKHANGYAO
                    + "& \u0E24 < \u0E24\u0E45 "    //  RU + LAKKHANGYAO sorts after RU
                    + "& \u0E26 < \u0E26\u0E45 "    //  LU + LAKKHANGYAO sorts after LU

                    // Tonal marks are primary ignorables but are treated as secondary
                    // differences
                    + "& \u0301 "                   //  acute accent
                    + "; \u0E47 "                   //  MAITAIKHU
                    + "; \u0E48 "                   //  MAI EK
                    + "; \u0E49 "                   //  MAI THO
                    + "; \u0E4A "                   //  MAI TRI
                    + "; \u0E4B "                   //  MAI CHATTAWA
                    + "; \u0E4C "                   //  THANTHAKHAT

                    // These are supposed to be ignored, so they are treated as controls
                    + "& \u0001 "
                    + "= \u0E3A "                   //  PHINTHU
                    + "= '.' "                      //  period
                }
            };
        }
    }