/*
 * Portions Copyright 2005 Sun Microsystems, Inc. All Rights Reserved.
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
 *
 * This code is free software; you can redistribute it and/or modify it
 * under the terms of the GNU General Public License version 2 only, as
 * published by the Free Software Foundation. Sun designates this
 * particular file as subject to the "Classpath" exception as provided
 * by Sun in the LICENSE file that accompanied this code.
 *
 * This code is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
 * version 2 for more details (a copy is included in the LICENSE file that
 * accompanied this code).
 *
 * You should have received a copy of the GNU General Public License version
 * 2 along with this work; if not, write to the Free Software Foundation,
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
 *
 * Please contact Sun Microsystems, Inc., 4150 Network Circle, Santa Clara,
 * CA 95054 USA or visit www.sun.com if you need additional information or
 * have any questions.
 */

/*
 */

/*
 * (C) Copyright Taligent, Inc. 1996, 1997 - All Rights Reserved
 * (C) Copyright IBM Corp. 1996 - 1998 - All Rights Reserved
 *
 * The original version of this source code and documentation
 * is copyrighted and owned by Taligent, Inc., a wholly-owned
 * subsidiary of IBM. These materials are provided under terms
 * of a License Agreement between Taligent and Sun. This technology
 * is protected by multiple US and International patents.
 *
 * This notice and attribution to Taligent may not be removed.
 * Taligent is a registered trademark of Taligent, Inc.
 *
 */

package sun.text.resources;

import java.util.ListResourceBundle;

/**
 * Thai ({@code th}) collation data, exposed as a {@link ListResourceBundle}.
 *
 * <p>The bundle holds a single entry, keyed {@code "Rule"}, whose value is
 * one long rule string assembled from the fragments below. The fragments use
 * the {@code &} (reset), {@code <} (primary difference), {@code ;}
 * (secondary difference) and {@code =} (identical) operators; the syntax is
 * presumably that of {@code java.text.RuleBasedCollator}, which is the
 * expected consumer of this bundle.
 *
 * <p>The rule text is data: every literal, including its embedded spaces,
 * is significant and must not be reformatted.
 */
public class CollationData_th extends ListResourceBundle {

    /**
     * Returns the bundle contents.
     *
     * @return a one-row table mapping the key {@code "Rule"} to the Thai
     *         collation rule string
     */
    @Override
    protected final Object[][] getContents() {
        return new Object[][] {
            { "Rule",
                "! "                            // First turn on the SE Asian Vowel/Consonant
                                                // swapping rule
                + "& Z "                        // Put in all of the consonants, after Z
                + "< \u0E01 "                   // KO KAI
                + "< \u0E02 "                   // KHO KHAI
                + "< \u0E03 "                   // KHO KHUAT
                + "< \u0E04 "                   // KHO KHWAI
                + "< \u0E05 "                   // KHO KHON
                + "< \u0E06 "                   // KHO RAKHANG
                + "< \u0E07 "                   // NGO NGU
                + "< \u0E08 "                   // CHO CHAN
                + "< \u0E09 "                   // CHO CHING
                + "< \u0E0A "                   // CHO CHANG
                + "< \u0E0B "                   // SO SO
                + "< \u0E0C "                   // CHO CHOE
                + "< \u0E0D "                   // YO YING
                + "< \u0E0E "                   // DO CHADA
                + "< \u0E0F "                   // TO PATAK
                + "< \u0E10 "                   // THO THAN
                + "< \u0E11 "                   // THO NANGMONTHO
                + "< \u0E12 "                   // THO PHUTHAO
                + "< \u0E13 "                   // NO NEN
                + "< \u0E14 "                   // DO DEK
                + "< \u0E15 "                   // TO TAO
                + "< \u0E16 "                   // THO THUNG
                + "< \u0E17 "                   // THO THAHAN
                + "< \u0E18 "                   // THO THONG
                + "< \u0E19 "                   // NO NU
                + "< \u0E1A "                   // BO BAIMAI
                + "< \u0E1B "                   // PO PLA
                + "< \u0E1C "                   // PHO PHUNG
                + "< \u0E1D "                   // FO FA
                + "< \u0E1E "                   // PHO PHAN
                + "< \u0E1F "                   // FO FAN
                + "< \u0E20 "                   // PHO SAMPHAO
                + "< \u0E21 "                   // MO MA
                + "< \u0E22 "                   // YO YAK
                + "< \u0E23 "                   // RO RUA
                + "< \u0E24 "                   // RU
                + "< \u0E25 "                   // LO LING
                + "< \u0E26 "                   // LU
                + "< \u0E27 "                   // WO WAEN
                + "< \u0E28 "                   // SO SALA
                + "< \u0E29 "                   // SO RUSI
                + "< \u0E2A "                   // SO SUA
                + "< \u0E2B "                   // HO HIP
                + "< \u0E2C "                   // LO CHULA
                + "< \u0E2D "                   // O ANG
                + "< \u0E2E "                   // HO NOKHUK

                //
                // Normal vowels
                //
                + "< \u0E30 "                   // SARA A
                + "< \u0E31 "                   // MAI HAN-AKAT
                + "< \u0E32 "                   // SARA AA

                // Normalizer will decompose this character to \u0e4d\u0e32. This is
                // a Bad Thing, because we want the separate characters to sort
                // differently than this individual one. Since there's no public way to
                // set the decomposition to be used when creating a collator, there's
                // no way around this right now.
                // It's best to go ahead and leave the character in, because it occurs
                // this way a lot more often than it occurs as separate characters.
                + "< \u0E33 "                   // SARA AM

                + "< \u0E34 "                   // SARA I

                + "< \u0E35 "                   // SARA II
                + "< \u0E36 "                   // SARA UE
                + "< \u0E37 "                   // SARA UEE
                + "< \u0E38 "                   // SARA U
                + "< \u0E39 "                   // SARA UU

                //
                // Preceding vowels
                //
                + "< \u0E40 "                   // SARA E
                + "< \u0E41 "                   // SARA AE
                + "< \u0E42 "                   // SARA O
                + "< \u0E43 "                   // SARA AI MAIMUAN
                + "< \u0E44 "                   // SARA AI MAIMALAI

                //
                // Digits
                //
                + "< \u0E50 "                   // DIGIT ZERO
                + "< \u0E51 "                   // DIGIT ONE
                + "< \u0E52 "                   // DIGIT TWO
                + "< \u0E53 "                   // DIGIT THREE
                + "< \u0E54 "                   // DIGIT FOUR
                + "< \u0E55 "                   // DIGIT FIVE
                + "< \u0E56 "                   // DIGIT SIX
                + "< \u0E57 "                   // DIGIT SEVEN
                + "< \u0E58 "                   // DIGIT EIGHT
                + "< \u0E59 "                   // DIGIT NINE

                // Sorta tonal marks, but maybe not really
                + "< \u0E4D "                   // NIKHAHIT

                //
                // Thai symbols are supposed to sort "after white space".
                // I'm treating this as making them sort just after the normal Latin-1
                // symbols, which are in turn after the white space.
                //
                + "&'\u007d'"                   // right-brace
                + "< \u0E2F "                   // PAIYANNOI (ellipsis, abbreviation)
                + "< \u0E46 "                   // MAIYAMOK
                + "< \u0E4F "                   // FONGMAN
                + "< \u0E5A "                   // ANGKHANKHU
                + "< \u0E5B "                   // KHOMUT
                + "< \u0E3F "                   // CURRENCY SYMBOL BAHT

                // These symbols are supposed to be "after all characters"
                + "< \u0E4E "                   // YAMAKKAN

                // This rare symbol also comes after all characters. But when it is
                // used in combination with RU and LU, the combination is treated as
                // a separate letter, ala "CH" sorting after "C" in traditional Spanish.
                + "< \u0E45 "                   // LAKKHANGYAO
                + "& \u0E24 < \u0E24\u0E45 "
                + "& \u0E26 < \u0E26\u0E45 "

                // Tonal marks are primary ignorables but are treated as secondary
                // differences
                + "& \u0301 "                   // acute accent
                + "; \u0E47 "                   // MAITAIKHU
                + "; \u0E48 "                   // MAI EK
                + "; \u0E49 "                   // MAI THO
                + "; \u0E4A "                   // MAI TRI
                + "; \u0E4B "                   // MAI CHATTAWA
                + "; \u0E4C "                   // THANTHAKHAT


                // These are supposed to be ignored, so I'm treating them as controls
                + "& \u0001 "
                + "= \u0E3A "                   // PHINTHU
                + "= '.' "                      // period
            }
        };
    }
}