author | ihse |
Mon, 25 Sep 2017 10:32:00 +0200 | |
changeset 47253 | 92fd0e04e0e1 |
parent 47216 | 71c04702a3d5 |
child 50045 | d9d55f64d136 |
permissions | -rw-r--r-- |
2 | 1 |
/* |
31680 | 2 |
* Copyright (c) 2003, 2015, Oracle and/or its affiliates. All rights reserved. |
2 | 3 |
* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. |
4 |
* |
|
5 |
* This code is free software; you can redistribute it and/or modify it |
|
6 |
* under the terms of the GNU General Public License version 2 only, as |
|
5506 | 7 |
* published by the Free Software Foundation. Oracle designates this |
2 | 8 |
* particular file as subject to the "Classpath" exception as provided |
5506 | 9 |
* by Oracle in the LICENSE file that accompanied this code. |
2 | 10 |
* |
11 |
* This code is distributed in the hope that it will be useful, but WITHOUT |
|
12 |
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or |
|
13 |
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License |
|
14 |
* version 2 for more details (a copy is included in the LICENSE file that |
|
15 |
* accompanied this code). |
|
16 |
* |
|
17 |
* You should have received a copy of the GNU General Public License version |
|
18 |
* 2 along with this work; if not, write to the Free Software Foundation, |
|
19 |
* Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. |
|
20 |
* |
|
5506 | 21 |
* Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA |
22 |
* or visit www.oracle.com if you need additional information or have any |
|
23 |
* questions. |
|
2 | 24 |
*/ |
25 |
||
26 |
package java.lang; |
|
27 |
||
28 |
/** The CharacterData class encapsulates the large tables once found in
 *  java.lang.Character.
 */
|
31 |
||
32 |
class CharacterData01 extends CharacterData { |
|
33 |
/* The character properties are currently encoded into 32 bits in the following manner:
    1 bit   mirrored property
    4 bits  directionality property
    9 bits  signed offset used for converting case
    1 bit   if 1, adding the signed offset converts the character to lowercase
    1 bit   if 1, subtracting the signed offset converts the character to uppercase
    1 bit   if 1, this character has a titlecase equivalent (possibly itself)
    3 bits  0  may not be part of an identifier
            1  ignorable control; may continue a Unicode identifier or Java identifier
            2  may continue a Java identifier but not a Unicode identifier (unused)
            3  may continue a Unicode identifier or Java identifier
            4  is a Java whitespace character
            5  may start or continue a Java identifier;
               may continue but not start a Unicode identifier (underscores)
            6  may start or continue a Java identifier but not a Unicode identifier ($)
            7  may start or continue a Unicode identifier or Java identifier
            Thus:
               5, 6, 7 may start a Java identifier
               1, 2, 3, 5, 6, 7 may continue a Java identifier
               7 may start a Unicode identifier
               1, 3, 5, 7 may continue a Unicode identifier
               1 is ignorable within an identifier
               4 is Java whitespace
    2 bits  0  this character has no numeric property
            1  adding the digit offset to the character code and then
               masking with 0x1F will produce the desired numeric value
            2  this character has a "strange" numeric value
            3  a Java supradecimal digit: adding the digit offset to the
               character code, then masking with 0x1F, then adding 10
               will produce the desired numeric value
    5 bits  digit offset
    5 bits  character type

    The encoding of character properties is subject to change at any time.
 */
|
68 |
||
69 |
int getProperties(int ch) { |
|
70 |
char offset = (char)ch; |
|
71 |
int props = $$Lookup(offset); |
|
72 |
return props; |
|
73 |
} |
|
74 |
||
9535
d930011fd275
7037261: j.l.Character.isLowerCase/isUpperCase need to match the Unicode Standard
sherman
parents:
7247
diff
changeset
|
75 |
int getPropertiesEx(int ch) { |
d930011fd275
7037261: j.l.Character.isLowerCase/isUpperCase need to match the Unicode Standard
sherman
parents:
7247
diff
changeset
|
76 |
char offset = (char)ch; |
d930011fd275
7037261: j.l.Character.isLowerCase/isUpperCase need to match the Unicode Standard
sherman
parents:
7247
diff
changeset
|
77 |
int props = $$LookupEx(offset); |
d930011fd275
7037261: j.l.Character.isLowerCase/isUpperCase need to match the Unicode Standard
sherman
parents:
7247
diff
changeset
|
78 |
return props; |
d930011fd275
7037261: j.l.Character.isLowerCase/isUpperCase need to match the Unicode Standard
sherman
parents:
7247
diff
changeset
|
79 |
} |
d930011fd275
7037261: j.l.Character.isLowerCase/isUpperCase need to match the Unicode Standard
sherman
parents:
7247
diff
changeset
|
80 |
|
2 | 81 |
int getType(int ch) { |
82 |
int props = getProperties(ch); |
|
83 |
return (props & $$maskType); |
|
84 |
} |
|
85 |
||
9535
d930011fd275
7037261: j.l.Character.isLowerCase/isUpperCase need to match the Unicode Standard
sherman
parents:
7247
diff
changeset
|
86 |
boolean isOtherLowercase(int ch) { |
d930011fd275
7037261: j.l.Character.isLowerCase/isUpperCase need to match the Unicode Standard
sherman
parents:
7247
diff
changeset
|
87 |
int props = getPropertiesEx(ch); |
d930011fd275
7037261: j.l.Character.isLowerCase/isUpperCase need to match the Unicode Standard
sherman
parents:
7247
diff
changeset
|
88 |
return (props & $$maskOtherLowercase) != 0; |
d930011fd275
7037261: j.l.Character.isLowerCase/isUpperCase need to match the Unicode Standard
sherman
parents:
7247
diff
changeset
|
89 |
} |
d930011fd275
7037261: j.l.Character.isLowerCase/isUpperCase need to match the Unicode Standard
sherman
parents:
7247
diff
changeset
|
90 |
|
d930011fd275
7037261: j.l.Character.isLowerCase/isUpperCase need to match the Unicode Standard
sherman
parents:
7247
diff
changeset
|
91 |
boolean isOtherUppercase(int ch) { |
d930011fd275
7037261: j.l.Character.isLowerCase/isUpperCase need to match the Unicode Standard
sherman
parents:
7247
diff
changeset
|
92 |
int props = getPropertiesEx(ch); |
d930011fd275
7037261: j.l.Character.isLowerCase/isUpperCase need to match the Unicode Standard
sherman
parents:
7247
diff
changeset
|
93 |
return (props & $$maskOtherUppercase) != 0; |
d930011fd275
7037261: j.l.Character.isLowerCase/isUpperCase need to match the Unicode Standard
sherman
parents:
7247
diff
changeset
|
94 |
} |
d930011fd275
7037261: j.l.Character.isLowerCase/isUpperCase need to match the Unicode Standard
sherman
parents:
7247
diff
changeset
|
95 |
|
d930011fd275
7037261: j.l.Character.isLowerCase/isUpperCase need to match the Unicode Standard
sherman
parents:
7247
diff
changeset
|
96 |
boolean isOtherAlphabetic(int ch) { |
d930011fd275
7037261: j.l.Character.isLowerCase/isUpperCase need to match the Unicode Standard
sherman
parents:
7247
diff
changeset
|
97 |
int props = getPropertiesEx(ch); |
d930011fd275
7037261: j.l.Character.isLowerCase/isUpperCase need to match the Unicode Standard
sherman
parents:
7247
diff
changeset
|
98 |
return (props & $$maskOtherAlphabetic) != 0; |
d930011fd275
7037261: j.l.Character.isLowerCase/isUpperCase need to match the Unicode Standard
sherman
parents:
7247
diff
changeset
|
99 |
} |
d930011fd275
7037261: j.l.Character.isLowerCase/isUpperCase need to match the Unicode Standard
sherman
parents:
7247
diff
changeset
|
100 |
|
d930011fd275
7037261: j.l.Character.isLowerCase/isUpperCase need to match the Unicode Standard
sherman
parents:
7247
diff
changeset
|
101 |
boolean isIdeographic(int ch) { |
d930011fd275
7037261: j.l.Character.isLowerCase/isUpperCase need to match the Unicode Standard
sherman
parents:
7247
diff
changeset
|
102 |
int props = getPropertiesEx(ch); |
d930011fd275
7037261: j.l.Character.isLowerCase/isUpperCase need to match the Unicode Standard
sherman
parents:
7247
diff
changeset
|
103 |
return (props & $$maskIdeographic) != 0; |
d930011fd275
7037261: j.l.Character.isLowerCase/isUpperCase need to match the Unicode Standard
sherman
parents:
7247
diff
changeset
|
104 |
} |
d930011fd275
7037261: j.l.Character.isLowerCase/isUpperCase need to match the Unicode Standard
sherman
parents:
7247
diff
changeset
|
105 |
|
2 | 106 |
boolean isJavaIdentifierStart(int ch) { |
107 |
int props = getProperties(ch); |
|
108 |
return ((props & $$maskIdentifierInfo) >= $$lowJavaStart); |
|
109 |
} |
|
110 |
||
111 |
boolean isJavaIdentifierPart(int ch) { |
|
112 |
int props = getProperties(ch); |
|
113 |
return ((props & $$nonzeroJavaPart) != 0); |
|
114 |
} |
|
115 |
||
116 |
boolean isUnicodeIdentifierStart(int ch) { |
|
117 |
int props = getProperties(ch); |
|
118 |
return ((props & $$maskIdentifierInfo) == $$valueUnicodeStart); |
|
119 |
} |
|
120 |
||
121 |
boolean isUnicodeIdentifierPart(int ch) { |
|
122 |
int props = getProperties(ch); |
|
123 |
return ((props & $$maskUnicodePart) != 0); |
|
124 |
} |
|
125 |
||
126 |
boolean isIdentifierIgnorable(int ch) { |
|
127 |
int props = getProperties(ch); |
|
128 |
return ((props & $$maskIdentifierInfo) == $$valueIgnorable); |
|
129 |
} |
|
130 |
||
131 |
int toLowerCase(int ch) { |
|
132 |
int mapChar = ch; |
|
133 |
int val = getProperties(ch); |
|
134 |
||
135 |
if ((val & $$maskLowerCase) != 0) { |
|
136 |
int offset = val << $$shiftCaseOffsetSign >> ($$shiftCaseOffsetSign+$$shiftCaseOffset); |
|
137 |
mapChar = ch + offset; |
|
138 |
} |
|
139 |
return mapChar; |
|
140 |
} |
|
141 |
||
142 |
int toUpperCase(int ch) { |
|
143 |
int mapChar = ch; |
|
144 |
int val = getProperties(ch); |
|
145 |
||
146 |
if ((val & $$maskUpperCase) != 0) { |
|
147 |
int offset = val << $$shiftCaseOffsetSign >> ($$shiftCaseOffsetSign+$$shiftCaseOffset); |
|
148 |
mapChar = ch - offset; |
|
149 |
} |
|
150 |
return mapChar; |
|
151 |
} |
|
152 |
||
153 |
int toTitleCase(int ch) { |
|
154 |
int mapChar = ch; |
|
155 |
int val = getProperties(ch); |
|
156 |
||
157 |
if ((val & $$maskTitleCase) != 0) { |
|
158 |
// There is a titlecase equivalent. Perform further checks: |
|
159 |
if ((val & $$maskUpperCase) == 0) { |
|
160 |
// The character does not have an uppercase equivalent, so it must |
|
161 |
// already be uppercase; so add 1 to get the titlecase form. |
|
162 |
mapChar = ch + 1; |
|
163 |
} |
|
164 |
else if ((val & $$maskLowerCase) == 0) { |
|
165 |
// The character does not have a lowercase equivalent, so it must |
|
166 |
// already be lowercase; so subtract 1 to get the titlecase form. |
|
167 |
mapChar = ch - 1; |
|
168 |
} |
|
169 |
// else { |
|
170 |
// The character has both an uppercase equivalent and a lowercase |
|
171 |
// equivalent, so it must itself be a titlecase form; return it. |
|
172 |
// return ch; |
|
173 |
//} |
|
174 |
} |
|
175 |
else if ((val & $$maskUpperCase) != 0) { |
|
176 |
// This character has no titlecase equivalent but it does have an |
|
177 |
// uppercase equivalent, so use that (subtract the signed case offset). |
|
178 |
mapChar = toUpperCase(ch); |
|
179 |
} |
|
180 |
return mapChar; |
|
181 |
} |
|
182 |
||
183 |
int digit(int ch, int radix) { |
|
184 |
int value = -1; |
|
185 |
if (radix >= Character.MIN_RADIX && radix <= Character.MAX_RADIX) { |
|
186 |
int val = getProperties(ch); |
|
187 |
int kind = val & $$maskType; |
|
188 |
if (kind == Character.DECIMAL_DIGIT_NUMBER) { |
|
189 |
value = ch + ((val & $$maskDigitOffset) >> $$shiftDigitOffset) & $$maskDigit; |
|
190 |
} |
|
191 |
else if ((val & $$maskNumericType) == $$valueJavaSupradecimal) { |
|
192 |
// Java supradecimal digit |
|
193 |
value = (ch + ((val & $$maskDigitOffset) >> $$shiftDigitOffset) & $$maskDigit) + 10; |
|
194 |
} |
|
195 |
} |
|
196 |
return (value < radix) ? value : -1; |
|
197 |
} |
|
198 |
||
199 |
int getNumericValue(int ch) { |
|
200 |
int val = getProperties(ch); |
|
201 |
int retval = -1; |
|
202 |
||
203 |
switch (val & $$maskNumericType) { |
|
204 |
default: // cannot occur |
|
205 |
case ($$valueNotNumeric): // not numeric |
|
206 |
retval = -1; |
|
207 |
break; |
|
208 |
case ($$valueDigit): // simple numeric |
|
209 |
retval = ch + ((val & $$maskDigitOffset) >> $$shiftDigitOffset) & $$maskDigit; |
|
210 |
break; |
|
211 |
case ($$valueStrangeNumeric) : // "strange" numeric |
|
212 |
switch(ch) { |
|
213 |
case 0x10113: retval = 40; break; // AEGEAN NUMBER FORTY |
|
214 |
case 0x10114: retval = 50; break; // AEGEAN NUMBER FIFTY |
|
215 |
case 0x10115: retval = 60; break; // AEGEAN NUMBER SIXTY |
|
216 |
case 0x10116: retval = 70; break; // AEGEAN NUMBER SEVENTY |
|
217 |
case 0x10117: retval = 80; break; // AEGEAN NUMBER EIGHTY |
|
218 |
case 0x10118: retval = 90; break; // AEGEAN NUMBER NINETY |
|
219 |
case 0x10119: retval = 100; break; // AEGEAN NUMBER ONE HUNDRED |
|
220 |
case 0x1011A: retval = 200; break; // AEGEAN NUMBER TWO HUNDRED |
|
221 |
case 0x1011B: retval = 300; break; // AEGEAN NUMBER THREE HUNDRED |
|
222 |
case 0x1011C: retval = 400; break; // AEGEAN NUMBER FOUR HUNDRED |
|
223 |
case 0x1011D: retval = 500; break; // AEGEAN NUMBER FIVE HUNDRED |
|
224 |
case 0x1011E: retval = 600; break; // AEGEAN NUMBER SIX HUNDRED |
|
225 |
case 0x1011F: retval = 700; break; // AEGEAN NUMBER SEVEN HUNDRED |
|
226 |
case 0x10120: retval = 800; break; // AEGEAN NUMBER EIGHT HUNDRED |
|
227 |
case 0x10121: retval = 900; break; // AEGEAN NUMBER NINE HUNDRED |
|
228 |
case 0x10122: retval = 1000; break; // AEGEAN NUMBER ONE THOUSAND |
|
229 |
case 0x10123: retval = 2000; break; // AEGEAN NUMBER TWO THOUSAND |
|
230 |
case 0x10124: retval = 3000; break; // AEGEAN NUMBER THREE THOUSAND |
|
231 |
case 0x10125: retval = 4000; break; // AEGEAN NUMBER FOUR THOUSAND |
|
232 |
case 0x10126: retval = 5000; break; // AEGEAN NUMBER FIVE THOUSAND |
|
233 |
case 0x10127: retval = 6000; break; // AEGEAN NUMBER SIX THOUSAND |
|
234 |
case 0x10128: retval = 7000; break; // AEGEAN NUMBER SEVEN THOUSAND |
|
235 |
case 0x10129: retval = 8000; break; // AEGEAN NUMBER EIGHT THOUSAND |
|
236 |
case 0x1012A: retval = 9000; break; // AEGEAN NUMBER NINE THOUSAND |
|
237 |
case 0x1012B: retval = 10000; break; // AEGEAN NUMBER TEN THOUSAND |
|
238 |
case 0x1012C: retval = 20000; break; // AEGEAN NUMBER TWENTY THOUSAND |
|
239 |
case 0x1012D: retval = 30000; break; // AEGEAN NUMBER THIRTY THOUSAND |
|
240 |
case 0x1012E: retval = 40000; break; // AEGEAN NUMBER FORTY THOUSAND |
|
241 |
case 0x1012F: retval = 50000; break; // AEGEAN NUMBER FIFTY THOUSAND |
|
242 |
case 0x10130: retval = 60000; break; // AEGEAN NUMBER SIXTY THOUSAND |
|
243 |
case 0x10131: retval = 70000; break; // AEGEAN NUMBER SEVENTY THOUSAND |
|
244 |
case 0x10132: retval = 80000; break; // AEGEAN NUMBER EIGHTY THOUSAND |
|
245 |
case 0x10133: retval = 90000; break; // AEGEAN NUMBER NINETY THOUSAND |
|
33242 | 246 |
case 0x10144: retval = 50; break; // GREEK ACROPHONIC ATTIC FIFTY |
247 |
case 0x10145: retval = 500; break; // GREEK ACROPHONIC ATTIC FIVE HUNDRED |
|
248 |
case 0x10146: retval = 5000; break; // GREEK ACROPHONIC ATTIC FIVE THOUSAND |
|
249 |
case 0x10147: retval = 50000; break; // GREEK ACROPHONIC ATTIC FIFTY THOUSAND |
|
250 |
case 0x1014A: retval = 50; break; // GREEK ACROPHONIC ATTIC FIFTY TALENTS |
|
251 |
case 0x1014B: retval = 100; break; // GREEK ACROPHONIC ATTIC ONE HUNDRED TALENTS |
|
252 |
case 0x1014C: retval = 500; break; // GREEK ACROPHONIC ATTIC FIVE HUNDRED TALENTS |
|
253 |
case 0x1014D: retval = 1000; break; // GREEK ACROPHONIC ATTIC ONE THOUSAND TALENTS |
|
254 |
case 0x1014E: retval = 5000; break; // GREEK ACROPHONIC ATTIC FIVE THOUSAND TALENTS |
|
255 |
case 0x10151: retval = 50; break; // GREEK ACROPHONIC ATTIC FIFTY STATERS |
|
256 |
case 0x10152: retval = 100; break; // GREEK ACROPHONIC ATTIC ONE HUNDRED STATERS |
|
257 |
case 0x10153: retval = 500; break; // GREEK ACROPHONIC ATTIC FIVE HUNDRED STATERS |
|
258 |
case 0x10154: retval = 1000; break; // GREEK ACROPHONIC ATTIC ONE THOUSAND STATERS |
|
259 |
case 0x10155: retval = 10000; break; // GREEK ACROPHONIC ATTIC TEN THOUSAND STATERS |
|
260 |
case 0x10156: retval = 50000; break; // GREEK ACROPHONIC ATTIC FIFTY THOUSAND STATERS |
|
261 |
case 0x10166: retval = 50; break; // GREEK ACROPHONIC TROEZENIAN FIFTY |
|
262 |
case 0x10167: retval = 50; break; // GREEK ACROPHONIC TROEZENIAN FIFTY ALTERNATE FORM |
|
263 |
case 0x10168: retval = 50; break; // GREEK ACROPHONIC HERMIONIAN FIFTY |
|
264 |
case 0x10169: retval = 50; break; // GREEK ACROPHONIC THESPIAN FIFTY |
|
265 |
case 0x1016A: retval = 100; break; // GREEK ACROPHONIC THESPIAN ONE HUNDRED |
|
266 |
case 0x1016B: retval = 300; break; // GREEK ACROPHONIC THESPIAN THREE HUNDRED |
|
267 |
case 0x1016C: retval = 500; break; // GREEK ACROPHONIC EPIDAUREAN FIVE HUNDRED |
|
268 |
case 0x1016D: retval = 500; break; // GREEK ACROPHONIC TROEZENIAN FIVE HUNDRED |
|
269 |
case 0x1016E: retval = 500; break; // GREEK ACROPHONIC THESPIAN FIVE HUNDRED |
|
270 |
case 0x1016F: retval = 500; break; // GREEK ACROPHONIC CARYSTIAN FIVE HUNDRED |
|
271 |
case 0x10170: retval = 500; break; // GREEK ACROPHONIC NAXIAN FIVE HUNDRED |
|
272 |
case 0x10171: retval = 1000; break; // GREEK ACROPHONIC THESPIAN ONE THOUSAND |
|
273 |
case 0x10172: retval = 5000; break; // GREEK ACROPHONIC THESPIAN FIVE THOUSAND |
|
274 |
case 0x10174: retval = 50; break; // GREEK ACROPHONIC STRATIAN FIFTY MNAS |
|
31680 | 275 |
case 0x102ED: retval = 40; break; // COPTIC EPACT NUMBER FORTY |
276 |
case 0x102EE: retval = 50; break; // COPTIC EPACT NUMBER FIFTY |
|
277 |
case 0x102EF: retval = 60; break; // COPTIC EPACT NUMBER SIXTY |
|
278 |
case 0x102F0: retval = 70; break; // COPTIC EPACT NUMBER SEVENTY |
|
279 |
case 0x102F1: retval = 80; break; // COPTIC EPACT NUMBER EIGHTY |
|
280 |
case 0x102F2: retval = 90; break; // COPTIC EPACT NUMBER NINETY |
|
281 |
case 0x102F3: retval = 100; break; // COPTIC EPACT NUMBER ONE HUNDRED |
|
282 |
case 0x102F4: retval = 200; break; // COPTIC EPACT NUMBER TWO HUNDRED |
|
283 |
case 0x102F5: retval = 300; break; // COPTIC EPACT NUMBER THREE HUNDRED |
|
284 |
case 0x102F6: retval = 400; break; // COPTIC EPACT NUMBER FOUR HUNDRED |
|
285 |
case 0x102F7: retval = 500; break; // COPTIC EPACT NUMBER FIVE HUNDRED |
|
286 |
case 0x102F8: retval = 600; break; // COPTIC EPACT NUMBER SIX HUNDRED |
|
287 |
case 0x102F9: retval = 700; break; // COPTIC EPACT NUMBER SEVEN HUNDRED |
|
288 |
case 0x102FA: retval = 800; break; // COPTIC EPACT NUMBER EIGHT HUNDRED |
|
289 |
case 0x102FB: retval = 900; break; // COPTIC EPACT NUMBER NINE HUNDRED |
|
33242 | 290 |
case 0x10323: retval = 50; break; // OLD ITALIC NUMERAL FIFTY |
31680 | 291 |
case 0x10341: retval = 90; break; // GOTHIC LETTER NINETY |
292 |
case 0x1034A: retval = 900; break; // GOTHIC LETTER NINE HUNDRED |
|
293 |
case 0x103D5: retval = 100; break; // OLD PERSIAN NUMBER HUNDRED |
|
294 |
case 0x1085D: retval = 100; break; // IMPERIAL ARAMAIC NUMBER ONE HUNDRED |
|
295 |
case 0x1085E: retval = 1000; break; // IMPERIAL ARAMAIC NUMBER ONE THOUSAND |
|
296 |
case 0x1085F: retval = 10000; break; // IMPERIAL ARAMAIC NUMBER TEN THOUSAND |
|
297 |
case 0x108AF: retval = 100; break; // NABATAEAN NUMBER ONE HUNDRED |
|
33242 | 298 |
case 0x108FF: retval = 100; break; // HATRAN NUMBER ONE HUNDRED |
31680 | 299 |
case 0x10919: retval = 100; break; // PHOENICIAN NUMBER ONE HUNDRED |
33242 | 300 |
case 0x109CC: retval = 40; break; // MEROITIC CURSIVE NUMBER FORTY |
301 |
case 0x109CD: retval = 50; break; // MEROITIC CURSIVE NUMBER FIFTY |
|
302 |
case 0x109CE: retval = 60; break; // MEROITIC CURSIVE NUMBER SIXTY |
|
303 |
case 0x109CF: retval = 70; break; // MEROITIC CURSIVE NUMBER SEVENTY |
|
304 |
case 0x109D2: retval = 100; break; // MEROITIC CURSIVE NUMBER ONE HUNDRED |
|
305 |
case 0x109D3: retval = 200; break; // MEROITIC CURSIVE NUMBER TWO HUNDRED |
|
306 |
case 0x109D4: retval = 300; break; // MEROITIC CURSIVE NUMBER THREE HUNDRED |
|
307 |
case 0x109D5: retval = 400; break; // MEROITIC CURSIVE NUMBER FOUR HUNDRED |
|
308 |
case 0x109D6: retval = 500; break; // MEROITIC CURSIVE NUMBER FIVE HUNDRED |
|
309 |
case 0x109D7: retval = 600; break; // MEROITIC CURSIVE NUMBER SIX HUNDRED |
|
310 |
case 0x109D8: retval = 700; break; // MEROITIC CURSIVE NUMBER SEVEN HUNDRED |
|
311 |
case 0x109D9: retval = 800; break; // MEROITIC CURSIVE NUMBER EIGHT HUNDRED |
|
312 |
case 0x109DA: retval = 900; break; // MEROITIC CURSIVE NUMBER NINE HUNDRED |
|
313 |
case 0x109DB: retval = 1000; break; // MEROITIC CURSIVE NUMBER ONE THOUSAND |
|
314 |
case 0x109DC: retval = 2000; break; // MEROITIC CURSIVE NUMBER TWO THOUSAND |
|
315 |
case 0x109DD: retval = 3000; break; // MEROITIC CURSIVE NUMBER THREE THOUSAND |
|
316 |
case 0x109DE: retval = 4000; break; // MEROITIC CURSIVE NUMBER FOUR THOUSAND |
|
317 |
case 0x109DF: retval = 5000; break; // MEROITIC CURSIVE NUMBER FIVE THOUSAND |
|
318 |
case 0x109E0: retval = 6000; break; // MEROITIC CURSIVE NUMBER SIX THOUSAND |
|
319 |
case 0x109E1: retval = 7000; break; // MEROITIC CURSIVE NUMBER SEVEN THOUSAND |
|
320 |
case 0x109E2: retval = 8000; break; // MEROITIC CURSIVE NUMBER EIGHT THOUSAND |
|
321 |
case 0x109E3: retval = 9000; break; // MEROITIC CURSIVE NUMBER NINE THOUSAND |
|
322 |
case 0x109E4: retval = 10000; break; // MEROITIC CURSIVE NUMBER TEN THOUSAND |
|
323 |
case 0x109E5: retval = 20000; break; // MEROITIC CURSIVE NUMBER TWENTY THOUSAND |
|
324 |
case 0x109E6: retval = 30000; break; // MEROITIC CURSIVE NUMBER THIRTY THOUSAND |
|
325 |
case 0x109E7: retval = 40000; break; // MEROITIC CURSIVE NUMBER FORTY THOUSAND |
|
326 |
case 0x109E8: retval = 50000; break; // MEROITIC CURSIVE NUMBER FIFTY THOUSAND |
|
327 |
case 0x109E9: retval = 60000; break; // MEROITIC CURSIVE NUMBER SIXTY THOUSAND |
|
328 |
case 0x109EA: retval = 70000; break; // MEROITIC CURSIVE NUMBER SEVENTY THOUSAND |
|
329 |
case 0x109EB: retval = 80000; break; // MEROITIC CURSIVE NUMBER EIGHTY THOUSAND |
|
330 |
case 0x109EC: retval = 90000; break; // MEROITIC CURSIVE NUMBER NINETY THOUSAND |
|
331 |
case 0x109ED: retval = 100000; break; // MEROITIC CURSIVE NUMBER ONE HUNDRED THOUSAND |
|
332 |
case 0x109EE: retval = 200000; break; // MEROITIC CURSIVE NUMBER TWO HUNDRED THOUSAND |
|
333 |
case 0x109EF: retval = 300000; break; // MEROITIC CURSIVE NUMBER THREE HUNDRED THOUSAND |
|
334 |
case 0x109F0: retval = 400000; break; // MEROITIC CURSIVE NUMBER FOUR HUNDRED THOUSAND |
|
335 |
case 0x109F1: retval = 500000; break; // MEROITIC CURSIVE NUMBER FIVE HUNDRED THOUSAND |
|
336 |
case 0x109F2: retval = 600000; break; // MEROITIC CURSIVE NUMBER SIX HUNDRED THOUSAND |
|
337 |
case 0x109F3: retval = 700000; break; // MEROITIC CURSIVE NUMBER SEVEN HUNDRED THOUSAND |
|
338 |
case 0x109F4: retval = 800000; break; // MEROITIC CURSIVE NUMBER EIGHT HUNDRED THOUSAND |
|
339 |
case 0x109F5: retval = 900000; break; // MEROITIC CURSIVE NUMBER NINE HUNDRED THOUSAND |
|
31680 | 340 |
case 0x10A46: retval = 100; break; // KHAROSHTHI NUMBER ONE HUNDRED |
341 |
case 0x10A47: retval = 1000; break; // KHAROSHTHI NUMBER ONE THOUSAND |
|
342 |
case 0x10A7E: retval = 50; break; // OLD SOUTH ARABIAN NUMBER FIFTY |
|
343 |
case 0x10AEF: retval = 100; break; // MANICHAEAN NUMBER ONE HUNDRED |
|
344 |
case 0x10B5E: retval = 100; break; // INSCRIPTIONAL PARTHIAN NUMBER ONE HUNDRED |
|
345 |
case 0x10B5F: retval = 1000; break; // INSCRIPTIONAL PARTHIAN NUMBER ONE THOUSAND |
|
346 |
case 0x10B7E: retval = 100; break; // INSCRIPTIONAL PAHLAVI NUMBER ONE HUNDRED |
|
347 |
case 0x10B7F: retval = 1000; break; // INSCRIPTIONAL PAHLAVI NUMBER ONE THOUSAND |
|
348 |
case 0x10BAF: retval = 100; break; // PSALTER PAHLAVI NUMBER ONE HUNDRED |
|
33242 | 349 |
case 0x10CFD: retval = 50; break; // OLD HUNGARIAN NUMBER FIFTY |
350 |
case 0x10CFE: retval = 100; break; // OLD HUNGARIAN NUMBER ONE HUNDRED |
|
351 |
case 0x10CFF: retval = 1000; break; // OLD HUNGARIAN NUMBER ONE THOUSAND |
|
31680 | 352 |
case 0x10E6C: retval = 40; break; // RUMI NUMBER FORTY |
353 |
case 0x10E6D: retval = 50; break; // RUMI NUMBER FIFTY |
|
354 |
case 0x10E6E: retval = 60; break; // RUMI NUMBER SIXTY |
|
355 |
case 0x10E6F: retval = 70; break; // RUMI NUMBER SEVENTY |
|
356 |
case 0x10E70: retval = 80; break; // RUMI NUMBER EIGHTY |
|
357 |
case 0x10E71: retval = 90; break; // RUMI NUMBER NINETY |
|
358 |
case 0x10E72: retval = 100; break; // RUMI NUMBER ONE HUNDRED |
|
359 |
case 0x10E73: retval = 200; break; // RUMI NUMBER TWO HUNDRED |
|
360 |
case 0x10E74: retval = 300; break; // RUMI NUMBER THREE HUNDRED |
|
361 |
case 0x10E75: retval = 400; break; // RUMI NUMBER FOUR HUNDRED |
|
362 |
case 0x10E76: retval = 500; break; // RUMI NUMBER FIVE HUNDRED |
|
363 |
case 0x10E77: retval = 600; break; // RUMI NUMBER SIX HUNDRED |
|
364 |
case 0x10E78: retval = 700; break; // RUMI NUMBER SEVEN HUNDRED |
|
365 |
case 0x10E79: retval = 800; break; // RUMI NUMBER EIGHT HUNDRED |
|
366 |
case 0x10E7A: retval = 900; break; // RUMI NUMBER NINE HUNDRED |
|
367 |
case 0x1105E: retval = 40; break; // BRAHMI NUMBER FORTY |
|
368 |
case 0x1105F: retval = 50; break; // BRAHMI NUMBER FIFTY |
|
369 |
case 0x11060: retval = 60; break; // BRAHMI NUMBER SIXTY |
|
370 |
case 0x11061: retval = 70; break; // BRAHMI NUMBER SEVENTY |
|
371 |
case 0x11062: retval = 80; break; // BRAHMI NUMBER EIGHTY |
|
372 |
case 0x11063: retval = 90; break; // BRAHMI NUMBER NINETY |
|
373 |
case 0x11064: retval = 100; break; // BRAHMI NUMBER ONE HUNDRED |
|
374 |
case 0x11065: retval = 1000; break; // BRAHMI NUMBER ONE THOUSAND |
|
375 |
case 0x111ED: retval = 40; break; // SINHALA ARCHAIC NUMBER FORTY |
|
376 |
case 0x111EE: retval = 50; break; // SINHALA ARCHAIC NUMBER FIFTY |
|
377 |
case 0x111EF: retval = 60; break; // SINHALA ARCHAIC NUMBER SIXTY |
|
378 |
case 0x111F0: retval = 70; break; // SINHALA ARCHAIC NUMBER SEVENTY |
|
379 |
case 0x111F1: retval = 80; break; // SINHALA ARCHAIC NUMBER EIGHTY |
|
380 |
case 0x111F2: retval = 90; break; // SINHALA ARCHAIC NUMBER NINETY |
|
381 |
case 0x111F3: retval = 100; break; // SINHALA ARCHAIC NUMBER ONE HUNDRED |
|
382 |
case 0x111F4: retval = 1000; break; // SINHALA ARCHAIC NUMBER ONE THOUSAND |
|
383 |
case 0x118ED: retval = 40; break; // WARANG CITI NUMBER FORTY |
|
384 |
case 0x118EE: retval = 50; break; // WARANG CITI NUMBER FIFTY |
|
385 |
case 0x118EF: retval = 60; break; // WARANG CITI NUMBER SIXTY |
|
386 |
case 0x118F0: retval = 70; break; // WARANG CITI NUMBER SEVENTY |
|
387 |
case 0x118F1: retval = 80; break; // WARANG CITI NUMBER EIGHTY |
|
388 |
case 0x118F2: retval = 90; break; // WARANG CITI NUMBER NINETY |
|
389 |
case 0x12432: retval = 216000; break; // CUNEIFORM NUMERIC SIGN SHAR2 TIMES GAL PLUS DISH |
|
390 |
case 0x12433: retval = 432000; break; // CUNEIFORM NUMERIC SIGN SHAR2 TIMES GAL PLUS MIN |
|
391 |
case 0x12467: retval = 40; break; // CUNEIFORM NUMERIC SIGN ELAMITE FORTY |
|
392 |
case 0x12468: retval = 50; break; // CUNEIFORM NUMERIC SIGN ELAMITE FIFTY |
|
393 |
case 0x16B5C: retval = 100; break; // PAHAWH HMONG NUMBER HUNDREDS |
|
394 |
case 0x16B5D: retval = 10000; break; // PAHAWH HMONG NUMBER TEN THOUSANDS |
|
395 |
case 0x16B5E: retval = 1000000; break; // PAHAWH HMONG NUMBER MILLIONS |
|
396 |
case 0x16B5F: retval = 100000000; break;// PAHAWH HMONG NUMBER HUNDRED MILLIONS |
|
397 |
case 0x1D36C: retval = 40; break; // COUNTING ROD TENS DIGIT FOUR |
|
398 |
case 0x1D36D: retval = 50; break; // COUNTING ROD TENS DIGIT FIVE |
|
399 |
case 0x1D36E: retval = 60; break; // COUNTING ROD TENS DIGIT SIX |
|
400 |
case 0x1D36F: retval = 70; break; // COUNTING ROD TENS DIGIT SEVEN |
|
401 |
case 0x1D370: retval = 80; break; // COUNTING ROD TENS DIGIT EIGHT |
|
402 |
case 0x1D371: retval = 90; break; // COUNTING ROD TENS DIGIT NINE |
|
2 | 403 |
default: retval = -2; break; |
404 |
} |
|
405 |
||
406 |
break; |
|
407 |
case ($$valueJavaSupradecimal): // Java supradecimal |
|
408 |
retval = (ch + ((val & $$maskDigitOffset) >> $$shiftDigitOffset) & $$maskDigit) + 10; |
|
409 |
break; |
|
410 |
} |
|
411 |
return retval; |
|
412 |
} |
|
413 |
||
414 |
boolean isWhitespace(int ch) { |
|
415 |
int props = getProperties(ch); |
|
416 |
return ((props & $$maskIdentifierInfo) == $$valueJavaWhitespace); |
|
417 |
} |
|
418 |
||
419 |
byte getDirectionality(int ch) { |
|
420 |
int val = getProperties(ch); |
|
421 |
byte directionality = (byte)((val & $$maskBidi) >> $$shiftBidi); |
|
422 |
if (directionality == 0xF ) { |
|
423 |
directionality = Character.DIRECTIONALITY_UNDEFINED; |
|
424 |
} |
|
425 |
return directionality; |
|
426 |
} |
|
427 |
||
428 |
boolean isMirrored(int ch) { |
|
429 |
int props = getProperties(ch); |
|
430 |
return ((props & $$maskMirrored) != 0); |
|
431 |
} |
|
432 |
||
433 |
/** The single shared instance of this class. */
static final CharacterData instance = new CharacterData01();

/** Private: the only instance is the {@code instance} field above. */
private CharacterData01() {}

// Template placeholder; presumably replaced by the generated lookup-table
// declarations when this template is expanded -- confirm against the generator.
$$Tables

static {
    // Template placeholder; presumably replaced by the generated
    // table-initialisation statements -- confirm against the generator.
    $$Initializers
}
|
441 |
} |