jdk/src/share/classes/java/text/CollationRules.java
author alanb
Thu, 18 Aug 2011 16:47:20 +0100
changeset 10347 1c9efe1ec7d3
parent 5506 202f599c92aa
permissions -rw-r--r--
7015589: (spec) BufferedWriter.close leaves stream open if close of underlying Writer fails Reviewed-by: forax, mduigou
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
2
90ce3da70b43 Initial load
duke
parents:
diff changeset
     1
/*
5506
202f599c92aa 6943119: Rebrand source copyright notices
ohair
parents: 2
diff changeset
     2
 * Copyright (c) 1996, 2001, Oracle and/or its affiliates. All rights reserved.
2
90ce3da70b43 Initial load
duke
parents:
diff changeset
     3
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
90ce3da70b43 Initial load
duke
parents:
diff changeset
     4
 *
90ce3da70b43 Initial load
duke
parents:
diff changeset
     5
 * This code is free software; you can redistribute it and/or modify it
90ce3da70b43 Initial load
duke
parents:
diff changeset
     6
 * under the terms of the GNU General Public License version 2 only, as
5506
202f599c92aa 6943119: Rebrand source copyright notices
ohair
parents: 2
diff changeset
     7
 * published by the Free Software Foundation.  Oracle designates this
2
90ce3da70b43 Initial load
duke
parents:
diff changeset
     8
 * particular file as subject to the "Classpath" exception as provided
5506
202f599c92aa 6943119: Rebrand source copyright notices
ohair
parents: 2
diff changeset
     9
 * by Oracle in the LICENSE file that accompanied this code.
2
90ce3da70b43 Initial load
duke
parents:
diff changeset
    10
 *
90ce3da70b43 Initial load
duke
parents:
diff changeset
    11
 * This code is distributed in the hope that it will be useful, but WITHOUT
90ce3da70b43 Initial load
duke
parents:
diff changeset
    12
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
90ce3da70b43 Initial load
duke
parents:
diff changeset
    13
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
90ce3da70b43 Initial load
duke
parents:
diff changeset
    14
 * version 2 for more details (a copy is included in the LICENSE file that
90ce3da70b43 Initial load
duke
parents:
diff changeset
    15
 * accompanied this code).
90ce3da70b43 Initial load
duke
parents:
diff changeset
    16
 *
90ce3da70b43 Initial load
duke
parents:
diff changeset
    17
 * You should have received a copy of the GNU General Public License version
90ce3da70b43 Initial load
duke
parents:
diff changeset
    18
 * 2 along with this work; if not, write to the Free Software Foundation,
90ce3da70b43 Initial load
duke
parents:
diff changeset
    19
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
90ce3da70b43 Initial load
duke
parents:
diff changeset
    20
 *
5506
202f599c92aa 6943119: Rebrand source copyright notices
ohair
parents: 2
diff changeset
    21
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
202f599c92aa 6943119: Rebrand source copyright notices
ohair
parents: 2
diff changeset
    22
 * or visit www.oracle.com if you need additional information or have any
202f599c92aa 6943119: Rebrand source copyright notices
ohair
parents: 2
diff changeset
    23
 * questions.
2
90ce3da70b43 Initial load
duke
parents:
diff changeset
    24
 */
90ce3da70b43 Initial load
duke
parents:
diff changeset
    25
90ce3da70b43 Initial load
duke
parents:
diff changeset
    26
/*
90ce3da70b43 Initial load
duke
parents:
diff changeset
    27
 * (C) Copyright Taligent, Inc. 1996,1997 - All Rights Reserved
90ce3da70b43 Initial load
duke
parents:
diff changeset
    28
 * (C) Copyright IBM Corp. 1996, 1997 - All Rights Reserved
90ce3da70b43 Initial load
duke
parents:
diff changeset
    29
 *
90ce3da70b43 Initial load
duke
parents:
diff changeset
    30
 *   The original version of this source code and documentation is copyrighted
90ce3da70b43 Initial load
duke
parents:
diff changeset
    31
 * and owned by Taligent, Inc., a wholly-owned subsidiary of IBM. These
90ce3da70b43 Initial load
duke
parents:
diff changeset
    32
 * materials are provided under terms of a License Agreement between Taligent
90ce3da70b43 Initial load
duke
parents:
diff changeset
    33
 * and Sun. This technology is protected by multiple US and International
90ce3da70b43 Initial load
duke
parents:
diff changeset
    34
 * patents. This notice and attribution to Taligent may not be removed.
90ce3da70b43 Initial load
duke
parents:
diff changeset
    35
 *   Taligent is a registered trademark of Taligent, Inc.
90ce3da70b43 Initial load
duke
parents:
diff changeset
    36
 *
90ce3da70b43 Initial load
duke
parents:
diff changeset
    37
 */
90ce3da70b43 Initial load
duke
parents:
diff changeset
    38
90ce3da70b43 Initial load
duke
parents:
diff changeset
    39
package java.text;
90ce3da70b43 Initial load
duke
parents:
diff changeset
    40
/**
 * CollationRules contains the default en_US collation rules as a base
 * for building other collation tables.
 * <p>Note that decompositions are done before these rules are used,
 * so they do not have to contain accented characters, such as A-grave.
 * <p>The rule string uses the syntax documented on {@link RuleBasedCollator}:
 * <ul>
 * <li>{@code <} introduces a primary difference,</li>
 * <li>{@code ;} introduces a secondary difference,</li>
 * <li>{@code ,} introduces a tertiary difference,</li>
 * <li>{@code =} marks the following text as identical in strength,</li>
 * <li>{@code &} resets the insertion point to an existing entry.</li>
 * </ul>
 * Characters that are special to the rule syntax, and whitespace, are
 * enclosed in single quotes inside the rule text.
 * @see                RuleBasedCollator
 * @see                LocaleElements
 * @author             Helena Shih, Mark Davis
 */
final class CollationRules {
    /**
     * The default rule set, ordered from the fully ignorable characters,
     * through punctuation, symbols and digits, to the Latin letters.
     * <p>The value is wrapped in {@code new String(...)}, which means the
     * field is not a compile-time constant expression.
     * NOTE(review): this presumably keeps the large literal from being
     * inlined into referencing classes; confirm before removing the wrapper.
     */
    static final String DEFAULTRULES = new String(
        "" // no FRENCH accent order by default, add in French Delta
        // IGNORABLES (up to first < character)
        // COMPLETELY IGNORE format characters
        + "='\u200B'=\u200C=\u200D=\u200E=\u200F"
        // Control Characters
        + "=\u0000 =\u0001 =\u0002 =\u0003 =\u0004" // nul, soh, stx, etx, eot
        + "=\u0005 =\u0006 =\u0007 =\u0008 ='\u0009'" // enq, ack, bel, bs, ht
        + "='\u000b' =\u000e" // vt, so
        + "=\u000f ='\u0010' =\u0011 =\u0012 =\u0013" // si, dle, dc1, dc2, dc3
        + "=\u0014 =\u0015 =\u0016 =\u0017 =\u0018" // dc4, nak, syn, etb, can
        + "=\u0019 =\u001a =\u001b =\u001c =\u001d" // em, sub, esc, fs, gs
        + "=\u001e =\u001f =\u007f"                   // rs, us, del
        //....then the C1 Latin 1 reserved control codes
        + "=\u0080 =\u0081 =\u0082 =\u0083 =\u0084 =\u0085"
        + "=\u0086 =\u0087 =\u0088 =\u0089 =\u008a =\u008b"
        + "=\u008c =\u008d =\u008e =\u008f =\u0090 =\u0091"
        + "=\u0092 =\u0093 =\u0094 =\u0095 =\u0096 =\u0097"
        + "=\u0098 =\u0099 =\u009a =\u009b =\u009c =\u009d"
        + "=\u009e =\u009f"
        // IGNORE except for secondary, tertiary difference
        // Spaces
        + ";'\u0020';'\u00A0'"                  // spaces
        + ";'\u2000';'\u2001';'\u2002';'\u2003';'\u2004'"  // spaces
        + ";'\u2005';'\u2006';'\u2007';'\u2008';'\u2009'"  // spaces
        + ";'\u200A';'\u3000';'\uFEFF'"                // spaces
        + ";'\r' ;'\t' ;'\n';'\f';'\u000b'"  // whitespace

        // Non-spacing accents

        + ";\u0301"          // non-spacing acute accent
        + ";\u0300"          // non-spacing grave accent
        + ";\u0306"          // non-spacing breve accent
        + ";\u0302"          // non-spacing circumflex accent
        + ";\u030c"          // non-spacing caron/hacek accent
        + ";\u030a"          // non-spacing ring above accent
        + ";\u030d"          // non-spacing vertical line above
        + ";\u0308"          // non-spacing diaeresis accent
        + ";\u030b"          // non-spacing double acute accent
        + ";\u0303"          // non-spacing tilde accent
        + ";\u0307"          // non-spacing dot above/overdot accent
        + ";\u0304"          // non-spacing macron accent
        + ";\u0337"          // non-spacing short slash overlay (overstruck diacritic)
        + ";\u0327"          // non-spacing cedilla accent
        + ";\u0328"          // non-spacing ogonek accent
        + ";\u0323"          // non-spacing dot-below/underdot accent
        + ";\u0332"          // non-spacing underscore/underline accent
        // with the rest of the general diacritical marks in binary order
        + ";\u0305"          // non-spacing overscore/overline
        + ";\u0309"          // non-spacing hook above
        + ";\u030e"          // non-spacing double vertical line above
        + ";\u030f"          // non-spacing double grave
        + ";\u0310"          // non-spacing chandrabindu
        + ";\u0311"          // non-spacing inverted breve
        + ";\u0312"          // non-spacing turned comma above/cedilla above
        + ";\u0313"          // non-spacing comma above
        + ";\u0314"          // non-spacing reversed comma above
        + ";\u0315"          // non-spacing comma above right
        + ";\u0316"          // non-spacing grave below
        + ";\u0317"          // non-spacing acute below
        + ";\u0318"          // non-spacing left tack below
        + ";\u0319"          // non-spacing tack below
        + ";\u031a"          // non-spacing left angle above
        + ";\u031b"          // non-spacing horn
        + ";\u031c"          // non-spacing left half ring below
        + ";\u031d"          // non-spacing up tack below
        + ";\u031e"          // non-spacing down tack below
        + ";\u031f"          // non-spacing plus sign below
        + ";\u0320"          // non-spacing minus sign below
        + ";\u0321"          // non-spacing palatalized hook below
        + ";\u0322"          // non-spacing retroflex hook below
        + ";\u0324"          // non-spacing double dot below
        + ";\u0325"          // non-spacing ring below
        + ";\u0326"          // non-spacing comma below
        + ";\u0329"          // non-spacing vertical line below
        + ";\u032a"          // non-spacing bridge below
        + ";\u032b"          // non-spacing inverted double arch below
        + ";\u032c"          // non-spacing hacek below
        + ";\u032d"          // non-spacing circumflex below
        + ";\u032e"          // non-spacing breve below
        + ";\u032f"          // non-spacing inverted breve below
        + ";\u0330"          // non-spacing tilde below
        + ";\u0331"          // non-spacing macron below
        + ";\u0333"          // non-spacing double underscore
        + ";\u0334"          // non-spacing tilde overlay
        + ";\u0335"          // non-spacing short bar overlay
        + ";\u0336"          // non-spacing long bar overlay
        + ";\u0338"          // non-spacing long slash overlay
        + ";\u0339"          // non-spacing right half ring below
        + ";\u033a"          // non-spacing inverted bridge below
        + ";\u033b"          // non-spacing square below
        + ";\u033c"          // non-spacing seagull below
        + ";\u033d"          // non-spacing x above
        + ";\u033e"          // non-spacing vertical tilde
        + ";\u033f"          // non-spacing double overscore
        // The three entries below are deliberately left out of the rules;
        // each note names the mark it is equivalent to.
        //+ ";\u0340"          // non-spacing grave tone mark == \u0300
        //+ ";\u0341"          // non-spacing acute tone mark == \u0301
        + ";\u0342;"
        //+ "\u0343;" // == \u0313
        + "\u0344;\u0345;\u0360;\u0361"    // newer
        + ";\u0483;\u0484;\u0485;\u0486"    // Cyrillic accents

        + ";\u20D0;\u20D1;\u20D2"           // symbol accents
        + ";\u20D3;\u20D4;\u20D5"           // symbol accents
        + ";\u20D6;\u20D7;\u20D8"           // symbol accents
        + ";\u20D9;\u20DA;\u20DB"           // symbol accents
        + ";\u20DC;\u20DD;\u20DE"           // symbol accents
        + ";\u20DF;\u20E0;\u20E1"           // symbol accents

        + ",'\u002D';\u00AD"                // dashes
        + ";\u2010;\u2011;\u2012"           // dashes
        + ";\u2013;\u2014;\u2015"           // dashes
        + ";\u2212"                         // dashes

        // other punctuation

        + "<'\u005f'"        // underline/underscore (spacing)
        + "<\u00af"          // overline or macron (spacing)
        + "<'\u002c'"        // comma (spacing)
        + "<'\u003b'"        // semicolon
        + "<'\u003a'"        // colon
        + "<'\u0021'"        // exclamation point
        + "<\u00a1"          // inverted exclamation point
        + "<'\u003f'"        // question mark
        + "<\u00bf"          // inverted question mark
        + "<'\u002f'"        // slash
        + "<'\u002e'"        // period/full stop
        + "<\u00b4"          // acute accent (spacing)
        + "<'\u0060'"        // grave accent (spacing)
        + "<'\u005e'"        // circumflex accent (spacing)
        + "<\u00a8"          // diaeresis/umlaut accent (spacing)
        + "<'\u007e'"        // tilde accent (spacing)
        + "<\u00b7"          // middle dot (spacing)
        + "<\u00b8"          // cedilla accent (spacing)
        + "<'\u0027'"        // apostrophe
        + "<'\"'"            // quotation marks
        + "<\u00ab"          // left angle quotes
        + "<\u00bb"          // right angle quotes
        + "<'\u0028'"        // left parenthesis
        + "<'\u0029'"        // right parenthesis
        + "<'\u005b'"        // left bracket
        + "<'\u005d'"        // right bracket
        + "<'\u007b'"        // left brace
        + "<'\u007d'"        // right brace
        + "<\u00a7"          // section symbol
        + "<\u00b6"          // paragraph symbol
        + "<\u00a9"          // copyright symbol
        + "<\u00ae"          // registered trademark symbol
        + "<'\u0040'"          // at sign
        + "<\u00a4"          // international currency symbol
        + "<\u0e3f"          // baht sign
        + "<\u00a2"          // cent sign
        + "<\u20a1"          // colon sign
        + "<\u20a2"          // cruzeiro sign
        + "<'\u0024'"        // dollar sign
        + "<\u20ab"          // dong sign
        + "<\u20ac"          // euro sign
        + "<\u20a3"          // franc sign
        + "<\u20a4"          // lira sign
        + "<\u20a5"          // mill sign
        + "<\u20a6"          // naira sign
        + "<\u20a7"          // peseta sign
        + "<\u00a3"          // pound-sterling sign
        + "<\u20a8"          // rupee sign
        + "<\u20aa"          // new shekel sign
        + "<\u20a9"          // won sign
        + "<\u00a5"          // yen sign
        + "<'\u002a'"        // asterisk
        + "<'\\'"            // backslash
        + "<'\u0026'"        // ampersand
        + "<'\u0023'"        // number sign
        + "<'\u0025'"        // percent sign
        + "<'\u002b'"        // plus sign
        + "<\u00b1"          // plus-or-minus sign
        + "<\u00f7"          // divide sign
        + "<\u00d7"          // multiply sign
        + "<'\u003c'"        // less-than sign
        + "<'\u003d'"        // equal sign
        + "<'\u003e'"        // greater-than sign
        + "<\u00ac"          // end of line symbol/logical NOT symbol
        + "<'\u007c'"          // vertical line/logical OR symbol
        + "<\u00a6"          // broken vertical line
        + "<\u00b0"          // degree symbol
        + "<\u00b5"          // micro symbol

        // NUMERICS

        + "<0<1<2<3<4<5<6<7<8<9"
        + "<\u00bc<\u00bd<\u00be"   // 1/4,1/2,3/4 fractions

        // NON-IGNORABLES
        + "<a,A"
        + "<b,B"
        + "<c,C"
        + "<d,D"
        + "<\u00F0,\u00D0"                  // eth
        + "<e,E"
        + "<f,F"
        + "<g,G"
        + "<h,H"
        + "<i,I"
        + "<j,J"
        + "<k,K"
        + "<l,L"
        + "<m,M"
        + "<n,N"
        + "<o,O"
        + "<p,P"
        + "<q,Q"
        + "<r,R"
        + "<s, S & SS,\u00DF"             // s-zet
        + "<t,T"
        + "& TH, \u00DE &TH, \u00FE "     // thorn
        + "<u,U"
        + "<v,V"
        + "<w,W"
        + "<x,X"
        + "<y,Y"
        + "<z,Z"
        + "&AE,\u00C6"                    // ae & AE ligature
        + "&AE,\u00E6"
        + "&OE,\u0152"                    // oe & OE ligature
        + "&OE,\u0153"
    );
}