src/java.base/share/classes/java/util/regex/ASCII.java
changeset 47216 71c04702a3d5
parent 25859 3317bb8137f4
equal deleted inserted replaced
47215:4ebc2e2fb97c 47216:71c04702a3d5
       
     1 /*
       
     2  * Copyright (c) 1999, 2000, Oracle and/or its affiliates. All rights reserved.
       
     3  * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
       
     4  *
       
     5  * This code is free software; you can redistribute it and/or modify it
       
     6  * under the terms of the GNU General Public License version 2 only, as
       
     7  * published by the Free Software Foundation.  Oracle designates this
       
     8  * particular file as subject to the "Classpath" exception as provided
       
     9  * by Oracle in the LICENSE file that accompanied this code.
       
    10  *
       
    11  * This code is distributed in the hope that it will be useful, but WITHOUT
       
    12  * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
       
    13  * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
       
    14  * version 2 for more details (a copy is included in the LICENSE file that
       
    15  * accompanied this code).
       
    16  *
       
    17  * You should have received a copy of the GNU General Public License version
       
    18  * 2 along with this work; if not, write to the Free Software Foundation,
       
    19  * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
       
    20  *
       
    21  * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
       
    22  * or visit www.oracle.com if you need additional information or have any
       
    23  * questions.
       
    24  */
       
    25 
       
    26 package java.util.regex;
       
    27 
       
    28 
       
    29 /**
       
    30  * Utility class that implements the standard C ctype functionality.
       
    31  *
       
    32  * @author Hong Zhang
       
    33  */
       
    34 
       
    35 final class ASCII {
       
    36 
       
    37     static final int UPPER   = 0x00000100;
       
    38 
       
    39     static final int LOWER   = 0x00000200;
       
    40 
       
    41     static final int DIGIT   = 0x00000400;
       
    42 
       
    43     static final int SPACE   = 0x00000800;
       
    44 
       
    45     static final int PUNCT   = 0x00001000;
       
    46 
       
    47     static final int CNTRL   = 0x00002000;
       
    48 
       
    49     static final int BLANK   = 0x00004000;
       
    50 
       
    51     static final int HEX     = 0x00008000;
       
    52 
       
    53     static final int UNDER   = 0x00010000;
       
    54 
       
    55     static final int ASCII   = 0x0000FF00;
       
    56 
       
    57     static final int ALPHA   = (UPPER|LOWER);
       
    58 
       
    59     static final int ALNUM   = (UPPER|LOWER|DIGIT);
       
    60 
       
    61     static final int GRAPH   = (PUNCT|UPPER|LOWER|DIGIT);
       
    62 
       
    63     static final int WORD    = (UPPER|LOWER|UNDER|DIGIT);
       
    64 
       
    65     static final int XDIGIT  = (HEX);
       
    66 
       
    67     private static final int[] ctype = new int[] {
       
    68         CNTRL,                  /* 00 (NUL) */
       
    69         CNTRL,                  /* 01 (SOH) */
       
    70         CNTRL,                  /* 02 (STX) */
       
    71         CNTRL,                  /* 03 (ETX) */
       
    72         CNTRL,                  /* 04 (EOT) */
       
    73         CNTRL,                  /* 05 (ENQ) */
       
    74         CNTRL,                  /* 06 (ACK) */
       
    75         CNTRL,                  /* 07 (BEL) */
       
    76         CNTRL,                  /* 08 (BS)  */
       
    77         SPACE+CNTRL+BLANK,      /* 09 (HT)  */
       
    78         SPACE+CNTRL,            /* 0A (LF)  */
       
    79         SPACE+CNTRL,            /* 0B (VT)  */
       
    80         SPACE+CNTRL,            /* 0C (FF)  */
       
    81         SPACE+CNTRL,            /* 0D (CR)  */
       
    82         CNTRL,                  /* 0E (SI)  */
       
    83         CNTRL,                  /* 0F (SO)  */
       
    84         CNTRL,                  /* 10 (DLE) */
       
    85         CNTRL,                  /* 11 (DC1) */
       
    86         CNTRL,                  /* 12 (DC2) */
       
    87         CNTRL,                  /* 13 (DC3) */
       
    88         CNTRL,                  /* 14 (DC4) */
       
    89         CNTRL,                  /* 15 (NAK) */
       
    90         CNTRL,                  /* 16 (SYN) */
       
    91         CNTRL,                  /* 17 (ETB) */
       
    92         CNTRL,                  /* 18 (CAN) */
       
    93         CNTRL,                  /* 19 (EM)  */
       
    94         CNTRL,                  /* 1A (SUB) */
       
    95         CNTRL,                  /* 1B (ESC) */
       
    96         CNTRL,                  /* 1C (FS)  */
       
    97         CNTRL,                  /* 1D (GS)  */
       
    98         CNTRL,                  /* 1E (RS)  */
       
    99         CNTRL,                  /* 1F (US)  */
       
   100         SPACE+BLANK,            /* 20 SPACE */
       
   101         PUNCT,                  /* 21 !     */
       
   102         PUNCT,                  /* 22 "     */
       
   103         PUNCT,                  /* 23 #     */
       
   104         PUNCT,                  /* 24 $     */
       
   105         PUNCT,                  /* 25 %     */
       
   106         PUNCT,                  /* 26 &     */
       
   107         PUNCT,                  /* 27 '     */
       
   108         PUNCT,                  /* 28 (     */
       
   109         PUNCT,                  /* 29 )     */
       
   110         PUNCT,                  /* 2A *     */
       
   111         PUNCT,                  /* 2B +     */
       
   112         PUNCT,                  /* 2C ,     */
       
   113         PUNCT,                  /* 2D -     */
       
   114         PUNCT,                  /* 2E .     */
       
   115         PUNCT,                  /* 2F /     */
       
   116         DIGIT+HEX+0,            /* 30 0     */
       
   117         DIGIT+HEX+1,            /* 31 1     */
       
   118         DIGIT+HEX+2,            /* 32 2     */
       
   119         DIGIT+HEX+3,            /* 33 3     */
       
   120         DIGIT+HEX+4,            /* 34 4     */
       
   121         DIGIT+HEX+5,            /* 35 5     */
       
   122         DIGIT+HEX+6,            /* 36 6     */
       
   123         DIGIT+HEX+7,            /* 37 7     */
       
   124         DIGIT+HEX+8,            /* 38 8     */
       
   125         DIGIT+HEX+9,            /* 39 9     */
       
   126         PUNCT,                  /* 3A :     */
       
   127         PUNCT,                  /* 3B ;     */
       
   128         PUNCT,                  /* 3C <     */
       
   129         PUNCT,                  /* 3D =     */
       
   130         PUNCT,                  /* 3E >     */
       
   131         PUNCT,                  /* 3F ?     */
       
   132         PUNCT,                  /* 40 @     */
       
   133         UPPER+HEX+10,           /* 41 A     */
       
   134         UPPER+HEX+11,           /* 42 B     */
       
   135         UPPER+HEX+12,           /* 43 C     */
       
   136         UPPER+HEX+13,           /* 44 D     */
       
   137         UPPER+HEX+14,           /* 45 E     */
       
   138         UPPER+HEX+15,           /* 46 F     */
       
   139         UPPER+16,               /* 47 G     */
       
   140         UPPER+17,               /* 48 H     */
       
   141         UPPER+18,               /* 49 I     */
       
   142         UPPER+19,               /* 4A J     */
       
   143         UPPER+20,               /* 4B K     */
       
   144         UPPER+21,               /* 4C L     */
       
   145         UPPER+22,               /* 4D M     */
       
   146         UPPER+23,               /* 4E N     */
       
   147         UPPER+24,               /* 4F O     */
       
   148         UPPER+25,               /* 50 P     */
       
   149         UPPER+26,               /* 51 Q     */
       
   150         UPPER+27,               /* 52 R     */
       
   151         UPPER+28,               /* 53 S     */
       
   152         UPPER+29,               /* 54 T     */
       
   153         UPPER+30,               /* 55 U     */
       
   154         UPPER+31,               /* 56 V     */
       
   155         UPPER+32,               /* 57 W     */
       
   156         UPPER+33,               /* 58 X     */
       
   157         UPPER+34,               /* 59 Y     */
       
   158         UPPER+35,               /* 5A Z     */
       
   159         PUNCT,                  /* 5B [     */
       
   160         PUNCT,                  /* 5C \     */
       
   161         PUNCT,                  /* 5D ]     */
       
   162         PUNCT,                  /* 5E ^     */
       
   163         PUNCT|UNDER,            /* 5F _     */
       
   164         PUNCT,                  /* 60 `     */
       
   165         LOWER+HEX+10,           /* 61 a     */
       
   166         LOWER+HEX+11,           /* 62 b     */
       
   167         LOWER+HEX+12,           /* 63 c     */
       
   168         LOWER+HEX+13,           /* 64 d     */
       
   169         LOWER+HEX+14,           /* 65 e     */
       
   170         LOWER+HEX+15,           /* 66 f     */
       
   171         LOWER+16,               /* 67 g     */
       
   172         LOWER+17,               /* 68 h     */
       
   173         LOWER+18,               /* 69 i     */
       
   174         LOWER+19,               /* 6A j     */
       
   175         LOWER+20,               /* 6B k     */
       
   176         LOWER+21,               /* 6C l     */
       
   177         LOWER+22,               /* 6D m     */
       
   178         LOWER+23,               /* 6E n     */
       
   179         LOWER+24,               /* 6F o     */
       
   180         LOWER+25,               /* 70 p     */
       
   181         LOWER+26,               /* 71 q     */
       
   182         LOWER+27,               /* 72 r     */
       
   183         LOWER+28,               /* 73 s     */
       
   184         LOWER+29,               /* 74 t     */
       
   185         LOWER+30,               /* 75 u     */
       
   186         LOWER+31,               /* 76 v     */
       
   187         LOWER+32,               /* 77 w     */
       
   188         LOWER+33,               /* 78 x     */
       
   189         LOWER+34,               /* 79 y     */
       
   190         LOWER+35,               /* 7A z     */
       
   191         PUNCT,                  /* 7B {     */
       
   192         PUNCT,                  /* 7C |     */
       
   193         PUNCT,                  /* 7D }     */
       
   194         PUNCT,                  /* 7E ~     */
       
   195         CNTRL,                  /* 7F (DEL) */
       
   196     };
       
   197 
       
   198     static int getType(int ch) {
       
   199         return ((ch & 0xFFFFFF80) == 0 ? ctype[ch] : 0);
       
   200     }
       
   201 
       
   202     static boolean isType(int ch, int type) {
       
   203         return (getType(ch) & type) != 0;
       
   204     }
       
   205 
       
   206     static boolean isAscii(int ch) {
       
   207         return ((ch & 0xFFFFFF80) == 0);
       
   208     }
       
   209 
       
   210     static boolean isAlpha(int ch) {
       
   211         return isType(ch, ALPHA);
       
   212     }
       
   213 
       
   214     static boolean isDigit(int ch) {
       
   215         return ((ch-'0')|('9'-ch)) >= 0;
       
   216     }
       
   217 
       
   218     static boolean isAlnum(int ch) {
       
   219         return isType(ch, ALNUM);
       
   220     }
       
   221 
       
   222     static boolean isGraph(int ch) {
       
   223         return isType(ch, GRAPH);
       
   224     }
       
   225 
       
   226     static boolean isPrint(int ch) {
       
   227         return ((ch-0x20)|(0x7E-ch)) >= 0;
       
   228     }
       
   229 
       
   230     static boolean isPunct(int ch) {
       
   231         return isType(ch, PUNCT);
       
   232     }
       
   233 
       
   234     static boolean isSpace(int ch) {
       
   235         return isType(ch, SPACE);
       
   236     }
       
   237 
       
   238     static boolean isHexDigit(int ch) {
       
   239         return isType(ch, HEX);
       
   240     }
       
   241 
       
   242     static boolean isOctDigit(int ch) {
       
   243         return ((ch-'0')|('7'-ch)) >= 0;
       
   244     }
       
   245 
       
   246     static boolean isCntrl(int ch) {
       
   247         return isType(ch, CNTRL);
       
   248     }
       
   249 
       
   250     static boolean isLower(int ch) {
       
   251         return ((ch-'a')|('z'-ch)) >= 0;
       
   252     }
       
   253 
       
   254     static boolean isUpper(int ch) {
       
   255         return ((ch-'A')|('Z'-ch)) >= 0;
       
   256     }
       
   257 
       
   258     static boolean isWord(int ch) {
       
   259         return isType(ch, WORD);
       
   260     }
       
   261 
       
   262     static int toDigit(int ch) {
       
   263         return (ctype[ch & 0x7F] & 0x3F);
       
   264     }
       
   265 
       
   266     static int toLower(int ch) {
       
   267         return isUpper(ch) ? (ch + 0x20) : ch;
       
   268     }
       
   269 
       
   270     static int toUpper(int ch) {
       
   271         return isLower(ch) ? (ch - 0x20) : ch;
       
   272     }
       
   273 
       
   274 }