1 /*
   2  * Copyright (c) 2011, Oracle and/or its affiliates. All rights reserved.
   3  * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
   4  *
   5  * This code is free software; you can redistribute it and/or modify it
   6  * under the terms of the GNU General Public License version 2 only, as
   7  * published by the Free Software Foundation.
   8  *
   9  * This code is distributed in the hope that it will be useful, but WITHOUT
  10  * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  11  * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  12  * version 2 for more details (a copy is included in the LICENSE file that
  13  * accompanied this code).
  14  *
  15  * You should have received a copy of the GNU General Public License version
  16  * 2 along with this work; if not, write to the Free Software Foundation,
  17  * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
  18  *
  19  * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
  20  * or visit www.oracle.com if you need additional information or have any
  21  * questions.
  22  */
  23 
  24 
  25 final class POSIX_ASCII {
  26 
  27     static final int UPPER   = 0x00000100;
  28 
  29     static final int LOWER   = 0x00000200;
  30 
  31     static final int DIGIT   = 0x00000400;
  32 
  33     static final int SPACE   = 0x00000800;
  34 
  35     static final int PUNCT   = 0x00001000;
  36 
  37     static final int CNTRL   = 0x00002000;
  38 
  39     static final int BLANK   = 0x00004000;
  40 
  41     static final int HEX     = 0x00008000;
  42 
  43     static final int UNDER   = 0x00010000;
  44 
  45     static final int ASCII   = 0x0000FF00;
  46 
  47     static final int ALPHA   = (UPPER|LOWER);
  48 
  49     static final int ALNUM   = (UPPER|LOWER|DIGIT);
  50 
  51     static final int GRAPH   = (PUNCT|UPPER|LOWER|DIGIT);
  52 
  53     static final int WORD    = (UPPER|LOWER|UNDER|DIGIT);
  54 
  55     static final int XDIGIT  = (HEX);
  56 
  57     private static final int[] ctype = new int[] {
  58         CNTRL,                  /* 00 (NUL) */
  59         CNTRL,                  /* 01 (SOH) */
  60         CNTRL,                  /* 02 (STX) */
  61         CNTRL,                  /* 03 (ETX) */
  62         CNTRL,                  /* 04 (EOT) */
  63         CNTRL,                  /* 05 (ENQ) */
  64         CNTRL,                  /* 06 (ACK) */
  65         CNTRL,                  /* 07 (BEL) */
  66         CNTRL,                  /* 08 (BS)  */
  67         SPACE+CNTRL+BLANK,      /* 09 (HT)  */
  68         SPACE+CNTRL,            /* 0A (LF)  */
  69         SPACE+CNTRL,            /* 0B (VT)  */
  70         SPACE+CNTRL,            /* 0C (FF)  */
  71         SPACE+CNTRL,            /* 0D (CR)  */
  72         CNTRL,                  /* 0E (SI)  */
  73         CNTRL,                  /* 0F (SO)  */
  74         CNTRL,                  /* 10 (DLE) */
  75         CNTRL,                  /* 11 (DC1) */
  76         CNTRL,                  /* 12 (DC2) */
  77         CNTRL,                  /* 13 (DC3) */
  78         CNTRL,                  /* 14 (DC4) */
  79         CNTRL,                  /* 15 (NAK) */
  80         CNTRL,                  /* 16 (SYN) */
  81         CNTRL,                  /* 17 (ETB) */
  82         CNTRL,                  /* 18 (CAN) */
  83         CNTRL,                  /* 19 (EM)  */
  84         CNTRL,                  /* 1A (SUB) */
  85         CNTRL,                  /* 1B (ESC) */
  86         CNTRL,                  /* 1C (FS)  */
  87         CNTRL,                  /* 1D (GS)  */
  88         CNTRL,                  /* 1E (RS)  */
  89         CNTRL,                  /* 1F (US)  */
  90         SPACE+BLANK,            /* 20 SPACE */
  91         PUNCT,                  /* 21 !     */
  92         PUNCT,                  /* 22 "     */
  93         PUNCT,                  /* 23 #     */
  94         PUNCT,                  /* 24 $     */
  95         PUNCT,                  /* 25 %     */
  96         PUNCT,                  /* 26 &     */
  97         PUNCT,                  /* 27 '     */
  98         PUNCT,                  /* 28 (     */
  99         PUNCT,                  /* 29 )     */
 100         PUNCT,                  /* 2A *     */
 101         PUNCT,                  /* 2B +     */
 102         PUNCT,                  /* 2C ,     */
 103         PUNCT,                  /* 2D -     */
 104         PUNCT,                  /* 2E .     */
 105         PUNCT,                  /* 2F /     */
 106         DIGIT+HEX+0,            /* 30 0     */
 107         DIGIT+HEX+1,            /* 31 1     */
 108         DIGIT+HEX+2,            /* 32 2     */
 109         DIGIT+HEX+3,            /* 33 3     */
 110         DIGIT+HEX+4,            /* 34 4     */
 111         DIGIT+HEX+5,            /* 35 5     */
 112         DIGIT+HEX+6,            /* 36 6     */
 113         DIGIT+HEX+7,            /* 37 7     */
 114         DIGIT+HEX+8,            /* 38 8     */
 115         DIGIT+HEX+9,            /* 39 9     */
 116         PUNCT,                  /* 3A :     */
 117         PUNCT,                  /* 3B ;     */
 118         PUNCT,                  /* 3C <     */
 119         PUNCT,                  /* 3D =     */
 120         PUNCT,                  /* 3E >     */
 121         PUNCT,                  /* 3F ?     */
 122         PUNCT,                  /* 40 @     */
 123         UPPER+HEX+10,           /* 41 A     */
 124         UPPER+HEX+11,           /* 42 B     */
 125         UPPER+HEX+12,           /* 43 C     */
 126         UPPER+HEX+13,           /* 44 D     */
 127         UPPER+HEX+14,           /* 45 E     */
 128         UPPER+HEX+15,           /* 46 F     */
 129         UPPER+16,               /* 47 G     */
 130         UPPER+17,               /* 48 H     */
 131         UPPER+18,               /* 49 I     */
 132         UPPER+19,               /* 4A J     */
 133         UPPER+20,               /* 4B K     */
 134         UPPER+21,               /* 4C L     */
 135         UPPER+22,               /* 4D M     */
 136         UPPER+23,               /* 4E N     */
 137         UPPER+24,               /* 4F O     */
 138         UPPER+25,               /* 50 P     */
 139         UPPER+26,               /* 51 Q     */
 140         UPPER+27,               /* 52 R     */
 141         UPPER+28,               /* 53 S     */
 142         UPPER+29,               /* 54 T     */
 143         UPPER+30,               /* 55 U     */
 144         UPPER+31,               /* 56 V     */
 145         UPPER+32,               /* 57 W     */
 146         UPPER+33,               /* 58 X     */
 147         UPPER+34,               /* 59 Y     */
 148         UPPER+35,               /* 5A Z     */
 149         PUNCT,                  /* 5B [     */
 150         PUNCT,                  /* 5C \     */
 151         PUNCT,                  /* 5D ]     */
 152         PUNCT,                  /* 5E ^     */
 153         PUNCT|UNDER,            /* 5F _     */
 154         PUNCT,                  /* 60 `     */
 155         LOWER+HEX+10,           /* 61 a     */
 156         LOWER+HEX+11,           /* 62 b     */
 157         LOWER+HEX+12,           /* 63 c     */
 158         LOWER+HEX+13,           /* 64 d     */
 159         LOWER+HEX+14,           /* 65 e     */
 160         LOWER+HEX+15,           /* 66 f     */
 161         LOWER+16,               /* 67 g     */
 162         LOWER+17,               /* 68 h     */
 163         LOWER+18,               /* 69 i     */
 164         LOWER+19,               /* 6A j     */
 165         LOWER+20,               /* 6B k     */
 166         LOWER+21,               /* 6C l     */
 167         LOWER+22,               /* 6D m     */
 168         LOWER+23,               /* 6E n     */
 169         LOWER+24,               /* 6F o     */
 170         LOWER+25,               /* 70 p     */
 171         LOWER+26,               /* 71 q     */
 172         LOWER+27,               /* 72 r     */
 173         LOWER+28,               /* 73 s     */
 174         LOWER+29,               /* 74 t     */
 175         LOWER+30,               /* 75 u     */
 176         LOWER+31,               /* 76 v     */
 177         LOWER+32,               /* 77 w     */
 178         LOWER+33,               /* 78 x     */
 179         LOWER+34,               /* 79 y     */
 180         LOWER+35,               /* 7A z     */
 181         PUNCT,                  /* 7B {     */
 182         PUNCT,                  /* 7C |     */
 183         PUNCT,                  /* 7D }     */
 184         PUNCT,                  /* 7E ~     */
 185         CNTRL,                  /* 7F (DEL) */
 186     };
 187 
 188     static int getType(int ch) {
 189         return ((ch & 0xFFFFFF80) == 0 ? ctype[ch] : 0);
 190     }
 191 
 192     static boolean isType(int ch, int type) {
 193         return (getType(ch) & type) != 0;
 194     }
 195 
 196     static boolean isAscii(int ch) {
 197         return ((ch & 0xFFFFFF80) == 0);
 198     }
 199 
 200     static boolean isAlpha(int ch) {
 201         return isType(ch, ALPHA);
 202     }
 203 
 204     static boolean isDigit(int ch) {
 205         return ((ch-'0')|('9'-ch)) >= 0;
 206     }
 207 
 208     static boolean isAlnum(int ch) {
 209         return isType(ch, ALNUM);
 210     }
 211 
 212     static boolean isGraph(int ch) {
 213         return isType(ch, GRAPH);
 214     }
 215 
 216     static boolean isPrint(int ch) {
 217         return ((ch-0x20)|(0x7E-ch)) >= 0;
 218     }
 219 
 220     static boolean isPunct(int ch) {
 221         return isType(ch, PUNCT);
 222     }
 223 
 224     static boolean isSpace(int ch) {
 225         return isType(ch, SPACE);
 226     }
 227 
 228     static boolean isHexDigit(int ch) {
 229         return isType(ch, HEX);
 230     }
 231 
 232     static boolean isCntrl(int ch) {
 233         return isType(ch, CNTRL);
 234     }
 235 
 236     static boolean isLower(int ch) {
 237         return ((ch-'a')|('z'-ch)) >= 0;
 238     }
 239 
 240     static boolean isUpper(int ch) {
 241         return ((ch-'A')|('Z'-ch)) >= 0;
 242     }
 243 
 244     static boolean isWord(int ch) {
 245         return isType(ch, WORD);
 246     }
 247 }