jtulach@1348: /* jtulach@1348: * Copyright (c) 1999, 2000, Oracle and/or its affiliates. All rights reserved. jtulach@1348: * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. jtulach@1348: * jtulach@1348: * This code is free software; you can redistribute it and/or modify it jtulach@1348: * under the terms of the GNU General Public License version 2 only, as jtulach@1348: * published by the Free Software Foundation. Oracle designates this jtulach@1348: * particular file as subject to the "Classpath" exception as provided jtulach@1348: * by Oracle in the LICENSE file that accompanied this code. jtulach@1348: * jtulach@1348: * This code is distributed in the hope that it will be useful, but WITHOUT jtulach@1348: * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or jtulach@1348: * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License jtulach@1348: * version 2 for more details (a copy is included in the LICENSE file that jtulach@1348: * accompanied this code). jtulach@1348: * jtulach@1348: * You should have received a copy of the GNU General Public License version jtulach@1348: * 2 along with this work; if not, write to the Free Software Foundation, jtulach@1348: * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. jtulach@1348: * jtulach@1348: * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA jtulach@1348: * or visit www.oracle.com if you need additional information or have any jtulach@1348: * questions. jtulach@1348: */ jtulach@1348: jtulach@1348: package java.util.regex; jtulach@1348: jtulach@1348: jtulach@1348: /** jtulach@1348: * Utility class that implements the standard C ctype functionality. jtulach@1348: * jtulach@1348: * @author Hong Zhang jtulach@1348: */ jtulach@1348: jtulach@1348: final class ASCII { jtulach@1348: jtulach@1348: static final int UPPER = 0x00000100; jtulach@1348: jtulach@1348: static final int LOWER = 0x00000200; jtulach@1348: jtulach@1348: static final int DIGIT = 0x00000400; jtulach@1348: jtulach@1348: static final int SPACE = 0x00000800; jtulach@1348: jtulach@1348: static final int PUNCT = 0x00001000; jtulach@1348: jtulach@1348: static final int CNTRL = 0x00002000; jtulach@1348: jtulach@1348: static final int BLANK = 0x00004000; jtulach@1348: jtulach@1348: static final int HEX = 0x00008000; jtulach@1348: jtulach@1348: static final int UNDER = 0x00010000; jtulach@1348: jtulach@1348: static final int ASCII = 0x0000FF00; jtulach@1348: jtulach@1348: static final int ALPHA = (UPPER|LOWER); jtulach@1348: jtulach@1348: static final int ALNUM = (UPPER|LOWER|DIGIT); jtulach@1348: jtulach@1348: static final int GRAPH = (PUNCT|UPPER|LOWER|DIGIT); jtulach@1348: jtulach@1348: static final int WORD = (UPPER|LOWER|UNDER|DIGIT); jtulach@1348: jtulach@1348: static final int XDIGIT = (HEX); jtulach@1348: jtulach@1348: private static final int[] ctype = new int[] { jtulach@1348: CNTRL, /* 00 (NUL) */ jtulach@1348: CNTRL, /* 01 (SOH) */ jtulach@1348: CNTRL, /* 02 (STX) */ jtulach@1348: CNTRL, /* 03 (ETX) */ jtulach@1348: CNTRL, /* 04 (EOT) */ jtulach@1348: CNTRL, /* 05 (ENQ) */ jtulach@1348: CNTRL, /* 06 (ACK) */ jtulach@1348: CNTRL, /* 07 (BEL) */ jtulach@1348: CNTRL, /* 08 (BS) */ jtulach@1348: SPACE+CNTRL+BLANK, /* 09 (HT) */ jtulach@1348: SPACE+CNTRL, /* 0A (LF) */ jtulach@1348: SPACE+CNTRL, /* 0B (VT) */ jtulach@1348: SPACE+CNTRL, /* 0C (FF) */ jtulach@1348: SPACE+CNTRL, /* 0D (CR) */ jtulach@1348: CNTRL, /* 0E (SI) */ jtulach@1348: CNTRL, /* 0F (SO) */ jtulach@1348: CNTRL, /* 10 (DLE) */ jtulach@1348: CNTRL, /* 11 (DC1) */ jtulach@1348: CNTRL, /* 12 (DC2) */ jtulach@1348: CNTRL, /* 13 (DC3) */ jtulach@1348: CNTRL, /* 14 (DC4) */ jtulach@1348: CNTRL, /* 15 (NAK) */ jtulach@1348: CNTRL, /* 16 (SYN) */ jtulach@1348: CNTRL, /* 17 (ETB) */ jtulach@1348: CNTRL, /* 18 (CAN) */ jtulach@1348: CNTRL, /* 19 (EM) */ jtulach@1348: CNTRL, /* 1A (SUB) */ jtulach@1348: CNTRL, /* 1B (ESC) */ jtulach@1348: CNTRL, /* 1C (FS) */ jtulach@1348: CNTRL, /* 1D (GS) */ jtulach@1348: CNTRL, /* 1E (RS) */ jtulach@1348: CNTRL, /* 1F (US) */ jtulach@1348: SPACE+BLANK, /* 20 SPACE */ jtulach@1348: PUNCT, /* 21 ! */ jtulach@1348: PUNCT, /* 22 " */ jtulach@1348: PUNCT, /* 23 # */ jtulach@1348: PUNCT, /* 24 $ */ jtulach@1348: PUNCT, /* 25 % */ jtulach@1348: PUNCT, /* 26 & */ jtulach@1348: PUNCT, /* 27 ' */ jtulach@1348: PUNCT, /* 28 ( */ jtulach@1348: PUNCT, /* 29 ) */ jtulach@1348: PUNCT, /* 2A * */ jtulach@1348: PUNCT, /* 2B + */ jtulach@1348: PUNCT, /* 2C , */ jtulach@1348: PUNCT, /* 2D - */ jtulach@1348: PUNCT, /* 2E . */ jtulach@1348: PUNCT, /* 2F / */ jtulach@1348: DIGIT+HEX+0, /* 30 0 */ jtulach@1348: DIGIT+HEX+1, /* 31 1 */ jtulach@1348: DIGIT+HEX+2, /* 32 2 */ jtulach@1348: DIGIT+HEX+3, /* 33 3 */ jtulach@1348: DIGIT+HEX+4, /* 34 4 */ jtulach@1348: DIGIT+HEX+5, /* 35 5 */ jtulach@1348: DIGIT+HEX+6, /* 36 6 */ jtulach@1348: DIGIT+HEX+7, /* 37 7 */ jtulach@1348: DIGIT+HEX+8, /* 38 8 */ jtulach@1348: DIGIT+HEX+9, /* 39 9 */ jtulach@1348: PUNCT, /* 3A : */ jtulach@1348: PUNCT, /* 3B ; */ jtulach@1348: PUNCT, /* 3C < */ jtulach@1348: PUNCT, /* 3D = */ jtulach@1348: PUNCT, /* 3E > */ jtulach@1348: PUNCT, /* 3F ? */ jtulach@1348: PUNCT, /* 40 @ */ jtulach@1348: UPPER+HEX+10, /* 41 A */ jtulach@1348: UPPER+HEX+11, /* 42 B */ jtulach@1348: UPPER+HEX+12, /* 43 C */ jtulach@1348: UPPER+HEX+13, /* 44 D */ jtulach@1348: UPPER+HEX+14, /* 45 E */ jtulach@1348: UPPER+HEX+15, /* 46 F */ jtulach@1348: UPPER+16, /* 47 G */ jtulach@1348: UPPER+17, /* 48 H */ jtulach@1348: UPPER+18, /* 49 I */ jtulach@1348: UPPER+19, /* 4A J */ jtulach@1348: UPPER+20, /* 4B K */ jtulach@1348: UPPER+21, /* 4C L */ jtulach@1348: UPPER+22, /* 4D M */ jtulach@1348: UPPER+23, /* 4E N */ jtulach@1348: UPPER+24, /* 4F O */ jtulach@1348: UPPER+25, /* 50 P */ jtulach@1348: UPPER+26, /* 51 Q */ jtulach@1348: UPPER+27, /* 52 R */ jtulach@1348: UPPER+28, /* 53 S */ jtulach@1348: UPPER+29, /* 54 T */ jtulach@1348: UPPER+30, /* 55 U */ jtulach@1348: UPPER+31, /* 56 V */ jtulach@1348: UPPER+32, /* 57 W */ jtulach@1348: UPPER+33, /* 58 X */ jtulach@1348: UPPER+34, /* 59 Y */ jtulach@1348: UPPER+35, /* 5A Z */ jtulach@1348: PUNCT, /* 5B [ */ jtulach@1348: PUNCT, /* 5C \ */ jtulach@1348: PUNCT, /* 5D ] */ jtulach@1348: PUNCT, /* 5E ^ */ jtulach@1348: PUNCT|UNDER, /* 5F _ */ jtulach@1348: PUNCT, /* 60 ` */ jtulach@1348: LOWER+HEX+10, /* 61 a */ jtulach@1348: LOWER+HEX+11, /* 62 b */ jtulach@1348: LOWER+HEX+12, /* 63 c */ jtulach@1348: LOWER+HEX+13, /* 64 d */ jtulach@1348: LOWER+HEX+14, /* 65 e */ jtulach@1348: LOWER+HEX+15, /* 66 f */ jtulach@1348: LOWER+16, /* 67 g */ jtulach@1348: LOWER+17, /* 68 h */ jtulach@1348: LOWER+18, /* 69 i */ jtulach@1348: LOWER+19, /* 6A j */ jtulach@1348: LOWER+20, /* 6B k */ jtulach@1348: LOWER+21, /* 6C l */ jtulach@1348: LOWER+22, /* 6D m */ jtulach@1348: LOWER+23, /* 6E n */ jtulach@1348: LOWER+24, /* 6F o */ jtulach@1348: LOWER+25, /* 70 p */ jtulach@1348: LOWER+26, /* 71 q */ jtulach@1348: LOWER+27, /* 72 r */ jtulach@1348: LOWER+28, /* 73 s */ jtulach@1348: LOWER+29, /* 74 t */ jtulach@1348: LOWER+30, /* 75 u */ jtulach@1348: LOWER+31, /* 76 v */ jtulach@1348: LOWER+32, /* 77 w */ jtulach@1348: LOWER+33, /* 78 x */ jtulach@1348: LOWER+34, /* 79 y */ jtulach@1348: LOWER+35, /* 7A z */ jtulach@1348: PUNCT, /* 7B { */ jtulach@1348: PUNCT, /* 7C | */ jtulach@1348: PUNCT, /* 7D } */ jtulach@1348: PUNCT, /* 7E ~ */ jtulach@1348: CNTRL, /* 7F (DEL) */ jtulach@1348: }; jtulach@1348: jtulach@1348: static int getType(int ch) { jtulach@1348: return ((ch & 0xFFFFFF80) == 0 ? ctype[ch] : 0); jtulach@1348: } jtulach@1348: jtulach@1348: static boolean isType(int ch, int type) { jtulach@1348: return (getType(ch) & type) != 0; jtulach@1348: } jtulach@1348: jtulach@1348: static boolean isAscii(int ch) { jtulach@1348: return ((ch & 0xFFFFFF80) == 0); jtulach@1348: } jtulach@1348: jtulach@1348: static boolean isAlpha(int ch) { jtulach@1348: return isType(ch, ALPHA); jtulach@1348: } jtulach@1348: jtulach@1348: static boolean isDigit(int ch) { jtulach@1348: return ((ch-'0')|('9'-ch)) >= 0; jtulach@1348: } jtulach@1348: jtulach@1348: static boolean isAlnum(int ch) { jtulach@1348: return isType(ch, ALNUM); jtulach@1348: } jtulach@1348: jtulach@1348: static boolean isGraph(int ch) { jtulach@1348: return isType(ch, GRAPH); jtulach@1348: } jtulach@1348: jtulach@1348: static boolean isPrint(int ch) { jtulach@1348: return ((ch-0x20)|(0x7E-ch)) >= 0; jtulach@1348: } jtulach@1348: jtulach@1348: static boolean isPunct(int ch) { jtulach@1348: return isType(ch, PUNCT); jtulach@1348: } jtulach@1348: jtulach@1348: static boolean isSpace(int ch) { jtulach@1348: return isType(ch, SPACE); jtulach@1348: } jtulach@1348: jtulach@1348: static boolean isHexDigit(int ch) { jtulach@1348: return isType(ch, HEX); jtulach@1348: } jtulach@1348: jtulach@1348: static boolean isOctDigit(int ch) { jtulach@1348: return ((ch-'0')|('7'-ch)) >= 0; jtulach@1348: } jtulach@1348: jtulach@1348: static boolean isCntrl(int ch) { jtulach@1348: return isType(ch, CNTRL); jtulach@1348: } jtulach@1348: jtulach@1348: static boolean isLower(int ch) { jtulach@1348: return ((ch-'a')|('z'-ch)) >= 0; jtulach@1348: } jtulach@1348: jtulach@1348: static boolean isUpper(int ch) { jtulach@1348: return ((ch-'A')|('Z'-ch)) >= 0; jtulach@1348: } jtulach@1348: jtulach@1348: static boolean isWord(int ch) { jtulach@1348: return isType(ch, WORD); jtulach@1348: } jtulach@1348: jtulach@1348: static int toDigit(int ch) { jtulach@1348: return (ctype[ch & 0x7F] & 0x3F); jtulach@1348: } jtulach@1348: jtulach@1348: static int toLower(int ch) { jtulach@1348: return isUpper(ch) ? (ch + 0x20) : ch; jtulach@1348: } jtulach@1348: jtulach@1348: static int toUpper(int ch) { jtulach@1348: return isLower(ch) ? (ch - 0x20) : ch; jtulach@1348: } jtulach@1348: jtulach@1348: }