1 /*
   2  * Copyright (c) 2005, 2010, Oracle and/or its affiliates. All rights reserved.
   3  * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
   4  *
   5  * This code is free software; you can redistribute it and/or modify it
   6  * under the terms of the GNU General Public License version 2 only, as
   7  * published by the Free Software Foundation.  Oracle designates this
   8  * particular file as subject to the "Classpath" exception as provided
   9  * by Oracle in the LICENSE file that accompanied this code.
  10  *
  11  * This code is distributed in the hope that it will be useful, but WITHOUT
  12  * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  13  * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  14  * version 2 for more details (a copy is included in the LICENSE file that
  15  * accompanied this code).
  16  *
  17  * You should have received a copy of the GNU General Public License version
  18  * 2 along with this work; if not, write to the Free Software Foundation,
  19  * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
  20  *
  21  * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
  22  * or visit www.oracle.com if you need additional information or have any
  23  * questions.
  24  */
  25 
  26 package com.sun.xml.internal.rngom.xml.util;
  27 
  28 public class Naming {
  29 
  30   private Naming() { }
  31 
  32   private static final int CT_NAME = 1;
  33   private static final int CT_NMSTRT = 2;
  34 
  35   private static final String nameStartSingles =
  36   "\u003a\u005f\u0386\u038c\u03da\u03dc\u03de\u03e0\u0559\u06d5\u093d\u09b2" +
  37   "\u0a5e\u0a8d\u0abd\u0ae0\u0b3d\u0b9c\u0cde\u0e30\u0e84\u0e8a\u0e8d\u0ea5" +
  38   "\u0ea7\u0eb0\u0ebd\u1100\u1109\u113c\u113e\u1140\u114c\u114e\u1150\u1159" +
  39   "\u1163\u1165\u1167\u1169\u1175\u119e\u11a8\u11ab\u11ba\u11eb\u11f0\u11f9" +
  40   "\u1f59\u1f5b\u1f5d\u1fbe\u2126\u212e\u3007";
  41   private static final String nameStartRanges =
  42   "\u0041\u005a\u0061\u007a\u00c0\u00d6\u00d8\u00f6\u00f8\u00ff\u0100\u0131" +
  43   "\u0134\u013e\u0141\u0148\u014a\u017e\u0180\u01c3\u01cd\u01f0\u01f4\u01f5" +
  44   "\u01fa\u0217\u0250\u02a8\u02bb\u02c1\u0388\u038a\u038e\u03a1\u03a3\u03ce" +
  45   "\u03d0\u03d6\u03e2\u03f3\u0401\u040c\u040e\u044f\u0451\u045c\u045e\u0481" +
  46   "\u0490\u04c4\u04c7\u04c8\u04cb\u04cc\u04d0\u04eb\u04ee\u04f5\u04f8\u04f9" +
  47   "\u0531\u0556\u0561\u0586\u05d0\u05ea\u05f0\u05f2\u0621\u063a\u0641\u064a" +
  48   "\u0671\u06b7\u06ba\u06be\u06c0\u06ce\u06d0\u06d3\u06e5\u06e6\u0905\u0939" +
  49   "\u0958\u0961\u0985\u098c\u098f\u0990\u0993\u09a8\u09aa\u09b0\u09b6\u09b9" +
  50   "\u09dc\u09dd\u09df\u09e1\u09f0\u09f1\u0a05\u0a0a\u0a0f\u0a10\u0a13\u0a28" +
  51   "\u0a2a\u0a30\u0a32\u0a33\u0a35\u0a36\u0a38\u0a39\u0a59\u0a5c\u0a72\u0a74" +
  52   "\u0a85\u0a8b\u0a8f\u0a91\u0a93\u0aa8\u0aaa\u0ab0\u0ab2\u0ab3\u0ab5\u0ab9" +
  53   "\u0b05\u0b0c\u0b0f\u0b10\u0b13\u0b28\u0b2a\u0b30\u0b32\u0b33\u0b36\u0b39" +
  54   "\u0b5c\u0b5d\u0b5f\u0b61\u0b85\u0b8a\u0b8e\u0b90\u0b92\u0b95\u0b99\u0b9a" +
  55   "\u0b9e\u0b9f\u0ba3\u0ba4\u0ba8\u0baa\u0bae\u0bb5\u0bb7\u0bb9\u0c05\u0c0c" +
  56   "\u0c0e\u0c10\u0c12\u0c28\u0c2a\u0c33\u0c35\u0c39\u0c60\u0c61\u0c85\u0c8c" +
  57   "\u0c8e\u0c90\u0c92\u0ca8\u0caa\u0cb3\u0cb5\u0cb9\u0ce0\u0ce1\u0d05\u0d0c" +
  58   "\u0d0e\u0d10\u0d12\u0d28\u0d2a\u0d39\u0d60\u0d61\u0e01\u0e2e\u0e32\u0e33" +
  59   "\u0e40\u0e45\u0e81\u0e82\u0e87\u0e88\u0e94\u0e97\u0e99\u0e9f\u0ea1\u0ea3" +
  60   "\u0eaa\u0eab\u0ead\u0eae\u0eb2\u0eb3\u0ec0\u0ec4\u0f40\u0f47\u0f49\u0f69" +
  61   "\u10a0\u10c5\u10d0\u10f6\u1102\u1103\u1105\u1107\u110b\u110c\u110e\u1112" +
  62   "\u1154\u1155\u115f\u1161\u116d\u116e\u1172\u1173\u11ae\u11af\u11b7\u11b8" +
  63   "\u11bc\u11c2\u1e00\u1e9b\u1ea0\u1ef9\u1f00\u1f15\u1f18\u1f1d\u1f20\u1f45" +
  64   "\u1f48\u1f4d\u1f50\u1f57\u1f5f\u1f7d\u1f80\u1fb4\u1fb6\u1fbc\u1fc2\u1fc4" +
  65   "\u1fc6\u1fcc\u1fd0\u1fd3\u1fd6\u1fdb\u1fe0\u1fec\u1ff2\u1ff4\u1ff6\u1ffc" +
  66   "\u212a\u212b\u2180\u2182\u3041\u3094\u30a1\u30fa\u3105\u312c\uac00\ud7a3" +
  67   "\u4e00\u9fa5\u3021\u3029";
  68   private static final String nameSingles =
  69   "\u002d\u002e\u05bf\u05c4\u0670\u093c\u094d\u09bc\u09be\u09bf\u09d7\u0a02" +
  70   "\u0a3c\u0a3e\u0a3f\u0abc\u0b3c\u0bd7\u0d57\u0e31\u0eb1\u0f35\u0f37\u0f39" +
  71   "\u0f3e\u0f3f\u0f97\u0fb9\u20e1\u3099\u309a\u00b7\u02d0\u02d1\u0387\u0640" +
  72   "\u0e46\u0ec6\u3005";
  73   private static final String nameRanges =
  74   "\u0300\u0345\u0360\u0361\u0483\u0486\u0591\u05a1\u05a3\u05b9\u05bb\u05bd" +
  75   "\u05c1\u05c2\u064b\u0652\u06d6\u06dc\u06dd\u06df\u06e0\u06e4\u06e7\u06e8" +
  76   "\u06ea\u06ed\u0901\u0903\u093e\u094c\u0951\u0954\u0962\u0963\u0981\u0983" +
  77   "\u09c0\u09c4\u09c7\u09c8\u09cb\u09cd\u09e2\u09e3\u0a40\u0a42\u0a47\u0a48" +
  78   "\u0a4b\u0a4d\u0a70\u0a71\u0a81\u0a83\u0abe\u0ac5\u0ac7\u0ac9\u0acb\u0acd" +
  79   "\u0b01\u0b03\u0b3e\u0b43\u0b47\u0b48\u0b4b\u0b4d\u0b56\u0b57\u0b82\u0b83" +
  80   "\u0bbe\u0bc2\u0bc6\u0bc8\u0bca\u0bcd\u0c01\u0c03\u0c3e\u0c44\u0c46\u0c48" +
  81   "\u0c4a\u0c4d\u0c55\u0c56\u0c82\u0c83\u0cbe\u0cc4\u0cc6\u0cc8\u0cca\u0ccd" +
  82   "\u0cd5\u0cd6\u0d02\u0d03\u0d3e\u0d43\u0d46\u0d48\u0d4a\u0d4d\u0e34\u0e3a" +
  83   "\u0e47\u0e4e\u0eb4\u0eb9\u0ebb\u0ebc\u0ec8\u0ecd\u0f18\u0f19\u0f71\u0f84" +
  84   "\u0f86\u0f8b\u0f90\u0f95\u0f99\u0fad\u0fb1\u0fb7\u20d0\u20dc\u302a\u302f" +
  85   "\u0030\u0039\u0660\u0669\u06f0\u06f9\u0966\u096f\u09e6\u09ef\u0a66\u0a6f" +
  86   "\u0ae6\u0aef\u0b66\u0b6f\u0be7\u0bef\u0c66\u0c6f\u0ce6\u0cef\u0d66\u0d6f" +
  87   "\u0e50\u0e59\u0ed0\u0ed9\u0f20\u0f29\u3031\u3035\u309d\u309e\u30fc\u30fe";
  88 
  89   private final static byte[][] charTypeTable;
  90 
  91   static {
  92     charTypeTable = new byte[256][];
  93     for (int i = 0; i < nameSingles.length(); i++)
  94       setCharType(nameSingles.charAt(i), CT_NAME);
  95     for (int i = 0; i < nameRanges.length(); i += 2)
  96       setCharType(nameRanges.charAt(i), nameRanges.charAt(i + 1), CT_NAME);
  97     for (int i = 0; i < nameStartSingles.length(); i++)
  98       setCharType(nameStartSingles.charAt(i), CT_NMSTRT);
  99     for (int i = 0; i < nameStartRanges.length(); i += 2)
 100       setCharType(nameStartRanges.charAt(i), nameStartRanges.charAt(i + 1),
 101                   CT_NMSTRT);
 102     byte[] other = new byte[256];
 103     for (int i = 0; i < 256; i++)
 104       if (charTypeTable[i] == null)
 105         charTypeTable[i] = other;
 106   }
 107 
 108   private static void setCharType(char c, int type) {
 109     int hi = c >> 8;
 110     if (charTypeTable[hi] == null)
 111       charTypeTable[hi] = new byte[256];
 112     charTypeTable[hi][c & 0xFF] = (byte)type;
 113   }
 114 
 115   private static void setCharType(char min, char max, int type) {
 116     byte[] shared = null;
 117     do {
 118       if ((min & 0xFF) == 0) {
 119         for (; min + 0xFF <= max; min += 0x100) {
 120           if (shared == null) {
 121             shared = new byte[256];
 122             for (int i = 0; i < 256; i++)
 123               shared[i] = (byte)type;
 124           }
 125           charTypeTable[min >> 8] = shared;
 126           if (min + 0xFF == max)
 127             return;
 128         }
 129       }
 130       setCharType(min, type);
 131     } while (min++ != max);
 132   }
 133 
 134   private static boolean isNameStartChar(char c) {
 135     return charTypeTable[c >> 8][c & 0xff] == CT_NMSTRT;
 136   }
 137 
 138   private static boolean isNameStartCharNs(char c) {
 139     return isNameStartChar(c) && c != ':';
 140   }
 141 
 142   private static boolean isNameChar(char c) {
 143     return charTypeTable[c >> 8][c & 0xff] != 0;
 144   }
 145 
 146   private static boolean isNameCharNs(char c) {
 147     return isNameChar(c) && c != ':';
 148   }
 149 
 150   public static boolean isName(String s) {
 151     int len = s.length();
 152     if (len == 0)
 153       return false;
 154     if (!isNameStartChar(s.charAt(0)))
 155       return false;
 156     for (int i = 1; i < len; i++)
 157       if (!isNameChar(s.charAt(i)))
 158         return false;
 159     return true;
 160   }
 161 
 162   public static boolean isNmtoken(String s) {
 163     int len = s.length();
 164     if (len == 0)
 165       return false;
 166     for (int i = 0; i < len; i++)
 167       if (!isNameChar(s.charAt(i)))
 168         return false;
 169     return true;
 170   }
 171 
 172   public static boolean isNcname(String s) {
 173     int len = s.length();
 174     if (len == 0)
 175       return false;
 176     if (!isNameStartCharNs(s.charAt(0)))
 177       return false;
 178     for (int i = 1; i < len; i++)
 179       if (!isNameCharNs(s.charAt(i)))
 180         return false;
 181     return true;
 182   }
 183 
 184   public static boolean isQname(String s) {
 185     int len = s.length();
 186     if (len == 0)
 187       return false;
 188     if (!isNameStartCharNs(s.charAt(0)))
 189       return false;
 190     for (int i = 1; i < len; i++) {
 191       char c = s.charAt(i);
 192       if (!isNameChar(c)) {
 193         if (c == ':' && ++i < len && isNameStartCharNs(s.charAt(i))) {
 194           for (++i; i < len; i++)
 195             if (!isNameCharNs(s.charAt(i)))
 196               return false;
 197           return true;
 198         }
 199         return false;
 200       }
 201     }
 202     return true;
 203   }
 204 
 205 
 206 }