4139N/A/*
4139N/A * Copyright (c) 2011, Oracle and/or its affiliates. All rights reserved.
4139N/A * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
4139N/A *
4139N/A * This code is free software; you can redistribute it and/or modify it
4139N/A * under the terms of the GNU General Public License version 2 only, as
4139N/A * published by the Free Software Foundation. Oracle designates this
4139N/A * particular file as subject to the "Classpath" exception as provided
4139N/A * by Oracle in the LICENSE file that accompanied this code.
4139N/A *
4139N/A * This code is distributed in the hope that it will be useful, but WITHOUT
4139N/A * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
4139N/A * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
4139N/A * version 2 for more details (a copy is included in the LICENSE file that
4139N/A * accompanied this code).
4139N/A *
4139N/A * You should have received a copy of the GNU General Public License version
4139N/A * 2 along with this work; if not, write to the Free Software Foundation,
4139N/A * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
4139N/A *
4139N/A * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
4139N/A * or visit www.oracle.com if you need additional information or have any
4139N/A * questions.
4139N/A */
4139N/A
4139N/Apackage java.util.regex;
4139N/A
4139N/Aimport java.util.HashMap;
4139N/Aimport java.util.Locale;
4139N/A
/**
 * Named character properties that can be tested against a single code point.
 *
 * <p>Each constant implements {@link #is(int)} for one property. Constants are
 * looked up case-insensitively, either by their own name or a spelling without
 * underscores ({@link #forName(String)}), or by a POSIX class name such as
 * {@code alpha} or {@code xdigit} ({@link #forPOSIXName(String)}).
 *
 * <p>The lookup tables are filled once in the static initializer and are only
 * read afterwards.
 */
enum UnicodeProp {

    /** Code points for which {@link Character#isAlphabetic(int)} is true. */
    ALPHABETIC {
        @Override
        public boolean is(int ch) {
            return Character.isAlphabetic(ch);
        }
    },

    /** Code points for which {@link Character#isLetter(int)} is true. */
    LETTER {
        @Override
        public boolean is(int ch) {
            return Character.isLetter(ch);
        }
    },

    /** Code points for which {@link Character#isIdeographic(int)} is true. */
    IDEOGRAPHIC {
        @Override
        public boolean is(int ch) {
            return Character.isIdeographic(ch);
        }
    },

    /** Code points for which {@link Character#isLowerCase(int)} is true. */
    LOWERCASE {
        @Override
        public boolean is(int ch) {
            return Character.isLowerCase(ch);
        }
    },

    /** Code points for which {@link Character#isUpperCase(int)} is true. */
    UPPERCASE {
        @Override
        public boolean is(int ch) {
            return Character.isUpperCase(ch);
        }
    },

    /** Code points for which {@link Character#isTitleCase(int)} is true. */
    TITLECASE {
        @Override
        public boolean is(int ch) {
            return Character.isTitleCase(ch);
        }
    },

    /**
     * \p{Whitespace}: general category space, line or paragraph separator,
     * plus U+0009..U+000D and U+0085.
     */
    WHITE_SPACE {
        @Override
        public boolean is(int ch) {
            return hasCategoryIn(ch, SEPARATOR_MASK)
                || (ch >= 0x9 && ch <= 0xd)
                || ch == 0x85;
        }
    },

    /** \p{gc=Control}. */
    CONTROL {
        @Override
        public boolean is(int ch) {
            return Character.getType(ch) == Character.CONTROL;
        }
    },

    /**
     * \p{gc=Punctuation}: connector, dash, start, end, other, initial-quote
     * and final-quote punctuation.
     */
    PUNCTUATION {
        @Override
        public boolean is(int ch) {
            return hasCategoryIn(ch, PUNCTUATION_MASK);
        }
    },

    /**
     * Union of \p{gc=Decimal_Number} (via {@link #DIGIT}) and the Hex_Digit
     * ranges of PropList.txt: ASCII and fullwidth 0-9, A-F and a-f.
     */
    HEX_DIGIT {
        @Override
        public boolean is(int ch) {
            return DIGIT.is(ch)
                || (ch >= 0x0030 && ch <= 0x0039)   // 0-9
                || (ch >= 0x0041 && ch <= 0x0046)   // A-F
                || (ch >= 0x0061 && ch <= 0x0066)   // a-f
                || (ch >= 0xFF10 && ch <= 0xFF19)   // fullwidth 0-9
                || (ch >= 0xFF21 && ch <= 0xFF26)   // fullwidth A-F
                || (ch >= 0xFF41 && ch <= 0xFF46);  // fullwidth a-f
        }
    },

    /** Code points whose general category is not {@link Character#UNASSIGNED}. */
    ASSIGNED {
        @Override
        public boolean is(int ch) {
            return Character.getType(ch) != Character.UNASSIGNED;
        }
    },

    /**
     * PropList.txt Noncharacter_Code_Point: values whose low 16 bits are
     * FFFE or FFFF, plus U+FDD0..U+FDEF.
     */
    NONCHARACTER_CODE_POINT {
        @Override
        public boolean is(int ch) {
            return (ch & 0xfffe) == 0xfffe || (ch >= 0xfdd0 && ch <= 0xfdef);
        }
    },

    /** \p{gc=Decimal_Number}, tested with {@link Character#isDigit(int)}. */
    DIGIT {
        @Override
        public boolean is(int ch) {
            return Character.isDigit(ch);
        }
    },

    /** Union of {@link #ALPHABETIC} and {@link #DIGIT}. */
    ALNUM {
        @Override
        public boolean is(int ch) {
            return ALPHABETIC.is(ch) || DIGIT.is(ch);
        }
    },

    /**
     * General category space separator, plus U+0009 (horizontal tab).
     * Unlike {@link #WHITE_SPACE} this excludes LF, VT, FF, CR, NEL and the
     * line and paragraph separators.
     */
    BLANK {
        @Override
        public boolean is(int ch) {
            return Character.getType(ch) == Character.SPACE_SEPARATOR
                || ch == 0x9; // \N{HT}
        }
    },

    /**
     * Everything whose general category is none of: space, line or paragraph
     * separator, control, surrogate, unassigned.
     */
    GRAPH {
        @Override
        public boolean is(int ch) {
            return !hasCategoryIn(ch, NON_GRAPH_MASK);
        }
    },

    /** ({@link #GRAPH} or {@link #BLANK}) and not {@link #CONTROL}. */
    PRINT {
        @Override
        public boolean is(int ch) {
            return (GRAPH.is(ch) || BLANK.is(ch)) && !CONTROL.is(ch);
        }
    },

    /**
     * Union of {@link #ALPHABETIC}, \p{gc=Mark} (non-spacing, enclosing and
     * combining spacing marks), decimal digits and connector punctuation.
     */
    WORD {
        @Override
        public boolean is(int ch) {
            return ALPHABETIC.is(ch) || hasCategoryIn(ch, WORD_EXTRA_MASK);
        }
    };

    // Bit sets of general categories: bit n is set when the category whose
    // Character.getType value is n belongs to the set.

    /** Zs, Zl and Zp. */
    private static final int SEPARATOR_MASK =
        (1 << Character.SPACE_SEPARATOR)
        | (1 << Character.LINE_SEPARATOR)
        | (1 << Character.PARAGRAPH_SEPARATOR);

    /** All seven punctuation categories. */
    private static final int PUNCTUATION_MASK =
        (1 << Character.CONNECTOR_PUNCTUATION)
        | (1 << Character.DASH_PUNCTUATION)
        | (1 << Character.START_PUNCTUATION)
        | (1 << Character.END_PUNCTUATION)
        | (1 << Character.OTHER_PUNCTUATION)
        | (1 << Character.INITIAL_QUOTE_PUNCTUATION)
        | (1 << Character.FINAL_QUOTE_PUNCTUATION);

    /** Categories excluded from {@link #GRAPH}. */
    private static final int NON_GRAPH_MASK =
        SEPARATOR_MASK
        | (1 << Character.CONTROL)
        | (1 << Character.SURROGATE)
        | (1 << Character.UNASSIGNED);

    /** Categories accepted by {@link #WORD} in addition to alphabetic code points. */
    private static final int WORD_EXTRA_MASK =
        (1 << Character.NON_SPACING_MARK)
        | (1 << Character.ENCLOSING_MARK)
        | (1 << Character.COMBINING_SPACING_MARK)
        | (1 << Character.DECIMAL_DIGIT_NUMBER)
        | (1 << Character.CONNECTOR_PUNCTUATION);

    /** Upper-cased constant names and underscore-free aliases, used by {@link #forName}. */
    private static final HashMap<String, UnicodeProp> byName = new HashMap<>();

    /** Upper-cased POSIX class names, used by {@link #forPOSIXName}. */
    private static final HashMap<String, UnicodeProp> posix = new HashMap<>();

    static {
        for (UnicodeProp prop : values()) {
            byName.put(prop.name(), prop);
        }
        // Spellings without underscores for the multi-word names.
        byName.put("WHITESPACE", WHITE_SPACE);
        byName.put("HEXDIGIT", HEX_DIGIT);
        byName.put("NONCHARACTERCODEPOINT", NONCHARACTER_CODE_POINT);

        posix.put("ALPHA", ALPHABETIC);
        posix.put("LOWER", LOWERCASE);
        posix.put("UPPER", UPPERCASE);
        posix.put("SPACE", WHITE_SPACE);
        posix.put("PUNCT", PUNCTUATION);
        posix.put("XDIGIT", HEX_DIGIT);
        posix.put("ALNUM", ALNUM);
        posix.put("CNTRL", CONTROL);
        posix.put("DIGIT", DIGIT);
        posix.put("BLANK", BLANK);
        posix.put("GRAPH", GRAPH);
        posix.put("PRINT", PRINT);
    }

    /**
     * Tells whether the general category of {@code ch} is one of those whose
     * bit is set in {@code categoryMask}.
     */
    private static boolean hasCategoryIn(int ch, int categoryMask) {
        return ((categoryMask >> Character.getType(ch)) & 1) != 0;
    }

    /**
     * Looks up a property by constant name or by one of the underscore-free
     * aliases ({@code WHITESPACE}, {@code HEXDIGIT},
     * {@code NONCHARACTERCODEPOINT}). The comparison ignores case; the name is
     * upper-cased with {@link Locale#ENGLISH} before the lookup.
     *
     * @param propName the property name
     * @return the matching constant, or {@code null} if the name is unknown
     * @throws NullPointerException if {@code propName} is {@code null}
     */
    public static UnicodeProp forName(String propName) {
        // A plain map lookup yields null for unknown names, so no exception
        // has to be raised and discarded as with valueOf.
        return byName.get(propName.toUpperCase(Locale.ENGLISH));
    }

    /**
     * Looks up a property by POSIX class name ({@code alpha}, {@code lower},
     * {@code upper}, {@code space}, {@code punct}, {@code xdigit},
     * {@code alnum}, {@code cntrl}, {@code digit}, {@code blank},
     * {@code graph}, {@code print}). The comparison ignores case; the name is
     * upper-cased with {@link Locale#ENGLISH} before the lookup.
     *
     * @param propName the POSIX class name
     * @return the matching constant, or {@code null} if the name is unknown
     * @throws NullPointerException if {@code propName} is {@code null}
     */
    public static UnicodeProp forPOSIXName(String propName) {
        return posix.get(propName.toUpperCase(Locale.ENGLISH));
    }

    /**
     * Tests whether a code point has this property.
     *
     * @param ch the code point to test
     * @return {@code true} if {@code ch} has this property
     */
    public abstract boolean is(int ch);
}