310 lines
14 KiB
Java
310 lines
14 KiB
Java
/*
|
|
* Copyright (c) 2019, Oracle and/or its affiliates. All rights reserved.
|
|
* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
|
|
*
|
|
* This code is free software; you can redistribute it and/or modify it
|
|
* under the terms of the GNU General Public License version 2 only, as
|
|
* published by the Free Software Foundation.
|
|
*
|
|
* This code is distributed in the hope that it will be useful, but WITHOUT
|
|
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
|
|
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
|
|
* version 2 for more details (a copy is included in the LICENSE file that
|
|
* accompanied this code).
|
|
*
|
|
* You should have received a copy of the GNU General Public License version
|
|
* 2 along with this work; if not, write to the Free Software Foundation,
|
|
* Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
|
|
*
|
|
* Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
|
|
* or visit www.oracle.com if you need additional information or have any
|
|
* questions.
|
|
*/
|
|
|
|
/**
 * @test
 * @summary Test behavior of the isJavaIdentifierXX, isJavaLetter, and
 *          isJavaLetterOrDigit methods for all code points.
 * @bug 8218915
 */
|
|
|
|
import java.util.ArrayList;
import java.util.Arrays;
import java.util.Collections;
import java.util.HashSet;
import java.util.List;
import java.util.Set;
|
|
|
|
/**
 * Exhaustively compares the Java-identifier classification methods of
 * {@link Character} against an expectation derived from
 * {@link Character#getType}, {@link Character#isLetter},
 * {@link Character#isDigit} and {@link Character#isIdentifierIgnorable}.
 *
 * <p>Each {@code test...} method throws a {@link RuntimeException} naming the
 * first value (in hexadecimal) for which the method under test disagrees with
 * the expectation.
 */
public class TestIsJavaIdentifierMethods {

    /**
     * Code points that are not present in Unicode 6.2. The methods under test
     * are expected to follow Unicode 6.2, so the expected answer for each of
     * these code points is always {@code false}.
     */
    private static final Set<Integer> UNASSIGNED_CODEPOINTS_IN_6_2 =
            Collections.unmodifiableSet(new HashSet<>(Arrays.asList(
                    0x20BB,  // NORDIC MARK SIGN
                    0x20BC,  // MANAT SIGN
                    0x20BD,  // RUBLE SIGN
                    0x20BE,  // LARI SIGN
                    0x20BF,  // BITCOIN SIGN
                    0x32FF   // SQUARE ERA NAME NEWERA
            )));

    /**
     * Runs every check in this class, in declaration order.
     *
     * @param args ignored
     * @throws RuntimeException if any check finds a mismatch
     */
    public static void main(String[] args) {
        testIsJavaIdentifierPart_int();
        testIsJavaIdentifierPart_char();
        testIsJavaIdentifierStart_int();
        testIsJavaIdentifierStart_char();
        testIsJavaLetter();
        testIsJavaLetterOrDigit();
    }

    /**
     * Checks {@code Character.isJavaIdentifierPart(int)} for every code point
     * in (0x0000..0x10FFFF). A code point is expected to be an identifier
     * part if it is a letter, a currency symbol, a connecting punctuation
     * character, a digit, a numeric letter, a combining mark, a non-spacing
     * mark, or identifier-ignorable, and is not listed in
     * {@code UNASSIGNED_CODEPOINTS_IN_6_2}.
     *
     * @throws RuntimeException on the first mismatching code point
     */
    public static void testIsJavaIdentifierPart_int() {
        for (int cp = Character.MIN_CODE_POINT; cp <= Character.MAX_CODE_POINT; cp++) {
            verify("Character.isJavaIdentifierPart(int)", cp,
                    Character.isJavaIdentifierPart(cp),
                    expectedPartForCodePoint(cp));
        }
    }

    /**
     * Checks {@code Character.isJavaIdentifierPart(char)} for every BMP value
     * (0x0000..0xFFFF), using the same criteria as
     * {@link #testIsJavaIdentifierPart_int()} but evaluated through the
     * {@code char} overloads of the {@link Character} query methods.
     *
     * @throws RuntimeException on the first mismatching value
     */
    public static void testIsJavaIdentifierPart_char() {
        // The counter is an int: a char counter could never exceed MAX_VALUE
        // and the loop would not terminate.
        for (int i = Character.MIN_VALUE; i <= Character.MAX_VALUE; i++) {
            char ch = (char) i;
            verify("Character.isJavaIdentifierPart(char)", i,
                    Character.isJavaIdentifierPart(ch),
                    expectedPartForChar(ch));
        }
    }

    /**
     * Checks {@code Character.isJavaIdentifierStart(int)} for every code
     * point in (0x0000..0x10FFFF). A code point is expected to be an
     * identifier start if it is a letter, has type {@code LETTER_NUMBER}, is
     * a currency symbol, or is a connecting punctuation character, and is not
     * listed in {@code UNASSIGNED_CODEPOINTS_IN_6_2}.
     *
     * @throws RuntimeException on the first mismatching code point
     */
    public static void testIsJavaIdentifierStart_int() {
        for (int cp = Character.MIN_CODE_POINT; cp <= Character.MAX_CODE_POINT; cp++) {
            verify("Character.isJavaIdentifierStart(int)", cp,
                    Character.isJavaIdentifierStart(cp),
                    expectedStartForCodePoint(cp));
        }
    }

    /**
     * Checks {@code Character.isJavaIdentifierStart(char)} for every BMP
     * value (0x0000..0xFFFF), using the same criteria as
     * {@link #testIsJavaIdentifierStart_int()} but evaluated through the
     * {@code char} overloads of the {@link Character} query methods.
     *
     * @throws RuntimeException on the first mismatching value
     */
    public static void testIsJavaIdentifierStart_char() {
        for (int i = Character.MIN_VALUE; i <= Character.MAX_VALUE; i++) {
            char ch = (char) i;
            verify("Character.isJavaIdentifierStart(char)", i,
                    Character.isJavaIdentifierStart(ch),
                    expectedStartForChar(ch));
        }
    }

    /**
     * Checks the deprecated {@code Character.isJavaLetter(char)} for every
     * BMP value (0x0000..0xFFFF). The expectation is the same as for
     * {@link #testIsJavaIdentifierStart_char()}.
     *
     * @throws RuntimeException on the first mismatching value
     */
    @SuppressWarnings("deprecation") // the deprecated method is the one under test
    public static void testIsJavaLetter() {
        for (int i = Character.MIN_VALUE; i <= Character.MAX_VALUE; i++) {
            char ch = (char) i;
            verify("Character.isJavaLetter(ch)", i,
                    Character.isJavaLetter(ch),
                    expectedStartForChar(ch));
        }
    }

    /**
     * Checks the deprecated {@code Character.isJavaLetterOrDigit(char)} for
     * every BMP value (0x0000..0xFFFF). The expectation is the same as for
     * {@link #testIsJavaIdentifierPart_char()}.
     *
     * @throws RuntimeException on the first mismatching value
     */
    @SuppressWarnings("deprecation") // the deprecated method is the one under test
    public static void testIsJavaLetterOrDigit() {
        for (int i = Character.MIN_VALUE; i <= Character.MAX_VALUE; i++) {
            char ch = (char) i;
            verify("Character.isJavaLetterOrDigit(ch)", i,
                    Character.isJavaLetterOrDigit(ch),
                    expectedPartForChar(ch));
        }
    }

    /** Expected "identifier part" answer for a code point, via the int overloads. */
    private static boolean expectedPartForCodePoint(int cp) {
        if (UNASSIGNED_CODEPOINTS_IN_6_2.contains(cp)) {
            return false;
        }
        int type = Character.getType(cp);
        return Character.isLetter(cp)
                || type == Character.CURRENCY_SYMBOL
                || type == Character.CONNECTOR_PUNCTUATION
                || Character.isDigit(cp)
                || type == Character.LETTER_NUMBER
                || type == Character.COMBINING_SPACING_MARK
                || type == Character.NON_SPACING_MARK
                || Character.isIdentifierIgnorable(cp);
    }

    /** Expected "identifier part" answer for a char, via the char overloads. */
    private static boolean expectedPartForChar(char ch) {
        // Widen to int before the lookup: a bare char would be boxed to
        // Character and could never equal the Integer elements of the set.
        if (UNASSIGNED_CODEPOINTS_IN_6_2.contains((int) ch)) {
            return false;
        }
        int type = Character.getType(ch);
        return Character.isLetter(ch)
                || type == Character.CURRENCY_SYMBOL
                || type == Character.CONNECTOR_PUNCTUATION
                || Character.isDigit(ch)
                || type == Character.LETTER_NUMBER
                || type == Character.COMBINING_SPACING_MARK
                || type == Character.NON_SPACING_MARK
                || Character.isIdentifierIgnorable(ch);
    }

    /** Expected "identifier start" answer for a code point, via the int overloads. */
    private static boolean expectedStartForCodePoint(int cp) {
        if (UNASSIGNED_CODEPOINTS_IN_6_2.contains(cp)) {
            return false;
        }
        int type = Character.getType(cp);
        return Character.isLetter(cp)
                || type == Character.LETTER_NUMBER
                || type == Character.CURRENCY_SYMBOL
                || type == Character.CONNECTOR_PUNCTUATION;
    }

    /** Expected "identifier start" answer for a char, via the char overloads. */
    private static boolean expectedStartForChar(char ch) {
        // Widen to int before the lookup; see expectedPartForChar.
        if (UNASSIGNED_CODEPOINTS_IN_6_2.contains((int) ch)) {
            return false;
        }
        int type = Character.getType(ch);
        return Character.isLetter(ch)
                || type == Character.LETTER_NUMBER
                || type == Character.CURRENCY_SYMBOL
                || type == Character.CONNECTOR_PUNCTUATION;
    }

    /**
     * Throws if the method under test disagrees with the expectation.
     *
     * @param method    display name of the method under test, used as the
     *                  prefix of the failure message
     * @param codePoint value being checked, reported in hexadecimal
     * @param actual    result returned by the method under test
     * @param expected  result derived from the Character query methods
     * @throws RuntimeException if {@code actual != expected}
     */
    private static void verify(String method, int codePoint,
                               boolean actual, boolean expected) {
        if (actual != expected) {
            throw new RuntimeException(
                    method + " failed for codepoint "
                    + Integer.toHexString(codePoint));
        }
    }
}
|