aboutsummaryrefslogtreecommitdiff
path: root/libjava/java/lang/natCharacter.cc
diff options
context:
space:
mode:
author: Anthony Balkissoon <abalkiss@redhat.com> 2006-03-28 16:12:52 +0000
committer: Anthony Balkissoon <abalkiss@gcc.gnu.org> 2006-03-28 16:12:52 +0000
commit: 792617a52abfb67c52c6bec3a431fdc193773786 (patch)
tree: 33d3cdf25e29b600aa40340320a592051654c632 /libjava/java/lang/natCharacter.cc
parent: 72922229b7431aac7f5ac3d207a017473dccce4d (diff)
download: gcc-792617a52abfb67c52c6bec3a431fdc193773786.zip
download: gcc-792617a52abfb67c52c6bec3a431fdc193773786.tar.gz
download: gcc-792617a52abfb67c52c6bec3a431fdc193773786.tar.bz2
unicode-muncher.pl: Removed this file.
2006-03-28  Anthony Balkissoon  <abalkiss@redhat.com>

	* scripts/unicode-muncher.pl: Removed this file.
	* scripts/MakeCharTables.java: Likewise.
	* scripts/unicode-to-chartables.pl: New file.
	* java/lang/natCharacter.cc:
	(UNASSIGNED_TYPE): New field.
	(UNASSIGNED_DIGIT): Likewise.
	(UNASSIGNED_DIRECTION): Likewise.
	(UNASSIGNED_NUMERIC_VALUE): Likewise.
	(PRIVATE_TYPE): Likewise.
	(PRIVATE_DIRECTION): Likewise.
	(readCodePoint): New method.
	(getType(jint)): Likewise.
	(toLowerCase(jint)): Likewise.
	(toUpperCase(jint)): Likewise.
	(toTitleCase(jint)): Likewise.
	(digit(jint, jint)): Likewise.
	(getNumericValue(jint)): Likewise.
	(getDirectionality(jint)): Likewise.
	(readChar), (getType(jchar)), (toLowerCase(jchar)),
	(toUpperCase(jchar)), (toTitleCase(jchar)), (digit(jchar, jint)),
	(getNumericValue(jchar)), (getDirectionality(jchar)): Changed
	references from data to data[0], blocks to blocks[0], direction to
	direction[0], numValue to numValue[0], upper to upper[0], lower to
	lower[0], and SHIFT to shift[0] to reflect the new structures in
	java-chartables.h.
	* java/lang/Character.java:
	(readCodePoint): Declared new native method.
	(getType(int)): Likewise.
	(toLowerCase(int)): Likewise.
	(toUpperCase(int)): Likewise.
	(toTitleCase(int)): Likewise.
	(digit(int, int)): Likewise.
	(getNumericValue(int)): Likewise.
	(getDirectionality(int)): Likewise.
	(isLowerCase(int)): New method.
	(isUpperCase(int)): Likewise.
	(isTitleCase(int)): Likewise.
	(isDigit(int)): Likewise.
	(isDefined(int)): Likewise.
	(isLetter(int)): Likewise.
	(isLetterOrDigit(int)): Likewise.
	(isJavaIdentifierStart(int)): Likewise.
	(isJavaIdentifierPart(int)): Likewise.
	(isUnicodeIdentifierStart(int)): Likewise.
	(isUnicodeIdentifierPart(int)): Likewise.
	(isIdentifierIgnorable(int)): Likewise.
	(isSpaceChar(int)): Likewise.
	(isWhitespace(int)): Likewise.
	(isISOControl(int)): Likewise.
	(isMirrored(int)): Likewise.
	* include/java-chartables.h: Generated from
	scripts/unicode-to-chartables.pl.

From-SVN: r112454
Diffstat (limited to 'libjava/java/lang/natCharacter.cc')
-rw-r--r-- libjava/java/lang/natCharacter.cc 138
1 files changed, 131 insertions, 7 deletions
diff --git a/libjava/java/lang/natCharacter.cc b/libjava/java/lang/natCharacter.cc
index e9362fe..8d246dd 100644
--- a/libjava/java/lang/natCharacter.cc
+++ b/libjava/java/lang/natCharacter.cc
@@ -45,30 +45,91 @@ exception statement from your version. */
+// These constants define the return values for characters that are unassigned
+// or reserved for private use.
+#define UNASSIGNED_TYPE 0
+#define UNASSIGNED_DIGIT -1
+#define UNASSIGNED_DIRECTION -1
+#define UNASSIGNED_NUMERIC_VALUE -1
+
+#define PRIVATE_TYPE 18
+#define PRIVATE_DIRECTION 0
+
+// The methods that take a char as an argument all have counterparts that
+// take ints. The char versions only work for the BMP (plane 0 of the
+// Unicode standard), whereas the int versions work for all Unicode code
+// points. The char versions nevertheless do not simply redirect to the int
+// versions: the BMP is by far the most used plane, so saving a little time
+// on each call makes sense.
+
jchar
java::lang::Character::readChar(jchar ch)
{
// Perform 16-bit addition to find the correct entry in data.
- return data[(jchar) (blocks[ch >> SHIFT] + ch)];
+ return data[0][(jchar) (blocks[0][ch >> shift[0]] + ch)];
+}
+
+jchar
+java::lang::Character::readCodePoint(jint codePoint)
+{
+ jint plane = codePoint >> 16;
+ jchar offset = (jchar)(codePoint & 0xffff);
+ // Callers must only pass code points in planes 0, 1, 2 or 14 (the only planes
+ // with assigned characters as of Unicode 4.0.0); the plane is not checked here.
+ return data[plane][(jchar) (blocks[plane][offset >> shift[plane]] + offset)];
}
jint
java::lang::Character::getType(jchar ch)
{
// Perform 16-bit addition to find the correct entry in data.
- return (jint) (data[(jchar) (blocks[ch >> SHIFT] + ch)] & TYPE_MASK);
+ return (jint) (data[0][(jchar) (blocks[0][ch >> shift[0]] + ch)] & TYPE_MASK);
+}
+
+jint
+java::lang::Character::getType(jint codePoint)
+{
+ jint plane = codePoint >> 16;
+ if (plane > 2 && plane != 14)
+ {
+ if (plane > 14 && ((codePoint & 0xffff) < 0xfffe))
+ return (jint) PRIVATE_TYPE;
+ return (jint) UNASSIGNED_TYPE;
+ }
+ jint offset = codePoint & 0xffff;
+ return (jint)
+ (data[plane]
+ [(jchar) (blocks[plane][offset >> shift[plane]] + offset)] & TYPE_MASK);
}
jchar
java::lang::Character::toLowerCase(jchar ch)
{
- return (jchar) (ch + lower[readChar(ch) >> 7]);
+ return (jchar) (ch + lower[0][readChar(ch) >> 7]);
+}
+
+jint
+java::lang::Character::toLowerCase(jint codePoint)
+{
+ jint plane = codePoint >> 16;
+ if (plane > 2 && plane != 14)
+ return codePoint;
+ return (lower[plane][readCodePoint(codePoint) >> 7]) + codePoint;
}
jchar
java::lang::Character::toUpperCase(jchar ch)
{
- return (jchar) (ch + upper[readChar(ch) >> 7]);
+ return (jchar) (ch + upper[0][readChar(ch) >> 7]);
+}
+
+jint
+java::lang::Character::toUpperCase(jint codePoint)
+{
+ jint plane = codePoint >> 16;
+ if (plane > 2 && plane != 14)
+ return codePoint;
+ return (upper[plane][readCodePoint(codePoint) >> 7]) + codePoint;
}
jchar
@@ -82,6 +143,16 @@ java::lang::Character::toTitleCase(jchar ch)
}
jint
+java::lang::Character::toTitleCase(jint codePoint)
+{
+ // As of Unicode 4.0.0 no characters outside of plane 0 have titlecase
+ // mappings that are different from their uppercase mapping.
+ if (codePoint < 0x10000)
+ return toTitleCase((jchar)codePoint);
+ return toUpperCase(codePoint);
+}
+
+jint
java::lang::Character::digit(jchar ch, jint radix)
{
if (radix < MIN_RADIX || radix > MAX_RADIX)
@@ -93,21 +164,74 @@ java::lang::Character::digit(jchar ch, jint radix)
| (1 << DECIMAL_DIGIT_NUMBER))))
{
// Signedness doesn't matter; 0xffff vs. -1 are both rejected.
- jint digit = (jint) numValue[attr >> 7];
+ jint digit = (jint) numValue[0][attr >> 7];
return (digit >= 0 && digit < radix) ? digit : (jint) -1;
}
return (jint) -1;
}
jint
+java::lang::Character::digit(jint codePoint, jint radix)
+{
+ if (radix < MIN_RADIX || radix > MAX_RADIX)
+ return (jint) -1;
+
+ jint plane = codePoint >> 16;
+ if (plane > 2 && plane != 14)
+ return UNASSIGNED_DIGIT;
+
+ jchar attr = readCodePoint(codePoint);
+ if (((1 << (attr & TYPE_MASK))
+ & ((1 << UPPERCASE_LETTER)
+ | (1 << LOWERCASE_LETTER)
+ | (1 << DECIMAL_DIGIT_NUMBER))))
+ {
+ // Signedness doesn't matter; 0xffff vs. -1 are both rejected.
+ jint digit = (jint) numValue[plane][attr >> 7];
+ if (digit <= -3)
+ digit = largenums[-digit -3];
+ return (digit >= 0 && digit < radix) ? digit : (jint) -1;
+ }
+ return (jint) -1;
+
+}
+
+jint
java::lang::Character::getNumericValue(jchar ch)
{
// numValue is stored as an array of jshort, since 10000 is the maximum.
- return (jint) numValue[readChar(ch) >> 7];
+ return (jint) numValue[0][readChar(ch) >> 7];
+}
+
+jint
+java::lang::Character::getNumericValue(jint codePoint)
+{
+ jint plane = codePoint >> 16;
+ if (plane > 2 && plane != 14)
+ return UNASSIGNED_NUMERIC_VALUE;
+ jshort num = numValue[plane][readCodePoint(codePoint) >> 7];
+ if (num <= -3)
+ return largenums[-num - 3];
+ return num;
}
jbyte
java::lang::Character::getDirectionality(jchar ch)
{
- return direction[readChar(ch) >> 7];
+ return direction[0][readChar(ch) >> 7];
}
+
+jbyte
+java::lang::Character::getDirectionality(jint codePoint)
+{
+ jint plane = codePoint >> 16;
+ if (plane > 2 && plane != 14)
+ {
+ if (plane > 14 && ((codePoint & 0xffff) < 0xfffe))
+ return (jint) PRIVATE_DIRECTION;
+ return (jint) UNASSIGNED_DIRECTION;
+ }
+ return direction[plane][readCodePoint(codePoint) >> 7];
+}
+
+