/* * Copyright (c) 2003, 2022, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it * under the terms of the GNU General Public License version 2 only, as * published by the Free Software Foundation. * * This code is distributed in the hope that it will be useful, but WITHOUT * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License * version 2 for more details (a copy is included in the LICENSE file that * accompanied this code). * * You should have received a copy of the GNU General Public License version * 2 along with this work; if not, write to the Free Software Foundation, * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. * * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA * or visit www.oracle.com if you need additional information or have any * questions.
*/
/*
    @test
    @bug 4217441 4533872 4900935 8020037 8032012 8041791 8042589 8054307
    @summary toLowerCase should lower-case Greek Sigma correctly depending
             on the context (final/non-final). Also it should handle
             Locale specific (lt, tr, and az) lowercasings and supplementary
             characters correctly.
*/
// Remove dot_above in the sequence I + dot_above (Turkish and Azeri)
test("I\u0307", turkish, "i");
test("I\u0307", az, "i");
test("J\u0307", turkish, "j\u0307");
test("J\u0307", az, "j\u0307");
// Unless an I is before a dot_above, it turns into a dotless i (Turkish and Azeri)
test("I", turkish, "\u0131");
test("I", az, "\u0131");
test("I", Locale.US, "i");
test("IABC", turkish, "\u0131abc");
test("IABC", az, "\u0131abc");
test("IABC", Locale.US, "iabc");
// Supplementary character tests
//
// U+10400 ("\uD801\uDC00"): DESERET CAPITAL LETTER LONG I
// U+10401 ("\uD801\uDC01"): DESERET CAPITAL LETTER LONG E
// U+10402 ("\uD801\uDC02"): DESERET CAPITAL LETTER LONG A
// U+10428 ("\uD801\uDC28"): DESERET SMALL LETTER LONG I
// U+10429 ("\uD801\uDC29"): DESERET SMALL LETTER LONG E
// U+1042A ("\uD801\uDC2A"): DESERET SMALL LETTER LONG A
//
// valid code point tests:
test("\uD801\uDC00\uD801\uDC01\uD801\uDC02", Locale.US, "\uD801\uDC28\uD801\uDC29\uD801\uDC2A");
test("\uD801\uDC00A\uD801\uDC01B\uD801\uDC02C", Locale.US, "\uD801\uDC28a\uD801\uDC29b\uD801\uDC2Ac"); // invalid code point tests:
test("\uD800\uD800\uD801A\uDC00\uDC00\uDC00B", Locale.US, "\uD800\uD800\uD801a\uDC00\uDC00\uDC00b");
// test bmp + supp1
StringBuilder src = new StringBuilder(0x20000);
StringBuilder exp = new StringBuilder(0x20000); for (int cp = 0; cp < 0x20000; cp++) { if (cp >= Character.MIN_HIGH_SURROGATE && cp <= Character.MAX_HIGH_SURROGATE) { continue;
} if (cp == 0x0130) { // Although UnicodeData.txt has the lower case char as \u0069, it should be // handled with the rules in SpecialCasing.txt, i.e., \u0069\u0307 in // non Turkic locales. continue;
} int lowerCase = Character.toLowerCase(cp); if (lowerCase == -1) { //Character.ERROR continue;
}
src.appendCodePoint(cp);
exp.appendCodePoint(lowerCase);
}
test(src.toString(), Locale.US, exp.toString());
// test latin1
src = new StringBuilder(0x100);
exp = new StringBuilder(0x100); for (int cp = 0; cp < 0x100; cp++) { int lowerCase = Character.toLowerCase(cp); if (lowerCase == -1) { //Character.ERROR continue;
}
src.appendCodePoint(cp);
exp.appendCodePoint(lowerCase);
}
test(src.toString(), Locale.US, exp.toString());
// test non-latin1 -> latin1
src = new StringBuilder(0x100).append("abc");
exp = new StringBuilder(0x100).append("abc"); for (int cp = 0x100; cp < 0x10000; cp++) { int lowerCase = Character.toLowerCase(cp); if (lowerCase < 0x100 && cp != '\u0130') {
src.appendCodePoint(cp);
exp.appendCodePoint(lowerCase);
}
}
test(src.toString(), Locale.US, exp.toString());
}
staticvoid test(String in, Locale locale, String expected) {
test0(in, locale,expected); for (String[] ss : new String[][] { new String[] {"abc", "abc"}, new String[] {"aBc", "abc"}, new String[] {"ABC", "abc"}, new String[] {"ab\u4e00", "ab\u4e00"}, new String[] {"aB\u4e00", "ab\u4e00"}, new String[] {"AB\u4e00", "ab\u4e00"}, new String[] {"ab\uD800\uDC00", "ab\uD800\uDC00"}, new String[] {"aB\uD800\uDC00", "ab\uD800\uDC00"}, new String[] {"AB\uD800\uDC00", "ab\uD800\uDC00"}, new String[] {"ab\uD801\uDC1C", "ab\uD801\uDC44"}, new String[] {"aB\uD801\uDC1C", "ab\uD801\uDC44"}, new String[] {"AB\uD801\uDC1C", "ab\uD801\uDC44"},
Die Informationen auf dieser Webseite wurden nach bestem Wissen sorgfältig
zusammengestellt. Es wird jedoch weder Vollständigkeit, noch Richtigkeit,
noch Qualität der bereitgestellten Informationen zugesichert.
Bemerkung:
Die farbliche Syntaxdarstellung ist noch experimentell.