New test/java/lang/String/ToUpperCase.java

   1 /*
   2  * Copyright (c) 2000, 2003, Oracle and/or its affiliates. All rights reserved.
   3  * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
   4  *
   5  * This code is free software; you can redistribute it and/or modify it
   6  * under the terms of the GNU General Public License version 2 only, as
   7  * published by the Free Software Foundation.
   8  *
   9  * This code is distributed in the hope that it will be useful, but WITHOUT
  10  * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  11  * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  12  * version 2 for more details (a copy is included in the LICENSE file that
  13  * accompanied this code).
  14  *
  15  * You should have received a copy of the GNU General Public License version
  16  * 2 along with this work; if not, write to the Free Software Foundation,
  17  * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
  18  *
  19  * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
  20  * or visit www.oracle.com if you need additional information or have any
  21  * questions.
  22  */
  23 
  24 /*
  25     @test
  26     @bug 4219630 4304573 4533872 4900935 8042589 8054307
  27     @summary toUpperCase should upper-case German sharp s correctly even if
  28              it's the only character in the string. should also uppercase
  29              all of the 1:M char mappings correctly.  Also it should handle
  30              Locale specific (lt, tr, and az) uppercasings and supplementary
  31              characters correctly.
  32 */
  33 
  34 import java.util.Locale;
  35 
  36 public class ToUpperCase {
  37 
  38     public static void main(String[] args) {
  39         Locale turkish = new Locale("tr", "TR");
  40         Locale lt = new Locale("lt"); // Lithanian
  41         Locale az = new Locale("az"); // Azeri
  42 
  43         test("\u00DF", turkish, "SS");
  44         test("a\u00DF", turkish, "ASS");
  45         test("i", turkish, "\u0130");
  46         test("i", az, "\u0130");
  47         test("\u0131", turkish, "I");
  48         test("\u00DF", Locale.GERMANY, "SS");
  49         test("a\u00DF", Locale.GERMANY, "ASS");
  50         test("i", Locale.GERMANY, "I");
  51 
  52         // test some of the 1:M uppercase mappings
  53         test("abc\u00DF", Locale.US, "ABC\u0053\u0053");
  54         test("\u0149abc", Locale.US, "\u02BC\u004EABC");
  55         test("\u0149abc", turkish, "\u02BC\u004EABC");
  56         test("\u1F52", Locale.US, "\u03A5\u0313\u0300");
  57         test("\u0149\u1F52", Locale.US, "\u02BC\u004E\u03A5\u0313\u0300");
  58         test("\u1F54ZZZ", Locale.US, "\u03A5\u0313\u0301ZZZ");
  59         test("\u1F54ZZZ", turkish, "\u03A5\u0313\u0301ZZZ");
  60         test("a\u00DF\u1F56", Locale.US, "ASS\u03A5\u0313\u0342");
  61         test("\u1FAD", turkish, "\u1F6D\u0399");
  62         test("i\u1FC7", turkish, "\u0130\u0397\u0342\u0399");
  63         test("i\u1FC7", az, "\u0130\u0397\u0342\u0399");
  64         test("i\u1FC7", Locale.US, "I\u0397\u0342\u0399");
  65         test("\uFB04", Locale.US, "\u0046\u0046\u004C");
  66         test("\uFB17AbCdEfi", turkish, "\u0544\u053DABCDEF\u0130");
  67         test("\uFB17AbCdEfi", az, "\u0544\u053DABCDEF\u0130");
  68 
  69         // Remove DOT ABOVE after "i" in Lithuanian
  70         test("i\u0307", lt, "I");
  71         test("\u0307", lt, "\u0307");
  72         test("\u0307i", lt, "\u0307I");
  73         test("j\u0307", lt, "J");
  74         test("abci\u0307def", lt, "ABCIDEF");
  75         test("a\u0307", lt, "A\u0307");
  76         test("abc\u0307def", lt, "ABC\u0307DEF");
  77         test("i\u0307", Locale.US, "I\u0307");
  78         test("i\u0307", turkish, "\u0130\u0307");
  79 
  80         // Supplementary character tests
  81         //
  82         // U+10400 ("\uD801\uDC00"): DESERET CAPITAL LETTER LONG I
  83         // U+10401 ("\uD801\uDC01"): DESERET CAPITAL LETTER LONG E
  84         // U+10402 ("\uD801\uDC02"): DESERET CAPITAL LETTER LONG A
  85         // U+10428 ("\uD801\uDC28"): DESERET SMALL LETTER LONG I
  86         // U+10429 ("\uD801\uDC29"): DESERET SMALL LETTER LONG E
  87         // U+1042A ("\uD801\uDC2A"): DESERET SMALL LETTER LONG A
  88         //
  89         // valid code point tests:
  90         test("\uD801\uDC28\uD801\uDC29\uD801\uDC2A", Locale.US, "\uD801\uDC00\uD801\uDC01\uD801\uDC02");
  91         test("\uD801\uDC28a\uD801\uDC29b\uD801\uDC2Ac", Locale.US, "\uD801\uDC00A\uD801\uDC01B\uD801\uDC02C");
  92         // invalid code point tests:
  93         test("\uD800\uD800\uD801a\uDC00\uDC00\uDC00b", Locale.US, "\uD800\uD800\uD801A\uDC00\uDC00\uDC00B");
  94 
  95         // lower/uppercase + surrogates
  96         test("a\uD801\uDC44", Locale.ROOT, "A\uD801\uDC1c");
  97         test("A\uD801\uDC44", Locale.ROOT, "A\uD801\uDC1c");
  98         test("a\uD801\uDC28\uD801\uDC29\uD801\uDC2A", Locale.US, "A\uD801\uDC00\uD801\uDC01\uD801\uDC02");
  99         test("A\uD801\uDC28a\uD801\uDC29b\uD801\uDC2Ac", Locale.US, "A\uD801\uDC00A\uD801\uDC01B\uD801\uDC02C");
 100 
 101         // test latin1 only case
 102         StringBuilder src = new StringBuilder(0x100);
 103         StringBuilder exp = new StringBuilder(0x100);
 104         for (int cp = 0; cp < 0x100; cp++) {
 105             int upperCase = Character.toUpperCase(cp);
 106             if (upperCase == -1) {    //Character.ERROR
 107                 continue;
 108             }
 109             src.appendCodePoint(cp);
 110             if (cp == '\u00df') {
 111                 exp.append("SS");     // need Character.toUpperCaseEx()
 112             } else {
 113                 exp.appendCodePoint(upperCase);
 114             }
 115         }
 116         test(src.toString(), Locale.US, exp.toString());
 117 
 118         // test non-latin1 -> latin1
 119         src = new StringBuilder(0x100).append("ABC");
 120         exp = new StringBuilder(0x100).append("ABC");
 121         for (int cp = 0x100; cp < 0x10000; cp++) {
 122             int upperCase  = Character.toUpperCase(cp);
 123             if (upperCase < 0x100) {
 124                 src.appendCodePoint(cp);
 125                 exp.appendCodePoint(upperCase);
 126             }
 127         }
 128         test(src.toString(), Locale.US, exp.toString());
 129 
 130     }
 131 
 132     static void test(String in, Locale locale, String expected) {
 133         test0(in, locale,expected);
 134         // trigger different code paths
 135         for (String[] ss :  new String[][] {
 136                                 new String[] {"abc",      "ABC"},
 137                                 new String[] {"AbC",      "ABC"},
 138                                 new String[] {"ABC",      "ABC"},
 139                                 new String[] {"AB\u4e00", "AB\u4e00"},
 140                                 new String[] {"ab\u4e00", "AB\u4e00"},
 141                                 new String[] {"aB\u4e00", "AB\u4e00"},
 142                                 new String[] {"AB\uD800\uDC00", "AB\uD800\uDC00"},
 143                                 new String[] {"Ab\uD800\uDC00", "AB\uD800\uDC00"},
 144                                 new String[] {"ab\uD800\uDC00", "AB\uD800\uDC00"},
 145                                 new String[] {"AB\uD801\uDC44", "AB\uD801\uDC1C"},
 146                                 new String[] {"Ab\uD801\uDC44", "AB\uD801\uDC1C"},
 147                                 new String[] {"ab\uD801\uDC44", "AB\uD801\uDC1C"},
 148                             }) {
 149             test0(ss[0] + " " + in, locale, ss[1] + " " + expected);
 150             test0(in + " " + ss[0], locale, expected + " " + ss[1]);
 151         }
 152     }
 153 
 154     static void test0(String in, Locale locale, String expected) {
 155         String result = in.toUpperCase(locale);
 156         if (!result.equals(expected)) {
 157             System.err.println("input: " + in + ", locale: " + locale +
 158                     ", expected: " + expected + ", actual: " + result);
 159             throw new RuntimeException();
 160         }
 161     }
 162 }