/* * Copyright (c) 2007, 2012, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it * under the terms of the GNU General Public License version 2 only, as * published by the Free Software Foundation. * * This code is distributed in the hope that it will be useful, but WITHOUT * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License * version 2 for more details (a copy is included in the LICENSE file that * accompanied this code). * * You should have received a copy of the GNU General Public License version * 2 along with this work; if not, write to the Free Software Foundation, * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. * * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA * or visit www.oracle.com if you need additional information or have any * questions. */ /* * @test * @bug 5030265 * @compile -XDignore.symbol.file UnicodeTest.java * @run main/othervm UnicodeTest * @summary Verify that the J2RE can handle all legal Unicode characters * in class names unless limited by the file system encoding * or the encoding used for command line arguments. * @author Norbert Lindenberg, ksrini */ /* * This class creates Java source files using Unicode characters * that test the limits of what's possible * - in situations where the platform encoding imposes limits * (command line arguments, non-Unicode file system) * - in situations where full Unicode is supported * (file system access in UTF-8 locales and on Windows 2000++, * jar file contents) * * This test needs to be run in othervm as the locale is reset. */ import java.io.File; import java.io.FileOutputStream; import java.io.OutputStreamWriter; import java.nio.charset.Charset; import java.util.Locale; public class UnicodeTest extends TestHelper { static final File UnicodeTestSrc = new File("UnicodeTest-src"); static final File UnicodeTestClasses = new File("UnicodeTest-classes"); static final String UnicodeTestJarName = "UnicodeTest" + JAR_FILE_EXT; static final File UnicodeTestJar = new File(UnicodeTestJarName); static final File SolarisUnicodeTestJar = new File(TEST_SOURCES_DIR, UnicodeTestJarName); /* * the main method is a port of the shell based test to a java, this * eliminates the need for MKS on windows, thus we can rely on consistent * results regardless of the shell being used. */ public static void main(String... args) throws Exception { System.out.println("creating test source files"); UnicodeTestSrc.mkdirs(); UnicodeTestClasses.mkdirs(); String classname = generateSources(); File javaFile = new File(UnicodeTestSrc, classname + JAVA_FILE_EXT); System.out.println("building test apps"); compile("-encoding", "UTF-8", "-sourcepath", UnicodeTestSrc.getAbsolutePath(), "-d", UnicodeTestClasses.getAbsolutePath(), javaFile.getAbsolutePath()); createJar("-cvfm", UnicodeTestJar.getAbsolutePath(), new File(UnicodeTestSrc, "MANIFEST.MF").getAbsolutePath(), "-C", UnicodeTestClasses.getAbsolutePath(), "."); if (!UnicodeTestJar.exists()) { throw new Error("failed to create " + UnicodeTestJar.getAbsolutePath()); } System.out.println("running test app using class file"); TestResult tr = doExec(javaCmd, "-cp", UnicodeTestClasses.getAbsolutePath(), classname); if (!tr.isOK()) { System.out.println(tr); throw new RuntimeException("test fails"); } System.out.println("delete generated files with non-ASCII names"); recursiveDelete(UnicodeTestSrc); recursiveDelete(UnicodeTestClasses); /* * test in whatever the default locale is */ runJarTests(); /* * if the Japanese locale is available, test in that locale as well */ if (setLocale(Locale.JAPANESE)) { runJarTests(); } /* * if we can switch to a C locale, then test whether jar files with * non-ASCII characters in the manifest still work in this crippled * environment */ if (setLocale(Locale.ENGLISH)) { runJarTests(); } // thats it we are outta here } static void runJarTests() { System.out.println("running test app using newly built jar file in " + Locale.getDefault()); runTest(UnicodeTestJar); System.out.println("running test app using jar file " + "(built with Solaris UTF-8 locale) in " + Locale.getDefault()); runTest(SolarisUnicodeTestJar); } static void runTest(File testJar) { TestResult tr = doExec(javaCmd, "-jar", testJar.getAbsolutePath()); if (!tr.isOK()) { System.out.println(tr); throw new RuntimeException("test fails"); } } static boolean setLocale(Locale desired) { if (Locale.getDefault().equals(desired)) { return true; // already set nothing more } for (Locale l : Locale.getAvailableLocales()) { if (l == desired) { Locale.setDefault(l); return true; } } return false; } static String generateSources() throws Exception { String commandLineClassNameSuffix = commandLineClassNameSuffix(); String commandLineClassName = "ClassA" + commandLineClassNameSuffix; String manifestClassName = "ClassB" + (hasUnicodeFileSystem() ? unicode : commandLineClassNameSuffix); generateSource(commandLineClassName, manifestClassName); generateSource(manifestClassName, commandLineClassName); generateManifest(manifestClassName); return commandLineClassName; } private static final String defaultEncoding = Charset.defaultCharset().name(); // language names taken from java.util.Locale.getDisplayLanguage for the respective language private static final String arabic = "\u0627\u0644\u0639\u0631\u0628\u064a\u0629"; private static final String s_chinese = "\u4e2d\u6587"; private static final String t_chinese = "\u4e2d\u6587"; private static final String russian = "\u0440\u0443\u0441\u0441\u043A\u0438\u0439"; private static final String hindi = "\u0939\u093f\u0902\u0926\u0940"; private static final String greek = "\u03b5\u03bb\u03bb\u03b7\u03bd\u03b9\u03ba\u03ac"; private static final String hebrew = "\u05e2\u05d1\u05e8\u05d9\u05ea"; private static final String japanese = "\u65e5\u672c\u8a9e"; private static final String korean = "\ud55c\uad6d\uc5b4"; private static final String lithuanian = "Lietuvi\u0173"; private static final String czech = "\u010de\u0161tina"; private static final String turkish = "T\u00fcrk\u00e7e"; private static final String spanish = "espa\u00f1ol"; private static final String thai = "\u0e44\u0e17\u0e22"; private static final String unicode = arabic + s_chinese + t_chinese + russian + hindi + greek + hebrew + japanese + korean + lithuanian + czech + turkish + spanish + thai; private static String commandLineClassNameSuffix() { // Mapping from main platform encodings to language names // for Unix and Windows, respectively. Use empty suffix // for Windows encodings where OEM encoding differs. // Use null if encoding isn't used. String[][] names = { { "UTF-8", unicode, "" }, { "windows-1256", null, "" }, { "iso-8859-6", arabic, null }, { "GBK", s_chinese, s_chinese }, { "GB18030", s_chinese, s_chinese }, { "GB2312", s_chinese, null }, { "x-windows-950", null, t_chinese }, { "x-MS950-HKSCS", null, t_chinese }, { "x-euc-tw", t_chinese, null }, { "Big5", t_chinese, null }, { "Big5-HKSCS", t_chinese, null }, { "windows-1251", null, "" }, { "iso-8859-5", russian, null }, { "koi8-r", russian, null }, { "windows-1253", null, "" }, { "iso-8859-7", greek, null }, { "windows-1255", null, "" }, { "iso8859-8", hebrew, null }, { "windows-31j", null, japanese }, { "x-eucJP-Open", japanese, null }, { "x-EUC-JP-LINUX", japanese, null }, { "x-pck", japanese, null }, { "x-windows-949", null, korean }, { "euc-kr", korean, null }, { "windows-1257", null, "" }, { "iso-8859-13", lithuanian, null }, { "windows-1250", null, "" }, { "iso-8859-2", czech, null }, { "windows-1254", null, "" }, { "iso-8859-9", turkish, null }, { "windows-1252", null, "" }, { "iso-8859-1", spanish, null }, { "iso-8859-15", spanish, null }, { "x-windows-874", null, thai }, { "tis-620", thai, null }, }; int column = isWindows ? 2 : 1; for (int i = 0; i < names.length; i++) { if (names[i][0].equalsIgnoreCase(defaultEncoding)) { return names[i][column]; } } return ""; } private static boolean hasUnicodeFileSystem() { return (isWindows) ? true : defaultEncoding.equalsIgnoreCase("UTF-8"); } private static void generateSource(String thisClass, String otherClass) throws Exception { File file = new File(UnicodeTestSrc, thisClass + JAVA_FILE_EXT); OutputStreamWriter out = new OutputStreamWriter(new FileOutputStream(file), "UTF-8"); out.write("public class " + thisClass + " {\n"); out.write(" public static void main(String[] args) {\n"); out.write(" if (!" + otherClass + "." + otherClass.toLowerCase() + "().equals(\"" + otherClass + "\")) {\n"); out.write(" throw new RuntimeException();\n"); out.write(" }\n"); out.write(" }\n"); out.write(" public static String " + thisClass.toLowerCase() + "() {\n"); out.write(" return \"" + thisClass + "\";\n"); out.write(" }\n"); out.write("}\n"); out.close(); } private static void generateManifest(String mainClass) throws Exception { File file = new File(UnicodeTestSrc, "MANIFEST.MF"); FileOutputStream out = new FileOutputStream(file); out.write("Manifest-Version: 1.0\n".getBytes("UTF-8")); // Header lines are limited to 72 bytes. // The manifest spec doesn't say we have to break at character boundaries, // so we rudely break at byte boundaries. byte[] headerBytes = ("Main-Class: " + mainClass + "\n").getBytes("UTF-8"); if (headerBytes.length <= 72) { out.write(headerBytes); } else { out.write(headerBytes, 0, 72); int start = 72; while (headerBytes.length > start) { out.write((byte) '\n'); out.write((byte) ' '); int count = Math.min(71, headerBytes.length - start); out.write(headerBytes, start, count); start += count; } } out.close(); } }