TestUTF_32.java example

Explorer
openjdk-master
/*
 * Copyright (c) 2008, Oracle and/or its affiliates. All rights reserved.
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
 *
 * This code is free software; you can redistribute it and/or modify it
 * under the terms of the GNU General Public License version 2 only, as
 * published by the Free Software Foundation.
 *
 * This code is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
 * version 2 for more details (a copy is included in the LICENSE file that
 * accompanied this code).
 *
 * You should have received a copy of the GNU General Public License version
 * 2 along with this work; if not, write to the Free Software Foundation,
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
 *
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
 * or visit www.oracle.com if you need additional information or have any
 * questions.
 */

/*
   @bug 6346419
   @summary Check correctness of the UTF-32 and its variant charsets
 */

import java.io.*;
import java.nio.*;
import java.nio.charset.*;

public class TestUTF_32 {
    private static void testDecode(String charset,
                                   String expected,
                                   byte[] input)
        throws Exception
    {
        String out = new String(input, charset);
        if (!out.equals(expected)) {
            failureReport (out, expected);
            throw new Exception("UTF_32 Decoding test failed: " + charset);
        }
    }

    private static void testEncode(String charset,
                                   String input,
                                   byte[] expected)
        throws Exception
    {
        byte[] testBytes = input.getBytes(charset);
        for (int i = 0; i< expected.length; i++)
            if (testBytes[i] != expected[i])
                throw new Exception("UTF_32 Encoding test failed: [" + i + "]"+ charset);

    }

    private static void warn(String s) {
        System.err.println("FAILED Test UTF-32:" +
                            s) ;
    }

    private static void failureReport(String testStr,
                                      String expected) {
        System.err.println ("Expected Characters:");
        for (int i = 0; i < expected.length() ; i++) {
            warn("expected char[" + i + "] : " +
                  Integer.toHexString((int)expected.charAt(i)) +
                 "obtained char[" + i + "] : " +
                  Integer.toHexString((int)testStr.charAt(i)));
        }
    }

    private static void writeInt(OutputStream os, int i, boolean isBig)
        throws Exception
    {
        if (isBig) {
            os.write((i>>24) & 0xff);
            os.write((i>>16) & 0xff);
            os.write((i>>8) & 0xff);
            os.write(i & 0xff);
        } else {
            os.write(i & 0xff);
            os.write((i>>8) & 0xff);
            os.write((i>>16) & 0xff);
            os.write((i>>24) & 0xff);
        }
    }

    private static byte[] getBytes(boolean doBOM, boolean isBig)
        throws Exception
    {
        ByteArrayOutputStream baos = new ByteArrayOutputStream(1024*1024);
        if (doBOM)
           writeInt(baos, 0xfeff, isBig);

        for (int i = 0; i < 0xffff; i++) {
            if (i < Character.MIN_SURROGATE ||
                i > Character.MAX_SURROGATE)
            writeInt(baos, i, isBig);
        }
        for (int i = 0x10000; i < 0x1ffff; i++) {
            writeInt(baos, i, isBig);
        }

        for (int i = 0x100000; i < 0x10ffff; i++) {
            writeInt(baos, i, isBig);
        }
        byte[] bb = baos.toByteArray();
        baos.close();
        return bb;
    }

    public static void main (String[] args) throws Exception {
        byte[] bb;
        String s;

        // Test 1: UTF_32 BigEndian
        bb = getBytes(false, true);
        s = new String(bb, "UTF-32");
        testDecode("UTF_32", s, bb);
        testEncode("UTF_32", s, bb);

        // Test 2: UTF_32 LittleEndian Decoding With BOM and
        //         BigEndian Encoding
        bb = getBytes(true, false);
        s = new String(bb, "UTF-32");
        bb = getBytes(false, true);
        testDecode("UTF_32", s, bb);
        testEncode("UTF_32", s, bb);


        // Test 3: UTF_32BE
        bb = getBytes(false, true);
        s = new String(bb, "UTF-32BE");
        testDecode("UTF_32BE", s, bb);
        testEncode("UTF_32BE", s, bb);


        // Test 4: UTF_32LE
        bb = getBytes(false, false);
        s = new String(bb, "UTF-32LE");
        testDecode("UTF_32LE", s, bb);
        testEncode("UTF_32LE", s, bb);

        // Test 5: UTF_32BE_BOM
        bb = getBytes(true, true);
        s = new String(bb, "UTF-32BE-BOM");
        testDecode("UTF_32BE_BOM", s, bb);
        testEncode("UTF_32BE_BOM", s, bb);


        // Test 6: UTF_32LE_BOM
        bb = getBytes(true, false);
        s = new String(bb, "UTF-32LE-BOM");
        testDecode("UTF_32LE_BOM", s, bb);
        testEncode("UTF_32LE_BOM", s, bb);

        s = "\u4e00\ufffd\u4e01";
        // Test 7: BigEndian with reverse BOM in middle
        bb = new byte[] {
            (byte)0x00,(byte)0x00,(byte)0x4e,(byte)0x00,
            (byte)0xff,(byte)0xfe,(byte)0x00,(byte)0x00,
            (byte)0x00,(byte)0x00,(byte)0x4e,(byte)0x01
        };
        if (!s.equals(new String(bb, "UTF_32")) ||
            !s.equals(new String(bb, "UTF_32BE")) ||
            !s.equals(new String(bb, "UTF_32BE_BOM")))
            throw new Exception("UTF_32 Decoding test failed: ");

        // Test 7: LittleEndian with reverse BOM in middle
        bb = new byte[] {
            (byte)0xff,(byte)0xfe,(byte)0x00,(byte)0x00,
            (byte)0x00,(byte)0x4e,(byte)0x00,(byte)0x00,
            (byte)0x00,(byte)0x00,(byte)0xfe,(byte)0xff,
            (byte)0x01,(byte)0x4e,(byte)0x00,(byte)0x00
        };
        if (!s.equals(new String(bb, "UTF_32")) ||
            !s.equals(new String(bb, "UTF_32LE")) ||
            !s.equals(new String(bb, "UTF_32LE_BOM")))
            throw new Exception("UTF_32 Decoding test failed: ");

        // Test 8: Overflow
        if (CoderResult.OVERFLOW !=
            Charset.forName("UTF_32")
            .newDecoder()
            .decode((ByteBuffer.allocate(4)
                                 .put(new byte[]
                                      {(byte)0,(byte)1, (byte)0,(byte)01})
                                 .flip()),
                    CharBuffer.allocate(1),
                    true)) {
            throw new Exception ("Test UTF-32 Overflow test failed");
        }
        System.err.println ("OVERALL PASS OF UTF-32 Test");
    }
}