/* * Copyright 2008 Sun Microsystems, Inc. All Rights Reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it * under the terms of the GNU General Public License version 2 only, as * published by the Free Software Foundation. * * This code is distributed in the hope that it will be useful, but WITHOUT * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License * version 2 for more details (a copy is included in the LICENSE file that * accompanied this code). * * You should have received a copy of the GNU General Public License version * 2 along with this work; if not, write to the Free Software Foundation, * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. * * Please contact Sun Microsystems, Inc., 4150 Network Circle, Santa Clara, * CA 95054 USA or visit www.sun.com if you need additional information or * have any questions. */ /* @bug 6346419 @summary Check correctness of the UTF-32 and its variant charsets */ import java.io.*; import java.nio.*; import java.nio.charset.*; public class TestUTF_32 { private static void testDecode(String charset, String expected, byte[] input) throws Exception { String out = new String(input, charset); if (!out.equals(expected)) { failureReport (out, expected); throw new Exception("UTF_32 Decoding test failed: " + charset); } } private static void testEncode(String charset, String input, byte[] expected) throws Exception { byte[] testBytes = input.getBytes(charset); for (int i = 0; i< expected.length; i++) if (testBytes[i] != expected[i]) throw new Exception("UTF_32 Encoding test failed: [" + i + "]"+ charset); } private static void warn(String s) { System.err.println("FAILED Test UTF-32:" + s) ; } private static void failureReport(String testStr, String expected) { System.err.println ("Expected Characters:"); for (int i = 0; i < expected.length() ; i++) { warn("expected char[" + i + "] : " + Integer.toHexString((int)expected.charAt(i)) + "obtained char[" + i + "] : " + Integer.toHexString((int)testStr.charAt(i))); } } private static void writeInt(OutputStream os, int i, boolean isBig) throws Exception { if (isBig) { os.write((i>>24) & 0xff); os.write((i>>16) & 0xff); os.write((i>>8) & 0xff); os.write(i & 0xff); } else { os.write(i & 0xff); os.write((i>>8) & 0xff); os.write((i>>16) & 0xff); os.write((i>>24) & 0xff); } } private static byte[] getBytes(boolean doBOM, boolean isBig) throws Exception { ByteArrayOutputStream baos = new ByteArrayOutputStream(1024*1024); if (doBOM) writeInt(baos, 0xfeff, isBig); for (int i = 0; i < 0xffff; i++) { if (i < Character.MIN_SURROGATE || i > Character.MAX_SURROGATE) writeInt(baos, i, isBig); } for (int i = 0x10000; i < 0x1ffff; i++) { writeInt(baos, i, isBig); } for (int i = 0x100000; i < 0x10ffff; i++) { writeInt(baos, i, isBig); } byte[] bb = baos.toByteArray(); baos.close(); return bb; } public static void main (String[] args) throws Exception { byte[] bb; String s; // Test 1: UTF_32 BigEndian bb = getBytes(false, true); s = new String(bb, "UTF-32"); testDecode("UTF_32", s, bb); testEncode("UTF_32", s, bb); // Test 2: UTF_32 LittleEndian Decoding With BOM and // BigEndian Encoding bb = getBytes(true, false); s = new String(bb, "UTF-32"); bb = getBytes(false, true); testDecode("UTF_32", s, bb); testEncode("UTF_32", s, bb); // Test 3: UTF_32BE bb = getBytes(false, true); s = new String(bb, "UTF-32BE"); testDecode("UTF_32BE", s, bb); testEncode("UTF_32BE", s, bb); // Test 4: UTF_32LE bb = getBytes(false, false); s = new String(bb, "UTF-32LE"); testDecode("UTF_32LE", s, bb); testEncode("UTF_32LE", s, bb); // Test 5: UTF_32BE_BOM bb = getBytes(true, true); s = new String(bb, "UTF-32BE-BOM"); testDecode("UTF_32BE_BOM", s, bb); testEncode("UTF_32BE_BOM", s, bb); // Test 6: UTF_32LE_BOM bb = getBytes(true, false); s = new String(bb, "UTF-32LE-BOM"); testDecode("UTF_32LE_BOM", s, bb); testEncode("UTF_32LE_BOM", s, bb); s = "\u4e00\ufffd\u4e01"; // Test 7: BigEndian with reverse BOM in middle bb = new byte[] { (byte)0x00,(byte)0x00,(byte)0x4e,(byte)0x00, (byte)0xff,(byte)0xfe,(byte)0x00,(byte)0x00, (byte)0x00,(byte)0x00,(byte)0x4e,(byte)0x01 }; if (!s.equals(new String(bb, "UTF_32")) || !s.equals(new String(bb, "UTF_32BE")) || !s.equals(new String(bb, "UTF_32BE_BOM"))) throw new Exception("UTF_32 Decoding test failed: "); // Test 7: LittleEndian with reverse BOM in middle bb = new byte[] { (byte)0xff,(byte)0xfe,(byte)0x00,(byte)0x00, (byte)0x00,(byte)0x4e,(byte)0x00,(byte)0x00, (byte)0x00,(byte)0x00,(byte)0xfe,(byte)0xff, (byte)0x01,(byte)0x4e,(byte)0x00,(byte)0x00 }; if (!s.equals(new String(bb, "UTF_32")) || !s.equals(new String(bb, "UTF_32LE")) || !s.equals(new String(bb, "UTF_32LE_BOM"))) throw new Exception("UTF_32 Decoding test failed: "); // Test 8: Overflow if (CoderResult.OVERFLOW != Charset.forName("UTF_32") .newDecoder() .decode((ByteBuffer)(ByteBuffer.allocate(4) .put(new byte[] {(byte)0,(byte)1, (byte)0,(byte)01}) .flip()), CharBuffer.allocate(1), true)) { throw new Exception ("Test UTF-32 Overflow test failed"); } System.err.println ("OVERALL PASS OF UTF-32 Test"); } }