/* * Copyright 2008 Sun Microsystems, Inc. All Rights Reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it * under the terms of the GNU General Public License version 2 only, as * published by the Free Software Foundation. * * This code is distributed in the hope that it will be useful, but WITHOUT * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License * version 2 for more details (a copy is included in the LICENSE file that * accompanied this code). * * You should have received a copy of the GNU General Public License version * 2 along with this work; if not, write to the Free Software Foundation, * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. * * Please contact Sun Microsystems, Inc., 4150 Network Circle, Santa Clara, * CA 95054 USA or visit www.sun.com if you need additional information or * have any questions. */ /* @test @bug 4779029 4924625 6392664 6730652 @summary Test decoding of various permutations of valid ISO-2022-CN byte sequences */ /* * Regression test for NIO ISO-2022-CN decoder. Passes various valid * ISO-2022-CN byte sequences to the decoder using the java.io * InputStreamReader API */ import java.io.*; import java.nio.*; import java.nio.charset.*; public class TestISO2022CNDecoder { private static String encodingName = "ISO2022CN"; // // Positive tests -- test both output and input processing against // various "known good" data // private static boolean decodeTest ( byte encoded[], char decoded[], String label) { boolean retval = true; int i = 0; try { // // Ensure that reading decodes correctly // ByteArrayInputStream in; InputStreamReader reader; in = new ByteArrayInputStream(encoded); reader = new InputStreamReader(in, encodingName); for (i = 0; i < decoded.length; i++) { int c = reader.read(); if (c != decoded[i]) { System.err.print(label + ": read failed, char " + i); System.err.print(" ... expected 0x" + Integer.toHexString(decoded[i])); if (c == -1) System.err.println(", got EOF"); else System.err.println(", got 0x" + Integer.toHexString(c)); retval = false; if (c == -1) return retval; } } int testChar; if ((testChar = reader.read()) != -1) { System.err.println(label + ": read failed, no EOF"); System.err.println("testChar is " + Integer.toHexString((int)testChar)); return false; } String decodedString = new String(encoded, "ISO2022CN"); for (i = 0; i < decodedString.length(); i++) { if (decodedString.charAt(i) != decoded[i]) System.err.println(label + ": read failed, char " + i); } CharsetDecoder dec = Charset.forName("ISO2022CN") .newDecoder() .onUnmappableCharacter(CodingErrorAction.REPLACE) .onMalformedInput(CodingErrorAction.REPLACE); ByteBuffer bb = ByteBuffer.allocateDirect(encoded.length).put(encoded); bb.flip(); CharBuffer cb = ByteBuffer.allocateDirect(2*encoded.length*(int)dec.maxCharsPerByte()) .asCharBuffer(); if (bb.hasArray() || cb.hasArray()) { System.err.println(label + ": directBuffer failed, "); return false; } if (!dec.decode(bb, cb, true).isUnderflow()) { System.err.println(label + ": decoder's decode() failed!"); return false; } cb.flip(); for (i = 0; i < cb.limit(); i++) { if (cb.get() != decoded[i]) System.err.println(label + ": decoder failed, char " + i); } } catch (Exception e) { System.err.println(label + ": failed " + "(i = " + i + "), " + e.getClass().getName() + ", " + e.getMessage()); e.printStackTrace(); return false; } return retval; } private static boolean equal(CoderResult a, CoderResult b) { return (a == CoderResult.OVERFLOW && b == CoderResult.OVERFLOW) || (a == CoderResult.UNDERFLOW && b == CoderResult.UNDERFLOW) || ((a.isError() == b.isError()) && (a.isMalformed() == b.isMalformed()) && (a.isUnmappable() == b.isUnmappable()) && (a.length() == b.length())); } private static boolean decodeResultTest (byte encoded[], CoderResult expected, String label) { CharsetDecoder dec = Charset.forName("ISO2022CN").newDecoder(); ByteBuffer bb = ByteBuffer.wrap(encoded); CharBuffer cb = CharBuffer.allocate(encoded.length*(int)dec.maxCharsPerByte()); CoderResult result = dec.decode(bb, cb, true); if (!equal(result, expected)) { System.err.println(label + ": decoder's decode() failed!"); return false; } bb = ByteBuffer.allocateDirect(encoded.length).put(encoded); bb.flip(); cb = ByteBuffer.allocateDirect(2*encoded.length*(int)dec.maxCharsPerByte()) .asCharBuffer(); if (bb.hasArray() || cb.hasArray()) { System.err.println(label + ": directBuffer failed, "); return false; } result = dec.reset().decode(bb, cb, true); if (!equal(result, expected)) { System.err.println(label + ": decoder's decode() - direct failed!"); return false; } return true; } // // Negative tests -- only for input processing, make sure that // invalid or corrupt characters are rejected. // private static boolean negative (byte encoded [], String label) { try { ByteArrayInputStream in; InputStreamReader reader; int c; in = new ByteArrayInputStream(encoded); reader = new InputStreamReader(in, encodingName); c = reader.read(); System.err.print (label + ": read failed, "); if (c == -1) System.err.println("reported EOF"); else System.err.println("returned char 0x" + Integer.toHexString(c) + ", expected exception"); return false; } catch (CharConversionException e) { return true; } catch (Throwable t) { System.err.println(label + ": failed, threw " + t.getClass().getName() + ", " + t.getMessage()); } return false; } private static boolean decodeTest6392664 () { try { CharsetDecoder dec = Charset.forName("ISO-2022-CN-GB").newDecoder(); dec.decode(ByteBuffer.wrap(new byte[] {(byte)0x0e, (byte)0x42, (byte)0x43 })); } catch (Exception e) { e.printStackTrace(); return false; } return true; } // // TEST #0: 7-bit unshifted values, // shift-in of a valid decodable GB2312-80 // character and an unmappable GB2312-80 char // This is a positive test. // private static byte test0_bytes[] = { (byte)0x00, (byte)0x01, (byte)0x02, (byte)0x03, (byte)0x0E, (byte)0x21, (byte)0x2f, (byte)0x0E, (byte)0xDD, (byte)0x9f }; private static char test0_chars[] = { 0x0000, 0x0001, 0x0002, 0x0003, 0x2019, 0xFFFD }; private static byte test1_bytes[] = { (byte)0x1b, (byte)0x24, (byte)0x29, (byte)0x41, (byte)0x21, (byte)0x2f }; private static char test1_chars[] = { 0x21, 0x2f }; private static byte test2_bytes[] = { (byte)0x0e, (byte)0x1b, (byte)0x24, (byte)0x29, (byte)0x41, (byte)0x21, (byte)0x2f }; private static char test2_chars[] = { 0x2019 }; private static byte test3_bytes[] = { (byte)0x1b, (byte)0x24, (byte)0x29, (byte)0x41, (byte)0x0e, (byte)0x21, (byte)0x2f }; private static byte test3a_bytes[] = { (byte)0x1b, (byte)0x24, (byte)0x41, (byte)0x0e, (byte)0x21, (byte)0x2f }; private static char test3_chars[] = { 0x2019 }; private static byte test4_bytes[] = { (byte)0x1b, (byte)0x24, (byte)0x29, (byte)0x41, (byte)0x0f, (byte)0x21, (byte)0x2f }; private static char test4_chars[] = { 0x21, 0x2f }; private static byte test5_bytes[] = { (byte)0x1b, (byte)0x24, (byte)0x29, (byte)0x41, (byte)0x0e, (byte)0x21, (byte)0x2e, (byte)0x0f, (byte)0x21, (byte)0x2f }; private static char test5_chars[] = { 0x2018, 0x21, 0x2f }; private static byte test6_bytes[] = { (byte)0x1b, (byte)0x24, (byte)0x29, (byte)0x41, (byte)0x0e, (byte)0x21, (byte)0x2e, (byte)0x21, (byte)0x2f }; private static char test6_chars[] = { 0x2018, 0x2019 }; private static byte test7_bytes[] = { (byte)0x1b, (byte)0x24, (byte)0x29, (byte)'G', (byte)0x0e, (byte)0x21, (byte)0x2e, (byte)0x21, (byte)0x2f }; private static char test7_chars[] = { 0xFE50, 0xFE51 }; private static byte test8_bytes[] = { (byte)0x1b, (byte)0x24, (byte)0x29, (byte)'G', (byte)0x0e, (byte)0x21, (byte)0x2e, (byte)0x0f, (byte)0x21, (byte)0x2f }; private static char test8_chars[] = { 0xFE50, 0x21, 0x2f }; private static byte test9_bytes[] = { (byte)0x1b, (byte)0x24, (byte)0x2a, (byte)'H', (byte)0x1b, (byte)0x4e, (byte)0x21, (byte)0x2f }; private static char test9_chars[] = { 0x4e0e }; /* * Plane 3 support provided for compatibility with * sun.io ISO2022_CN decoder. Officially ISO-2022-CN * just handles planes 1/2 of CNS-11643 (1986) * Test case data below verifies this compatibility * */ private static byte test10_bytes[] = { (byte)0x1b, (byte)0x24, (byte)'+', (byte)'I', (byte)0x1b, (byte)0x4f, (byte)0x21, (byte)0x2f }; private static char test10_chars[] = { 0x51e2 }; private static byte test11_bytes[] = { (byte)0x1b, (byte)0x24, (byte)0x29, (byte)0x41, //SO Designator (byte)0x0e, //SO (byte)0x21, (byte)0x2e, //GB2312 char (byte)0x1b, (byte)0x24, (byte)0x2a, (byte)'H', //SS2 Designator (byte)0x1b, (byte)0x4e, //SS2 (byte)0x21, (byte)0x2f, //CNS-P2 char (byte)0x21, (byte)0x2f //GB2312 char }; private static char test11_chars[] = { 0x2018, 0x4e0e, 0x2019 }; private static byte test12_bytes[] = { (byte)0x1b, (byte)0x24, (byte)0x29, (byte)0x41, //SO Designator (byte)0x0e, //SO (byte)0x21, (byte)0x2e, //GB2312 char (byte)0x1b, (byte)0x24, (byte)'+', (byte)'I', //SS3 Designator (byte)0x1b, (byte)0x4f, //SS3 (byte)0x21, (byte)0x2f, //CNS-P2 char (byte)0x21, (byte)0x2f //GB2312 char }; private static char test12_chars[] = { 0x2018, 0x51e2, 0x2019 }; private static byte test13_bytes[] = { (byte)0x0f0, // byte with MSB }; private static char test13_chars[] = { 0x00f0, }; private static byte test14_bytes[] = { (byte)0x0E, (byte)0x21, (byte)0x2f, (byte)0x0E, (byte)0xDD, (byte)0x9f }; private static CoderResult test14_result = CoderResult.unmappableForLength(2); // Current ISO2022CN treats the "out of range" code points as "unmappable" private static byte test15_bytes[] = { (byte)0x1b, (byte)0x4f, // SS3 (byte)0x20, (byte)0x2f, // "out of range" CNS-P2 char }; private static CoderResult test15_result = CoderResult.unmappableForLength(4); private static boolean encodeTest6730652 () throws Exception { //sample p3 codepoints String strCNSP3 = "\u4e28\u4e36\u4e3f\u4e85\u4e05\u4e04\u5369\u53b6\u4e2a\u4e87\u4e49\u51e2\u56b8\u56b9\u56c4\u8053\u92b0"; return strCNSP3.equals(new String(strCNSP3.getBytes("x-ISO-2022-CN-CNS"), "x-ISO-2022-CN-CNS")); } /** * Main program to test ISO2022CN conformance * */ public static void main (String argv []) throws Exception { boolean pass = true; System.out.println (""); System.out.println ("------ checking ISO2022CN decoder -----"); // This regtest must be the first one. pass &= decodeTest6392664(); try { new InputStreamReader (System.in, "ISO2022CN"); } catch (Exception e) { encodingName = "ISO2022CN"; System.out.println ("... requires nonstandard encoding name " + encodingName); pass &= false; } // // Positive tests -- good data is dealt with correctly // pass &= decodeTest(test0_bytes, test0_chars, "first batch"); pass &= decodeTest(test1_bytes, test1_chars, "escapes1"); pass &= decodeTest(test2_bytes, test2_chars, "escapes2"); pass &= decodeTest(test3_bytes, test3_chars, "escapes3"); pass &= decodeTest(test3a_bytes, test3_chars, "escapes3a"); pass &= decodeTest(test4_bytes, test4_chars, "escapes4"); pass &= decodeTest(test5_bytes, test5_chars, "escapes5"); pass &= decodeTest(test6_bytes, test6_chars, "escapes6"); pass &= decodeTest(test7_bytes, test7_chars, "escapes7"); pass &= decodeTest(test8_bytes, test8_chars, "escapes8"); pass &= decodeTest(test9_bytes, test9_chars, "escapes9"); pass &= decodeTest(test10_bytes, test10_chars, "escapes10"); pass &= decodeTest(test11_bytes, test11_chars, "escapes11"); pass &= decodeTest(test12_bytes, test12_chars, "escapes12"); pass &= decodeTest(test13_bytes, test13_chars, "escapes13"); pass &= decodeResultTest(test14_bytes, test14_result, "escapes14"); pass &= decodeResultTest(test15_bytes, test15_result, "escapes15"); pass &= encodeTest6730652 (); // PASS/FAIL status is what the whole thing is about. // if (! pass) { throw new Exception("FAIL -- incorrect ISO-2022-CN"); } } }