fe008ae27a
Reviewed-by: darcy, weijun
450 lines
15 KiB
Java
450 lines
15 KiB
Java
/*
|
|
* Copyright (c) 2008, Oracle and/or its affiliates. All rights reserved.
|
|
* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
|
|
*
|
|
* This code is free software; you can redistribute it and/or modify it
|
|
* under the terms of the GNU General Public License version 2 only, as
|
|
* published by the Free Software Foundation.
|
|
*
|
|
* This code is distributed in the hope that it will be useful, but WITHOUT
|
|
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
|
|
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
|
|
* version 2 for more details (a copy is included in the LICENSE file that
|
|
* accompanied this code).
|
|
*
|
|
* You should have received a copy of the GNU General Public License version
|
|
* 2 along with this work; if not, write to the Free Software Foundation,
|
|
* Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
|
|
*
|
|
* Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
|
|
* or visit www.oracle.com if you need additional information or have any
|
|
* questions.
|
|
*/
|
|
|
|
/* @test
|
|
@bug 4779029 4924625 6392664 6730652
|
|
@summary Test decoding of various permutations of valid ISO-2022-CN byte sequences
|
|
*/
|
|
|
|
/*
|
|
* Regression test for NIO ISO-2022-CN decoder. Passes various valid
|
|
* ISO-2022-CN byte sequences to the decoder using the java.io
|
|
* InputStreamReader API
|
|
*/
|
|
|
|
import java.io.*;
|
|
import java.nio.*;
|
|
import java.nio.charset.*;
|
|
|
|
public class TestISO2022CNDecoder
|
|
{
|
|
private static String encodingName = "ISO2022CN";
|
|
|
|
//
|
|
// Positive tests -- test both output and input processing against
|
|
// various "known good" data
|
|
//
|
|
private static boolean decodeTest (
|
|
byte encoded[],
|
|
char decoded[],
|
|
String label)
|
|
{
|
|
boolean retval = true;
|
|
int i = 0;
|
|
|
|
try {
|
|
//
|
|
// Ensure that reading decodes correctly
|
|
//
|
|
ByteArrayInputStream in;
|
|
InputStreamReader reader;
|
|
|
|
in = new ByteArrayInputStream(encoded);
|
|
reader = new InputStreamReader(in, encodingName);
|
|
|
|
for (i = 0; i < decoded.length; i++) {
|
|
int c = reader.read();
|
|
|
|
if (c != decoded[i]) {
|
|
System.err.print(label + ": read failed, char " + i);
|
|
System.err.print(" ... expected 0x"
|
|
+ Integer.toHexString(decoded[i]));
|
|
if (c == -1)
|
|
System.err.println(", got EOF");
|
|
else
|
|
System.err.println(", got 0x"
|
|
+ Integer.toHexString(c));
|
|
retval = false;
|
|
if (c == -1)
|
|
return retval;
|
|
}
|
|
}
|
|
|
|
int testChar;
|
|
if ((testChar = reader.read()) != -1) {
|
|
System.err.println(label + ": read failed, no EOF");
|
|
System.err.println("testChar is " +
|
|
Integer.toHexString((int)testChar));
|
|
return false;
|
|
}
|
|
String decodedString = new String(encoded, "ISO2022CN");
|
|
|
|
for (i = 0; i < decodedString.length(); i++) {
|
|
if (decodedString.charAt(i) != decoded[i])
|
|
System.err.println(label + ": read failed, char " + i);
|
|
}
|
|
|
|
CharsetDecoder dec = Charset.forName("ISO2022CN")
|
|
.newDecoder()
|
|
.onUnmappableCharacter(CodingErrorAction.REPLACE)
|
|
.onMalformedInput(CodingErrorAction.REPLACE);
|
|
ByteBuffer bb = ByteBuffer.allocateDirect(encoded.length).put(encoded);
|
|
bb.flip();
|
|
CharBuffer cb = ByteBuffer.allocateDirect(2*encoded.length*(int)dec.maxCharsPerByte())
|
|
.asCharBuffer();
|
|
if (bb.hasArray() || cb.hasArray()) {
|
|
System.err.println(label + ": directBuffer failed, ");
|
|
return false;
|
|
}
|
|
if (!dec.decode(bb, cb, true).isUnderflow()) {
|
|
System.err.println(label + ": decoder's decode() failed!");
|
|
return false;
|
|
}
|
|
cb.flip();
|
|
for (i = 0; i < cb.limit(); i++) {
|
|
if (cb.get() != decoded[i])
|
|
System.err.println(label + ": decoder failed, char " + i);
|
|
}
|
|
|
|
} catch (Exception e) {
|
|
System.err.println(label + ": failed "
|
|
+ "(i = " + i + "), "
|
|
+ e.getClass().getName()
|
|
+ ", " + e.getMessage());
|
|
e.printStackTrace();
|
|
return false;
|
|
}
|
|
return retval;
|
|
}
|
|
|
|
private static boolean equal(CoderResult a, CoderResult b) {
|
|
return (a == CoderResult.OVERFLOW && b == CoderResult.OVERFLOW) ||
|
|
(a == CoderResult.UNDERFLOW && b == CoderResult.UNDERFLOW) ||
|
|
((a.isError() == b.isError()) &&
|
|
(a.isMalformed() == b.isMalformed()) &&
|
|
(a.isUnmappable() == b.isUnmappable()) &&
|
|
(a.length() == b.length()));
|
|
}
|
|
|
|
private static boolean decodeResultTest (byte encoded[],
|
|
CoderResult expected,
|
|
String label) {
|
|
CharsetDecoder dec = Charset.forName("ISO2022CN").newDecoder();
|
|
ByteBuffer bb = ByteBuffer.wrap(encoded);
|
|
CharBuffer cb = CharBuffer.allocate(encoded.length*(int)dec.maxCharsPerByte());
|
|
CoderResult result = dec.decode(bb, cb, true);
|
|
if (!equal(result, expected)) {
|
|
System.err.println(label + ": decoder's decode() failed!");
|
|
return false;
|
|
}
|
|
|
|
bb = ByteBuffer.allocateDirect(encoded.length).put(encoded);
|
|
bb.flip();
|
|
cb = ByteBuffer.allocateDirect(2*encoded.length*(int)dec.maxCharsPerByte())
|
|
.asCharBuffer();
|
|
if (bb.hasArray() || cb.hasArray()) {
|
|
System.err.println(label + ": directBuffer failed, ");
|
|
return false;
|
|
}
|
|
result = dec.reset().decode(bb, cb, true);
|
|
if (!equal(result, expected)) {
|
|
System.err.println(label + ": decoder's decode() - direct failed!");
|
|
return false;
|
|
}
|
|
return true;
|
|
}
|
|
|
|
//
|
|
// Negative tests -- only for input processing, make sure that
|
|
// invalid or corrupt characters are rejected.
|
|
//
|
|
private static boolean negative (byte encoded [], String label)
|
|
{
|
|
try {
|
|
ByteArrayInputStream in;
|
|
InputStreamReader reader;
|
|
int c;
|
|
|
|
in = new ByteArrayInputStream(encoded);
|
|
reader = new InputStreamReader(in, encodingName);
|
|
|
|
c = reader.read();
|
|
System.err.print (label + ": read failed, ");
|
|
|
|
if (c == -1)
|
|
System.err.println("reported EOF");
|
|
else
|
|
System.err.println("returned char 0x"
|
|
+ Integer.toHexString(c)
|
|
+ ", expected exception");
|
|
return false;
|
|
|
|
} catch (CharConversionException e) {
|
|
return true;
|
|
|
|
} catch (Throwable t) {
|
|
System.err.println(label + ": failed, threw "
|
|
+ t.getClass().getName()
|
|
+ ", " + t.getMessage());
|
|
}
|
|
return false;
|
|
}
|
|
|
|
private static boolean decodeTest6392664 () {
|
|
try {
|
|
CharsetDecoder dec = Charset.forName("ISO-2022-CN-GB").newDecoder();
|
|
dec.decode(ByteBuffer.wrap(new byte[] {(byte)0x0e, (byte)0x42, (byte)0x43 }));
|
|
} catch (Exception e) {
|
|
e.printStackTrace();
|
|
return false;
|
|
}
|
|
return true;
|
|
}
|
|
|
|
//
|
|
// TEST #0: 7-bit unshifted values,
|
|
// shift-in of a valid decodable GB2312-80
|
|
// character and an unmappable GB2312-80 char
|
|
// This is a positive test.
|
|
//
|
|
private static byte test0_bytes[] = {
|
|
(byte)0x00,
|
|
(byte)0x01, (byte)0x02, (byte)0x03,
|
|
(byte)0x0E, (byte)0x21, (byte)0x2f,
|
|
(byte)0x0E, (byte)0xDD, (byte)0x9f
|
|
};
|
|
|
|
private static char test0_chars[] = {
|
|
0x0000,
|
|
0x0001, 0x0002, 0x0003,
|
|
0x2019,
|
|
0xFFFD
|
|
};
|
|
|
|
private static byte test1_bytes[] = {
|
|
(byte)0x1b, (byte)0x24, (byte)0x29, (byte)0x41, (byte)0x21,
|
|
(byte)0x2f };
|
|
|
|
private static char test1_chars[] = {
|
|
0x21, 0x2f
|
|
};
|
|
|
|
private static byte test2_bytes[] = {
|
|
(byte)0x0e,
|
|
(byte)0x1b, (byte)0x24, (byte)0x29, (byte)0x41,
|
|
(byte)0x21, (byte)0x2f };
|
|
|
|
private static char test2_chars[] = {
|
|
0x2019
|
|
};
|
|
|
|
private static byte test3_bytes[] = {
|
|
(byte)0x1b, (byte)0x24, (byte)0x29, (byte)0x41,
|
|
(byte)0x0e,
|
|
(byte)0x21, (byte)0x2f };
|
|
|
|
private static byte test3a_bytes[] = {
|
|
(byte)0x1b, (byte)0x24, (byte)0x41,
|
|
(byte)0x0e,
|
|
(byte)0x21, (byte)0x2f };
|
|
|
|
private static char test3_chars[] = {
|
|
0x2019
|
|
};
|
|
|
|
private static byte test4_bytes[] = {
|
|
(byte)0x1b, (byte)0x24, (byte)0x29, (byte)0x41,
|
|
(byte)0x0f,
|
|
(byte)0x21, (byte)0x2f };
|
|
|
|
private static char test4_chars[] = {
|
|
0x21, 0x2f
|
|
};
|
|
|
|
private static byte test5_bytes[] = {
|
|
(byte)0x1b, (byte)0x24, (byte)0x29, (byte)0x41,
|
|
(byte)0x0e, (byte)0x21, (byte)0x2e,
|
|
(byte)0x0f, (byte)0x21, (byte)0x2f };
|
|
|
|
private static char test5_chars[] = {
|
|
0x2018, 0x21, 0x2f
|
|
};
|
|
|
|
private static byte test6_bytes[] = {
|
|
(byte)0x1b, (byte)0x24, (byte)0x29, (byte)0x41,
|
|
(byte)0x0e, (byte)0x21, (byte)0x2e,
|
|
(byte)0x21, (byte)0x2f };
|
|
|
|
private static char test6_chars[] = {
|
|
0x2018, 0x2019
|
|
};
|
|
|
|
private static byte test7_bytes[] = {
|
|
(byte)0x1b, (byte)0x24, (byte)0x29, (byte)'G',
|
|
(byte)0x0e, (byte)0x21, (byte)0x2e,
|
|
(byte)0x21, (byte)0x2f };
|
|
|
|
private static char test7_chars[] = {
|
|
0xFE50, 0xFE51
|
|
};
|
|
|
|
private static byte test8_bytes[] = {
|
|
(byte)0x1b, (byte)0x24, (byte)0x29, (byte)'G',
|
|
(byte)0x0e, (byte)0x21, (byte)0x2e,
|
|
(byte)0x0f, (byte)0x21, (byte)0x2f };
|
|
|
|
private static char test8_chars[] = {
|
|
0xFE50, 0x21, 0x2f
|
|
};
|
|
|
|
private static byte test9_bytes[] = {
|
|
(byte)0x1b, (byte)0x24, (byte)0x2a, (byte)'H',
|
|
(byte)0x1b, (byte)0x4e,
|
|
(byte)0x21, (byte)0x2f };
|
|
|
|
private static char test9_chars[] = {
|
|
0x4e0e
|
|
};
|
|
|
|
/*
|
|
* Plane 3 support provided for compatibility with
|
|
* sun.io ISO2022_CN decoder. Officially ISO-2022-CN
|
|
* just handles planes 1/2 of CNS-11643 (1986)
|
|
* Test case data below verifies this compatibility
|
|
*
|
|
*/
|
|
|
|
private static byte test10_bytes[] = {
|
|
(byte)0x1b, (byte)0x24, (byte)'+', (byte)'I',
|
|
(byte)0x1b, (byte)0x4f,
|
|
(byte)0x21, (byte)0x2f };
|
|
|
|
private static char test10_chars[] = {
|
|
0x51e2
|
|
};
|
|
|
|
private static byte test11_bytes[] = {
|
|
(byte)0x1b, (byte)0x24, (byte)0x29, (byte)0x41, //SO Designator
|
|
(byte)0x0e, //SO
|
|
(byte)0x21, (byte)0x2e, //GB2312 char
|
|
(byte)0x1b, (byte)0x24, (byte)0x2a, (byte)'H', //SS2 Designator
|
|
(byte)0x1b, (byte)0x4e, //SS2
|
|
(byte)0x21, (byte)0x2f, //CNS-P2 char
|
|
(byte)0x21, (byte)0x2f //GB2312 char
|
|
};
|
|
|
|
private static char test11_chars[] = {
|
|
0x2018,
|
|
0x4e0e,
|
|
0x2019
|
|
};
|
|
|
|
private static byte test12_bytes[] = {
|
|
(byte)0x1b, (byte)0x24, (byte)0x29, (byte)0x41, //SO Designator
|
|
(byte)0x0e, //SO
|
|
(byte)0x21, (byte)0x2e, //GB2312 char
|
|
(byte)0x1b, (byte)0x24, (byte)'+', (byte)'I', //SS3 Designator
|
|
(byte)0x1b, (byte)0x4f, //SS3
|
|
(byte)0x21, (byte)0x2f, //CNS-P2 char
|
|
(byte)0x21, (byte)0x2f //GB2312 char
|
|
};
|
|
|
|
private static char test12_chars[] = {
|
|
0x2018,
|
|
0x51e2,
|
|
0x2019
|
|
};
|
|
|
|
|
|
private static byte test13_bytes[] = {
|
|
(byte)0x0f0, // byte with MSB
|
|
};
|
|
|
|
private static char test13_chars[] = {
|
|
0x00f0,
|
|
};
|
|
|
|
private static byte test14_bytes[] = {
|
|
(byte)0x0E, (byte)0x21, (byte)0x2f,
|
|
(byte)0x0E, (byte)0xDD, (byte)0x9f
|
|
};
|
|
private static CoderResult test14_result = CoderResult.unmappableForLength(2);
|
|
|
|
// Current ISO2022CN treats the "out of range" code points as "unmappable"
|
|
private static byte test15_bytes[] = {
|
|
(byte)0x1b, (byte)0x4f, // SS3
|
|
(byte)0x20, (byte)0x2f, // "out of range" CNS-P2 char
|
|
};
|
|
private static CoderResult test15_result = CoderResult.unmappableForLength(4);
|
|
|
|
private static boolean encodeTest6730652 () throws Exception {
|
|
//sample p3 codepoints
|
|
String strCNSP3 = "\u4e28\u4e36\u4e3f\u4e85\u4e05\u4e04\u5369\u53b6\u4e2a\u4e87\u4e49\u51e2\u56b8\u56b9\u56c4\u8053\u92b0";
|
|
return strCNSP3.equals(new String(strCNSP3.getBytes("x-ISO-2022-CN-CNS"), "x-ISO-2022-CN-CNS"));
|
|
}
|
|
|
|
/**
|
|
* Main program to test ISO2022CN conformance
|
|
*
|
|
*/
|
|
public static void main (String argv []) throws Exception
|
|
{
|
|
boolean pass = true;
|
|
|
|
System.out.println ("");
|
|
System.out.println ("------ checking ISO2022CN decoder -----");
|
|
|
|
// This regtest must be the first one.
|
|
pass &= decodeTest6392664();
|
|
|
|
try {
|
|
new InputStreamReader (System.in, "ISO2022CN");
|
|
} catch (Exception e) {
|
|
encodingName = "ISO2022CN";
|
|
System.out.println ("... requires nonstandard encoding name "
|
|
+ encodingName);
|
|
pass &= false;
|
|
}
|
|
|
|
//
|
|
// Positive tests -- good data is dealt with correctly
|
|
//
|
|
pass &= decodeTest(test0_bytes, test0_chars, "first batch");
|
|
pass &= decodeTest(test1_bytes, test1_chars, "escapes1");
|
|
pass &= decodeTest(test2_bytes, test2_chars, "escapes2");
|
|
pass &= decodeTest(test3_bytes, test3_chars, "escapes3");
|
|
pass &= decodeTest(test3a_bytes, test3_chars, "escapes3a");
|
|
pass &= decodeTest(test4_bytes, test4_chars, "escapes4");
|
|
pass &= decodeTest(test5_bytes, test5_chars, "escapes5");
|
|
pass &= decodeTest(test6_bytes, test6_chars, "escapes6");
|
|
pass &= decodeTest(test7_bytes, test7_chars, "escapes7");
|
|
pass &= decodeTest(test8_bytes, test8_chars, "escapes8");
|
|
pass &= decodeTest(test9_bytes, test9_chars, "escapes9");
|
|
pass &= decodeTest(test10_bytes, test10_chars, "escapes10");
|
|
pass &= decodeTest(test11_bytes, test11_chars, "escapes11");
|
|
pass &= decodeTest(test12_bytes, test12_chars, "escapes12");
|
|
pass &= decodeTest(test13_bytes, test13_chars, "escapes13");
|
|
pass &= decodeResultTest(test14_bytes, test14_result, "escapes14");
|
|
pass &= decodeResultTest(test15_bytes, test15_result, "escapes15");
|
|
|
|
pass &= encodeTest6730652 ();
|
|
|
|
// PASS/FAIL status is what the whole thing is about.
|
|
//
|
|
if (! pass) {
|
|
throw new Exception("FAIL -- incorrect ISO-2022-CN");
|
|
}
|
|
|
|
}
|
|
}
|