aa384aeaaf
Reviewed-by: martin
154 lines
6.6 KiB
Java
154 lines
6.6 KiB
Java
/*
 * Copyright (c) 2002, 2013, Oracle and/or its affiliates. All rights reserved.
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
 *
 * This code is free software; you can redistribute it and/or modify it
 * under the terms of the GNU General Public License version 2 only, as
 * published by the Free Software Foundation.
 *
 * This code is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
 * version 2 for more details (a copy is included in the LICENSE file that
 * accompanied this code).
 *
 * You should have received a copy of the GNU General Public License version
 * 2 along with this work; if not, write to the Free Software Foundation,
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
 *
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
 * or visit www.oracle.com if you need additional information or have any
 * questions.
 */
|
|
|
|
/* @test
 * @bug 4153987
 * @summary Malformed surrogates should be handled by the converter in
 * substitution mode.
 */
|
|
import java.io.*;
|
|
import java.nio.charset.Charset;
|
|
import java.nio.charset.CharsetDecoder;
|
|
import java.nio.charset.CharsetEncoder;
|
|
import java.nio.CharBuffer;
|
|
import java.nio.ByteBuffer;
|
|
import java.nio.charset.CodingErrorAction;
|
|
import java.nio.charset.MalformedInputException;
|
|
import java.nio.charset.UnmappableCharacterException;
|
|
import java.util.SortedMap;
|
|
|
|
/**
 * Checks how charset encoders treat well-formed and malformed UTF-16
 * surrogate sequences, both through {@link CharsetEncoder#encode(CharBuffer)}
 * and through an {@link OutputStreamWriter} built on the same encoder.
 *
 * <p>Each check method throws a {@link RuntimeException} when the charset
 * under test does not behave as expected.
 */
public class MalformedSurrogates {

    private static final String PREFIX = "abc";
    private static final String SUFFIX = "efgh";

    /** A high surrogate (U+D800) followed by another high surrogate (U+DB00). */
    private static final String MALFORMED_SURROGATE = PREFIX + "\uD800\uDB00" + SUFFIX;
    /** A correctly ordered high/low surrogate pair. */
    private static final String NORMAL_SURROGATE = PREFIX + "\uD800\uDC00" + SUFFIX;
    /** A low surrogate followed by a high surrogate. */
    private static final String REVERSED_SURROGATE = PREFIX + "\uDC00\uD800" + SUFFIX;
    /** A high surrogate with no partner. */
    private static final String SOLITARY_HIGH_SURROGATE = PREFIX + "\uD800" + SUFFIX;
    /** A low surrogate with no partner. */
    private static final String SOLITARY_LOW_SURROGATE = PREFIX + "\uDC00" + SUFFIX;

    /**
     * Runs every check against every available charset that supports
     * encoding, with the exception of {@code x-COMPOUND_TEXT}.
     *
     * @param args unused
     * @throws IOException if a stream operation fails unexpectedly
     */
    public static void main(String[] args) throws IOException {
        SortedMap<String, Charset> map = Charset.availableCharsets();
        // values() iterates in key order, same as looking up each key in turn.
        for (Charset charset : map.values()) {
            if (charset.canEncode() && !charset.name().equals("x-COMPOUND_TEXT")) {
                testNormalSurrogate(charset, NORMAL_SURROGATE);
                testMalformedSurrogate(charset, MALFORMED_SURROGATE);
                testMalformedSurrogate(charset, REVERSED_SURROGATE);
                testMalformedSurrogate(charset, SOLITARY_HIGH_SURROGATE);
                testMalformedSurrogate(charset, SOLITARY_LOW_SURROGATE);
                testSurrogateWithReplacement(charset, NORMAL_SURROGATE);
                testSurrogateWithReplacement(charset, MALFORMED_SURROGATE);
                testSurrogateWithReplacement(charset, REVERSED_SURROGATE);
                testSurrogateWithReplacement(charset, SOLITARY_HIGH_SURROGATE);
                testSurrogateWithReplacement(charset, SOLITARY_LOW_SURROGATE);
            }
        }
    }

    /**
     * Verifies that an encoder with default error actions rejects
     * {@code surrogate}: {@code canEncode} must return {@code false}, and both
     * a direct encode and a write through an {@link OutputStreamWriter} must
     * fail with {@link MalformedInputException} or
     * {@link UnmappableCharacterException}.
     *
     * @param cs        charset whose encoder is exercised
     * @param surrogate text expected to be rejected
     * @throws RuntimeException if the text is accepted at any step
     * @throws IOException      on any other I/O or coding failure
     */
    public static void testMalformedSurrogate(Charset cs, String surrogate) throws IOException {
        CharsetEncoder en = cs.newEncoder();
        if (en.canEncode(surrogate)) {
            throw new RuntimeException("testMalformedSurrogate failed with charset " + cs.name());
        }

        try {
            en.encode(CharBuffer.wrap(surrogate));
            throw new RuntimeException("Should throw MalformedInputException or UnmappableCharacterException");
        } catch (MalformedInputException | UnmappableCharacterException expected) {
            // This is the outcome the test is looking for.
        } finally {
            // The same encoder instance is reused for the stream check below.
            en.reset();
        }

        try (OutputStreamWriter osw = new OutputStreamWriter(new ByteArrayOutputStream(), en)) {
            osw.write(surrogate);
            throw new RuntimeException("Should throw MalformedInputException or UnmappableCharacterException");
        } catch (MalformedInputException | UnmappableCharacterException expected) {
            // This is the outcome the test is looking for.
        }
    }

    /**
     * Encodes text containing a well-formed surrogate pair, directly and via
     * an {@link OutputStreamWriter}. An
     * {@link UnmappableCharacterException} is tolerated; any other coding
     * exception propagates to the caller.
     *
     * @param cs        charset whose encoder is exercised
     * @param surrogate text containing a well-formed surrogate pair
     * @throws IOException on any coding failure other than an unmappable character
     */
    public static void testNormalSurrogate(Charset cs, String surrogate) throws IOException {
        CharsetEncoder en = cs.newEncoder();
        try {
            en.encode(CharBuffer.wrap(surrogate));
        } catch (UnmappableCharacterException ignored) {
            // Tolerated: the charset simply has no mapping for the character.
        } finally {
            // The same encoder instance is reused for the stream check below.
            en.reset();
        }

        try (OutputStreamWriter osw = new OutputStreamWriter(new ByteArrayOutputStream(), en)) {
            osw.write(surrogate);
        } catch (UnmappableCharacterException ignored) {
            // Tolerated: the charset simply has no mapping for the character.
        }
    }

    /**
     * Encodes {@code surrogate} with the encoder set to
     * {@link CodingErrorAction#REPLACE}, decodes the bytes again and checks
     * the result against the text expected after substitution. The round trip
     * is done once with buffers and once with stream writer/reader wrappers.
     *
     * <p>Charsets whose encoder cannot encode the well-formed surrogate sample
     * are skipped.
     *
     * <p>The stream round trip reads the decoded text until end of stream and
     * compares all of it. Reading a fixed number of characters with a single
     * {@code read} call could return a partial result and would hide any
     * additional output following the expected text.
     *
     * @param cs        charset whose encoder and decoder are exercised
     * @param surrogate one of the sample strings defined by this class
     * @throws RuntimeException if a round trip does not yield the expected text
     * @throws IOException      on an unexpected I/O or coding failure
     */
    public static void testSurrogateWithReplacement(Charset cs, String surrogate) throws IOException {
        CharsetEncoder en = cs.newEncoder();
        if (!en.canEncode(NORMAL_SURROGATE)) {
            return;
        }
        CharsetDecoder de = cs.newDecoder();
        String replace = new String(en.replacement(), cs);
        String expected = expectedAfterReplacement(surrogate, replace);

        en.onMalformedInput(CodingErrorAction.REPLACE);
        en.onUnmappableCharacter(CodingErrorAction.REPLACE);

        // Round trip through the buffer based API.
        try {
            ByteBuffer bbuf = en.encode(CharBuffer.wrap(surrogate));
            CharBuffer cbuf = de.decode(bbuf);
            checkRoundTrip(cs, surrogate, cbuf.toString(), expected);
        } finally {
            // Both coders are reused by the stream based round trip below.
            en.reset();
            de.reset();
        }

        // Round trip through the stream based API.
        try (ByteArrayOutputStream bos = new ByteArrayOutputStream();
             OutputStreamWriter osw = new OutputStreamWriter(bos, en)) {
            osw.write(surrogate);
            osw.flush();
            try (InputStreamReader isr =
                     new InputStreamReader(new ByteArrayInputStream(bos.toByteArray()), de)) {
                checkRoundTrip(cs, surrogate, readFully(isr), expected);
            }
        }
    }

    /**
     * Returns the text expected after a replacing encode/decode round trip:
     * each unpaired surrogate of the known samples is swapped for
     * {@code replace}; any other input maps to the well-formed sample.
     */
    private static String expectedAfterReplacement(String surrogate, String replace) {
        switch (surrogate) {
            case MALFORMED_SURROGATE:
            case REVERSED_SURROGATE:
                return PREFIX + replace + replace + SUFFIX;
            case SOLITARY_HIGH_SURROGATE:
            case SOLITARY_LOW_SURROGATE:
                return PREFIX + replace + SUFFIX;
            default:
                return NORMAL_SURROGATE;
        }
    }

    /** Throws a {@link RuntimeException} when {@code actual} differs from {@code expected}. */
    private static void checkRoundTrip(Charset cs, String surrogate, String actual, String expected) {
        if (!actual.equals(expected)) {
            throw new RuntimeException("charset " + cs.name() + " (en)decoded the surrogate " + surrogate + " to " + actual + " which is not same as the expected " + expected);
        }
    }

    /** Reads every remaining character from {@code reader} until end of stream. */
    private static String readFully(Reader reader) throws IOException {
        StringBuilder text = new StringBuilder();
        char[] chunk = new char[64];
        int count;
        while ((count = reader.read(chunk, 0, chunk.length)) != -1) {
            text.append(chunk, 0, count);
        }
        return text.toString();
    }
}
|