211 lines
7.5 KiB
Java
Raw Normal View History

/*
* Copyright (c) 2010, 2023, Oracle and/or its affiliates. All rights reserved.
* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
*
* This code is free software; you can redistribute it and/or modify it
* under the terms of the GNU General Public License version 2 only, as
* published by the Free Software Foundation.
*
* This code is distributed in the hope that it will be useful, but WITHOUT
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
* version 2 for more details (a copy is included in the LICENSE file that
* accompanied this code).
*
* You should have received a copy of the GNU General Public License version
* 2 along with this work; if not, write to the Free Software Foundation,
* Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
*
* Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
* or visit www.oracle.com if you need additional information or have any
* questions.
*/
/* @test
* @summary Unit test for charset containment
* @bug 6798572 8167252
* @modules jdk.charsets
* @run junit Contains
*/
import java.nio.charset.Charset;
import java.util.Arrays;
import java.util.stream.Stream;
import org.junit.jupiter.api.Test;
import org.junit.jupiter.params.ParameterizedTest;
import org.junit.jupiter.params.provider.Arguments;
import org.junit.jupiter.params.provider.MethodSource;
import static org.junit.jupiter.api.Assertions.assertEquals;
import static org.junit.jupiter.api.Assertions.assertTrue;
public class Contains {
/**
* Tests the containment of some charsets against themselves.
* This test takes both true and false for 'cont'.
*/
@ParameterizedTest
@MethodSource("charsets")
public void charsetsTest(Charset containerCs, Charset cs, boolean cont){
shouldContain(containerCs, cs, cont);
}
/**
* Tests UTF charsets with other charsets. In this case, each UTF charset
* should contain every single charset they are tested against. 'cont' is
* always true.
*/
@ParameterizedTest
@MethodSource("utfCharsets")
public void UTFCharsetsTest(Charset containerCs, Charset cs, boolean cont){
shouldContain(containerCs, cs, cont);
}
/**
* Tests the assertion in the contains() method: "Every charset contains itself."
*/
@Test
public void containsSelfTest() {
for (var entry : Charset.availableCharsets().entrySet()) {
Charset charset = entry.getValue();
boolean contains = charset.contains(charset);
assertTrue(contains, String.format("Charset(%s).contains(Charset(%s)) returns %s",
charset.name(), charset.name(), contains));
}
}
/**
* Helper method that checks if a charset should contain another charset.
*/
static void shouldContain(Charset containerCs, Charset cs, boolean cont){
assertEquals((containerCs.contains(cs)), cont, String.format("%s %s %s",
containerCs.name(), (cont ? " contains " : " does not contain "), cs.name()));
}
private static Stream<Arguments> utfCharsets() {
String[] utfNames = {
"utf-16",
"utf-8",
"utf-16le",
"utf-16be",
"x-utf-16le-bom"
};
String[] charsetNames = {
"US-ASCII",
"UTF-8",
"UTF-16",
"UTF-16BE",
"UTF-16LE",
"x-UTF-16LE-BOM",
"GBK",
"GB18030",
"ISO-8859-1",
"ISO-8859-15",
"ISO-8859-2",
"ISO-8859-3",
"ISO-8859-4",
"ISO-8859-5",
"ISO-8859-6",
"ISO-8859-7",
"ISO-8859-8",
"ISO-8859-9",
"ISO-8859-13",
"JIS_X0201",
"x-JIS0208",
"JIS_X0212-1990",
"GB2312",
"EUC-KR",
"x-EUC-TW",
"EUC-JP",
"x-euc-jp-linux",
"KOI8-R",
"TIS-620",
"x-ISCII91",
"windows-1251",
"windows-1252",
"windows-1253",
"windows-1254",
"windows-1255",
"windows-1256",
"windows-1257",
"windows-1258",
"windows-932",
"x-mswin-936",
"x-windows-949",
"x-windows-950",
"windows-31j",
"Big5",
"Big5-HKSCS",
"x-MS950-HKSCS",
"ISO-2022-JP",
"ISO-2022-KR",
"x-ISO-2022-CN-CNS",
"x-ISO-2022-CN-GB",
"Big5-HKSCS",
"x-Johab",
"Shift_JIS"
};
// All charsets in utfNames should contain
// all charsets in charsetNames
return Arrays.stream(utfNames).flatMap(cs1 -> Arrays.stream(charsetNames)
.map(cs2 -> Arguments.of(Charset.forName(cs1), Charset.forName(cs2), true)));
}
private static Stream<Arguments> charsets() {
Charset us_ascii = Charset.forName("US-ASCII");
Charset iso_8859_1 = Charset.forName("ISO-8859-1");
Charset iso_8859_15 = Charset.forName("ISO-8859-15");
Charset utf_8 = Charset.forName("UTF-8");
Charset utf_16be = Charset.forName("UTF-16BE");
Charset cp1252 = Charset.forName("CP1252");
return Stream.of(
Arguments.of(us_ascii, us_ascii, true),
Arguments.of(us_ascii, iso_8859_1, false),
Arguments.of(us_ascii, iso_8859_15, false),
Arguments.of(us_ascii, utf_8, false),
Arguments.of(us_ascii, utf_16be, false),
Arguments.of(us_ascii, cp1252, false),
Arguments.of(iso_8859_1, us_ascii, true),
Arguments.of(iso_8859_1, iso_8859_1, true),
Arguments.of(iso_8859_1, iso_8859_15, false),
Arguments.of(iso_8859_1, utf_8, false),
Arguments.of(iso_8859_1, utf_16be, false),
Arguments.of(iso_8859_1, cp1252, false),
Arguments.of(iso_8859_15, us_ascii, true),
Arguments.of(iso_8859_15, iso_8859_1, false),
Arguments.of(iso_8859_15, iso_8859_15, true),
Arguments.of(iso_8859_15, utf_8, false),
Arguments.of(iso_8859_15, utf_16be, false),
Arguments.of(iso_8859_15, cp1252, false),
Arguments.of(utf_8, us_ascii, true),
Arguments.of(utf_8, iso_8859_1, true),
Arguments.of(utf_8, iso_8859_15, true),
Arguments.of(utf_8, utf_8, true),
Arguments.of(utf_8, utf_16be, true),
Arguments.of(utf_8, cp1252, true),
Arguments.of(utf_16be, us_ascii, true),
Arguments.of(utf_16be, iso_8859_1, true),
Arguments.of(utf_16be, iso_8859_15, true),
Arguments.of(utf_16be, utf_8, true),
Arguments.of(utf_16be, utf_16be, true),
Arguments.of(utf_16be, cp1252, true),
Arguments.of(cp1252, us_ascii, true),
Arguments.of(cp1252, iso_8859_1, false),
Arguments.of(cp1252, iso_8859_15, false),
Arguments.of(cp1252, utf_8, false),
Arguments.of(cp1252, utf_16be, false),
Arguments.of(cp1252, cp1252, true)
);
}
}