/*
* test_TextDecoderOptions.js
* bug 764234 tests
*/
/* eslint-env mozilla/testharness */
function runTextDecoderOptions() {
const data = [
0xa0, 0xa1, 0xa2, 0xa3, 0xa4, 0xa5, 0xa6, 0xa7, 0xa8, 0xa9, 0xaa, 0xab,
0xac, 0xad, 0xae, 0xaf, 0xb0, 0xb1, 0xb2, 0xb3, 0xb4, 0xb5, 0xb6, 0xb7,
0xb8, 0xb9, 0xba, 0xbb, 0xbc, 0xbd, 0xbe, 0xbf, 0xc0, 0xc1, 0xc2, 0xc3,
0xc4, 0xc5, 0xc6, 0xc7, 0xc8, 0xc9, 0xca, 0xcb, 0xcc, 0xcd, 0xce, 0xcf,
0xd0, 0xd1, 0xd2, 0xd3, 0xd4, 0xd5, 0xd6, 0xd7, 0xd8, 0xd9, 0xda, 0xdf,
0xe0, 0xe1, 0xe2, 0xe3, 0xe4, 0xe5, 0xe6, 0xe7, 0xe8, 0xe9, 0xea, 0xeb,
0xec, 0xed, 0xee, 0xef, 0xf0, 0xf1, 0xf2, 0xf3, 0xf4, 0xf5, 0xf6, 0xf7,
0xf8, 0xf9, 0xfa, 0xfb,
];
const expectedString =
"\u00a0\u0e01\u0e02\u0e03\u0e04\u0e05\u0e06\u0e07" +
"\u0e08\u0e09\u0e0a\u0e0b\u0e0c\u0e0d\u0e0e\u0e0f" +
"\u0e10\u0e11\u0e12\u0e13\u0e14\u0e15\u0e16\u0e17" +
"\u0e18\u0e19\u0e1a\u0e1b\u0e1c\u0e1d\u0e1e\u0e1f" +
"\u0e20\u0e21\u0e22\u0e23\u0e24\u0e25\u0e26\u0e27" +
"\u0e28\u0e29\u0e2a\u0e2b\u0e2c\u0e2d\u0e2e\u0e2f" +
"\u0e30\u0e31\u0e32\u0e33\u0e34\u0e35\u0e36\u0e37" +
"\u0e38\u0e39\u0e3a\u0e3f\u0e40\u0e41\u0e42\u0e43" +
"\u0e44\u0e45\u0e46\u0e47\u0e48\u0e49\u0e4a\u0e4b" +
"\u0e4c\u0e4d\u0e4e\u0e4f\u0e50\u0e51\u0e52\u0e53" +
"\u0e54\u0e55\u0e56\u0e57\u0e58\u0e59\u0e5a\u0e5b" ;
test(testDecoderGetEncoding, "testDecoderGetEncoding" );
test(testDecodeGreek, "testDecodeGreek" );
test(function () {
testConstructorFatalOption(data, expectedString);
}, "testConstructorFatalOption" );
test(function () {
testConstructorEncodingOption(data, expectedString);
}, "testConstructorEncodingOption" );
test(function () {
testDecodeStreamOption(data, expectedString);
}, "testDecodeStreamOption" );
test(testDecodeStreamCompositions, "testDecodeStreamCompositions" );
test(function () {
testDecodeABVOption(data, expectedString);
}, "testDecodeABVOption" );
test(testDecoderForThaiEncoding, "testDecoderForThaiEncoding" );
test(testInvalid2022JP, "testInvalid2022JP" );
test(testDecoderForBig5, "testDecoderForBig5" );
}
/*
* function testConstructor()
*
* - This function tests the constructor optional arguments.
* - Stream option remains null for this test.
* - The stream option is passed to the decode function.
* - This function is not testing the decode function.
*
*/
function testConstructorFatalOption() {
//invalid string to decode passed, fatal = false
testCharset({
fatal: false ,
encoding: "iso-8859-11" ,
input: [],
expected: "" ,
msg: "constructor fatal option set to false test." ,
});
//invalid string to decode passed, fatal = true
testCharset({
fatal: true ,
encoding: "iso-8859-11" ,
input: [],
expected: "" ,
msg: "constructor fatal option set to true test." ,
});
}
function testConstructorEncodingOption(aData, aExpectedString) {
function errorMessage(encoding) {
return `TextDecoder constructor: The given encoding '${String(
encoding
).trim()}' is not supported.`;
}
// valid encoding passed
var encoding = "iso-8859-11" ;
testCharset({
encoding,
input: aData,
expected: aExpectedString,
msg: "decoder testing constructor valid encoding." ,
});
// passing spaces for encoding
encoding = " " ;
testCharset({
encoding,
input: aData,
error: "RangeError" ,
errorMessage: errorMessage(encoding),
msg: "constructor encoding, spaces encoding test." ,
});
// invalid encoding passed
encoding = "asdfasdf" ;
testCharset({
encoding,
input: aData,
error: "RangeError" ,
errorMessage: errorMessage(encoding),
msg: "constructor encoding, invalid encoding test." ,
});
// null encoding passed
encoding = null ;
testCharset({
encoding,
input: aData,
error: "RangeError" ,
errorMessage: errorMessage(encoding),
msg: 'constructor encoding, "null" encoding test.' ,
});
// empty encoding passed
encoding = "" ;
testCharset({
encoding,
input: aData,
error: "RangeError" ,
errorMessage: errorMessage(encoding),
msg: "constructor encoding, empty encoding test." ,
});
// replacement character test
aExpectedString =
"\ufffd\ufffd\ufffd\ufffd\ufffd\ufffd\ufffd\ufffd" +
"\ufffd\ufffd\ufffd\ufffd\ufffd\ufffd\ufffd\ufffd" +
"\ufffd\ufffd\ufffd\ufffd\ufffd\ufffd\ufffd\ufffd" +
"\ufffd\ufffd\ufffd\ufffd\ufffd\ufffd\ufffd\ufffd" +
"\ufffd\ufffd\ufffd\ufffd\ufffd\ufffd\ufffd\ufffd" +
"\ufffd\ufffd\ufffd\ufffd\ufffd\ufffd\ufffd\ufffd" +
"\ufffd\ufffd\ufffd\ufffd\ufffd\ufffd\ufffd\ufffd" +
"\ufffd\ufffd\ufffd\ufffd\ufffd\ufffd\ufffd\ufffd" +
"\ufffd\ufffd\ufffd\ufffd\ufffd\ufffd\ufffd\ufffd" +
"\ufffd\ufffd\ufffd\ufffd\ufffd\ufffd\ufffd\ufffd" +
"\ufffd\ufffd\ufffd\ufffd\ufffd\ufffd\ufffd\ufffd" ;
testCharset({
encoding: "utf-8" ,
input: aData,
expected: aExpectedString,
msg: "constuctor encoding, utf-8 test." ,
});
}
/*
* function testDecodeStreamOption()
*
* - fatal remains null for the entire test
* - encoding remains as "iso-8859-11"
* - The stream option is modified for this test.
* - ArrayBufferView is modified for this test.
*/
function testDecodeStreamOption(data, expectedString) {
const streamData = [];
const expectedStreamString = [];
const chunkSize = data.length / 3;
for (let i = 0; i < data.length; i += chunkSize) {
streamData.push(data.slice(i, i + chunkSize));
expectedStreamString.push(expectedString.slice(i, i + chunkSize));
}
// streaming test
/* - the streaming is null
* - streaming is not set in the decode function
*/
testCharset({
encoding: "iso-8859-11" ,
array: [
{ input: streamData[0], expected: expectedStreamString[0] },
{ input: streamData[1], expected: expectedStreamString[1] },
{ input: streamData[2], expected: expectedStreamString[2] },
],
msg: "decode() stream test zero." ,
});
testCharset({
encoding: "iso-8859-11" ,
array: [
{ input: streamData[0], expected: expectedStreamString[0], stream: true },
{ input: streamData[1], expected: expectedStreamString[1], stream: true },
{ input: streamData[2], expected: expectedStreamString[2], stream: true },
],
msg: "decode() stream test one." ,
});
testCharset({
encoding: "iso-8859-11" ,
array: [
{ input: streamData[0], expected: expectedStreamString[0], stream: true },
{ input: streamData[1], expected: expectedStreamString[1] },
{ input: streamData[2], expected: expectedStreamString[2] },
],
msg: "decode() stream test two." ,
});
testCharset({
encoding: "utf-8" ,
array: [
{ input: [0xc2], expected: "\uFFFD" },
{ input: [0x80], expected: "\uFFFD" },
],
msg: "decode() stream test utf-8." ,
});
testCharset({
encoding: "utf-8" ,
fatal: true ,
array: [
{ input: [0xc2], error: "TypeError" },
{ input: [0x80], error: "TypeError" },
],
msg: "decode() stream test utf-8 fatal." ,
});
}
function testDecodeStreamCompositions() {
var tests = [
{ encoding: "utf-8" , input: [0xc2, 0x80], expected: ["" , "\x80" ] },
{
encoding: "utf-8" ,
input: [0xef, 0xbb, 0xbf, 0xc2, 0x80],
expected: ["" , "" , "" , "" , "\x80" ],
},
{ encoding: "utf-16" , input: [0x01, 0x00], expected: ["" , "\x01" ] },
{
encoding: "utf-16" ,
input: [0x01, 0x00, 0x03, 0x02],
expected: ["" , "\x01" , "" , "\u0203" ],
},
{ encoding: "utf-16" , input: [0xff, 0xfd], expected: ["" , "\uFDFF" ] },
{ encoding: "utf-16" , input: [0xff, 0xfe], expected: ["" , "" ] },
{ encoding: "utf-16" , input: [0xff, 0xff], expected: ["" , "\uFFFF" ] },
{
encoding: "utf-16" ,
input: [0xff, 0xfe, 0x01, 0x00],
expected: ["" , "" , "" , "\x01" ],
},
{
encoding: "utf-16" ,
input: [0xff, 0xfe, 0xff, 0xfe],
expected: ["" , "" , "" , "\uFEFF" ],
},
{
encoding: "utf-16" ,
input: [0xff, 0xfe, 0xfe, 0xff],
expected: ["" , "" , "" , "\uFFFE" ],
},
{ encoding: "utf-16" , input: [0xfd, 0xfe], expected: ["" , "\uFEFD" ] },
{ encoding: "utf-16" , input: [0xfd, 0xff], expected: ["" , "\uFFFD" ] },
{ encoding: "utf-16" , input: [0xfe, 0xfd], expected: ["" , "\uFDFE" ] },
{ encoding: "utf-16" , input: [0xfe, 0xfe], expected: ["" , "\uFEFE" ] },
{ encoding: "utf-16" , input: [0xfe, 0xff], expected: ["" , "\uFFFE" ] },
{
encoding: "utf-16" ,
input: [0xfe, 0xff, 0x01, 0x00],
expected: ["" , "\uFFFE" , "" , "\x01" ],
},
{
encoding: "utf-16" ,
input: [0xfe, 0xff, 0xff, 0xfe],
expected: ["" , "\uFFFE" , "" , "\uFEFF" ],
},
{
encoding: "utf-16" ,
input: [0xfe, 0xff, 0xfe, 0xff],
expected: ["" , "\uFFFE" , "" , "\uFFFE" ],
},
{ encoding: "utf-16le" , input: [0x01, 0x00], expected: ["" , "\x01" ] },
{
encoding: "utf-16le" ,
input: [0x01, 0x00, 0x03, 0x02],
expected: ["" , "\x01" , "" , "\u0203" ],
},
{
encoding: "utf-16le" ,
input: [0xff, 0xfe, 0x01, 0x00],
expected: ["" , "" , "" , "\x01" ],
},
{
encoding: "utf-16le" ,
input: [0xfe, 0xff, 0x01, 0x00],
expected: ["" , "\uFFFE" , "" , "\x01" ],
},
{ encoding: "utf-16be" , input: [0x01, 0x00], expected: ["" , "\u0100" ] },
{
encoding: "utf-16be" ,
input: [0x01, 0x00, 0x03, 0x02],
expected: ["" , "\u0100" , "" , "\u0302" ],
},
{ encoding: "utf-16be" , input: [0xfd, 0xfe], expected: ["" , "\uFDFE" ] },
{ encoding: "utf-16be" , input: [0xfd, 0xff], expected: ["" , "\uFDFF" ] },
{ encoding: "utf-16be" , input: [0xfe, 0xfd], expected: ["" , "\uFEFD" ] },
{ encoding: "utf-16be" , input: [0xfe, 0xfe], expected: ["" , "\uFEFE" ] },
{ encoding: "utf-16be" , input: [0xfe, 0xff], expected: ["" , "" ] },
{
encoding: "utf-16be" ,
input: [0xfe, 0xff, 0x01, 0x00],
expected: ["" , "" , "" , "\u0100" ],
},
{ encoding: "utf-16be" , input: [0xff, 0xfd], expected: ["" , "\uFFFD" ] },
{ encoding: "utf-16be" , input: [0xff, 0xfe], expected: ["" , "\uFFFE" ] },
{ encoding: "utf-16be" , input: [0xff, 0xff], expected: ["" , "\uFFFF" ] },
{
encoding: "utf-16be" ,
input: [0xff, 0xfe, 0x01, 0x00],
expected: ["" , "\uFFFE" , "" , "\u0100" ],
},
{ encoding: "shift_jis" , input: [0x81, 0x40], expected: ["" , "\u3000" ] },
];
tests.forEach(function (t) {
(function generateCompositions(a, n) {
a.push(n);
var l = a.length - 1;
var array = [];
for (var i = 0, o = 0; i <= l; i++) {
array.push({
input: t.input.slice(o, o + a[i]),
expected: t.expected.slice(o, (o += a[i])).join("" ),
stream: i < l,
});
}
testCharset({
encoding: t.encoding,
array,
msg: "decode() stream test " + t.encoding + " " + a.join("-" ) + "." ,
});
while (a[l] > 1) {
a[l]--;
generateCompositions(a.slice(0), n - a[l]);
}
})([], t.input.length);
});
}
/*
* function testDecodeABVOption()
*
* - ABV for ArrayBufferView
* - fatal remains null for the entire test
* - encoding remains as "iso-8859-11"
* - The stream option is modified for this test.
* - ArrayBufferView is modified for this test.
*/
function testDecodeABVOption(data, expectedString) {
// valid data
testCharset({
encoding: "iso-8859-11" ,
input: data,
expected: expectedString,
msg: "decode test ABV valid data." ,
});
// invalid empty data
testCharset({
encoding: "iso-8859-11" ,
input: [],
expected: "" ,
msg: "decode test ABV empty data." ,
});
// spaces
testCharset({
encoding: "iso-8859-11" ,
input: ["\u0020\u0020" ],
expected: "\0" ,
msg: "text decoding ABV string test." ,
});
testCharset({
encoding: "iso-8859-11" ,
input: ["" ],
expected: "\0" ,
msg: "text decoding ABV empty string test." ,
});
// null for Array Buffer
testCharset({
encoding: "iso-8859-11" ,
input: null ,
error: "TypeError" ,
msg: "text decoding ABV null test." ,
});
}
function testDecodeGreek() {
var data = [
0xa0, 0xa1, 0xa2, 0xa3, 0xa4, 0xa5, 0xa6, 0xa7, 0xa8, 0xa9, 0xaa, 0xab,
0xac, 0xad, 0xaf, 0xb0, 0xb1, 0xb2, 0xb3, 0xb4, 0xb5, 0xb6, 0xb7, 0xb8,
0xb9, 0xba, 0xbb, 0xbc, 0xbd, 0xbe, 0xbf, 0xc0, 0xc1, 0xc2, 0xc3, 0xc4,
0xc5, 0xc6, 0xc7, 0xc8, 0xc9, 0xca, 0xcb, 0xcc, 0xcd, 0xce, 0xcf, 0xd0,
0xd1, 0xd3, 0xd4, 0xd5, 0xd6, 0xd7, 0xd8, 0xd9, 0xda, 0xdb, 0xdc, 0xdd,
0xde, 0xdf, 0xe0, 0xe1, 0xe2, 0xe3, 0xe4, 0xe5, 0xe6, 0xe7, 0xe8, 0xe9,
0xea, 0xeb, 0xec, 0xed, 0xee, 0xef, 0xf0, 0xf1, 0xf2, 0xf3, 0xf4, 0xf5,
0xf6, 0xf7, 0xf8, 0xf9, 0xfa, 0xfb, 0xfc, 0xfd, 0xfe,
];
var expectedString =
"\u00a0\u2018\u2019\u00a3\u20ac\u20af\u00a6\u00a7\u00a8" +
"\u00a9\u037a\u00ab\u00ac\u00ad\u2015\u00b0\u00b1" +
"\u00b2\u00b3\u0384\u0385\u0386\u00b7\u0388\u0389" +
"\u038a\u00bb\u038c\u00bd\u038e\u038f\u0390\u0391" +
"\u0392\u0393\u0394\u0395\u0396\u0397\u0398\u0399" +
"\u039a\u039b\u039c\u039d\u039e\u039f\u03a0\u03a1" +
"\u03a3\u03a4\u03a5\u03a6\u03a7\u03a8\u03a9\u03aa" +
"\u03ab\u03ac\u03ad\u03ae\u03af\u03b0\u03b1\u03b2" +
"\u03b3\u03b4\u03b5\u03b6\u03b7\u03b8\u03b9\u03ba" +
"\u03bb\u03bc\u03bd\u03be\u03bf\u03c0\u03c1\u03c2" +
"\u03c3\u03c4\u03c5\u03c6\u03c7\u03c8\u03c9\u03ca" +
"\u03cb\u03cc\u03cd\u03ce" ;
testCharset({
encoding: "greek" ,
input: data,
expected: expectedString,
msg: "decode greek test." ,
});
}
function testDecoderForThaiEncoding() {
// TEST One
const data = [
0xa0, 0xa1, 0xa2, 0xa3, 0xa4, 0xa5, 0xa6, 0xa7, 0xa8, 0xa9, 0xaa, 0xab,
0xac, 0xad, 0xae, 0xaf, 0xb0, 0xb1, 0xb2, 0xb3, 0xb4, 0xb5, 0xb6, 0xb7,
0xb8, 0xb9, 0xba, 0xbb, 0xbc, 0xbd, 0xbe, 0xbf, 0xc0, 0xc1, 0xc2, 0xc3,
0xc4, 0xc5, 0xc6, 0xc7, 0xc8, 0xc9, 0xca, 0xcb, 0xcc, 0xcd, 0xce, 0xcf,
0xd0, 0xd1, 0xd2, 0xd3, 0xd4, 0xd5, 0xd6, 0xd7, 0xd8, 0xd9, 0xda, 0xdf,
0xe0, 0xe1, 0xe2, 0xe3, 0xe4, 0xe5, 0xe6, 0xe7, 0xe8, 0xe9, 0xea, 0xeb,
0xec, 0xed, 0xee, 0xef, 0xf0, 0xf1, 0xf2, 0xf3, 0xf4, 0xf5, 0xf6, 0xf7,
0xf8, 0xf9, 0xfa, 0xfb,
];
const expectedString =
"\u00a0\u0e01\u0e02\u0e03\u0e04\u0e05\u0e06\u0e07\u0e08\u0e09\u0e0a\u0e0b\u0e0c\u0e0d\u0e0e\u0e0f\u0e10\u0e11\u0e12\u0e13\u0e14\u0e15\u0e16\u0e17\u0e18\u0e19\u0e1a\u0e1b\u0e1c\u0e1d\u0e1e\u0e1f\u0e20\u0e21\u0e22\u0e23\u0e24\u0e25\u0e26\u0e27\u0e28\u0e29\u0e2a\u0e2b\u0e2c\u0e2d\u0e2e\u0e2f\u0e30\u0e31\u0e32\u0e33\u0e34\u0e35\u0e36\u0e37\u0e38\u0e39\u0e3a\u0e3f\u0e40\u0e41\u0e42\u0e43\u0e44\u0e45\u0e46\u0e47\u0e48\u0e49\u0e4a\u0e4b\u0e4c\u0e4d\u0e4e\u0e4f\u0e50\u0e51\u0e52\u0e53\u0e54\u0e55\u0e56\u0e57\u0e58\u0e59\u0e5a\u0e5b" ;
testCharset({
encoding: "iso-8859-11" ,
input: data,
expected: expectedString,
msg: "decoder testing valid ISO-8859-11 encoding." ,
});
}
function testDecoderGetEncoding() {
var labelEncodings = [
{ encoding: "utf-8" , labels: ["unicode-1-1-utf-8" , "utf-8" , "utf8" ] },
{ encoding: "ibm866" , labels: ["866" , "cp866" , "csibm866" , "ibm866" ] },
{
encoding: "iso-8859-2" ,
labels: [
"csisolatin2" ,
"iso-8859-2" ,
"iso-ir-101" ,
"iso8859-2" ,
"iso88592" ,
"iso_8859-2" ,
"iso_8859-2:1987" ,
"l2" ,
"latin2" ,
],
},
{
encoding: "iso-8859-3" ,
labels: [
"csisolatin3" ,
"iso-8859-3" ,
"iso-ir-109" ,
"iso8859-3" ,
"iso88593" ,
"iso_8859-3" ,
"iso_8859-3:1988" ,
"l3" ,
"latin3" ,
],
},
{
encoding: "iso-8859-4" ,
labels: [
"csisolatin4" ,
"iso-8859-4" ,
"iso-ir-110" ,
"iso8859-4" ,
"iso88594" ,
"iso_8859-4" ,
"iso_8859-4:1988" ,
"l4" ,
"latin4" ,
],
},
{
encoding: "iso-8859-5" ,
labels: [
"csisolatincyrillic" ,
"cyrillic" ,
"iso-8859-5" ,
"iso-ir-144" ,
"iso8859-5" ,
"iso88595" ,
"iso_8859-5" ,
"iso_8859-5:1988" ,
],
},
{
encoding: "iso-8859-6" ,
labels: [
"arabic" ,
"asmo-708" ,
"csiso88596e" ,
"csiso88596i" ,
"csisolatinarabic" ,
"ecma-114" ,
"iso-8859-6" ,
"iso-8859-6-e" ,
"iso-8859-6-i" ,
"iso-ir-127" ,
"iso8859-6" ,
"iso88596" ,
"iso_8859-6" ,
"iso_8859-6:1987" ,
],
},
{
encoding: "iso-8859-7" ,
labels: [
"csisolatingreek" ,
"ecma-118" ,
"elot_928" ,
"greek" ,
"greek8" ,
"iso-8859-7" ,
"iso-ir-126" ,
"iso8859-7" ,
"iso88597" ,
"iso_8859-7" ,
"iso_8859-7:1987" ,
"sun_eu_greek" ,
],
},
{
encoding: "iso-8859-8" ,
labels: [
"csiso88598e" ,
"csisolatinhebrew" ,
"hebrew" ,
"iso-8859-8" ,
"iso-8859-8-e" ,
"iso-ir-138" ,
"iso8859-8" ,
"iso88598" ,
"iso_8859-8" ,
"iso_8859-8:1988" ,
"visual" ,
],
},
{
encoding: "iso-8859-8-i" ,
labels: ["csiso88598i" , "iso-8859-8-i" , "logical" ],
},
{
encoding: "iso-8859-10" ,
labels: [
"csisolatin6" ,
"iso-8859-10" ,
"iso-ir-157" ,
"iso8859-10" ,
"iso885910" ,
"l6" ,
"latin6" ,
],
},
{
encoding: "iso-8859-13" ,
labels: ["iso-8859-13" , "iso8859-13" , "iso885913" ],
},
{
encoding: "iso-8859-14" ,
labels: ["iso-8859-14" , "iso8859-14" , "iso885914" ],
},
{
encoding: "iso-8859-15" ,
labels: [
"csisolatin9" ,
"iso-8859-15" ,
"iso8859-15" ,
"iso885915" ,
"iso_8859-15" ,
"l9" ,
],
},
{ encoding: "iso-8859-16" , labels: ["iso-8859-16" ] },
{
encoding: "koi8-r" ,
labels: ["cskoi8r" , "koi" , "koi8" , "koi8-r" , "koi8_r" ],
},
{ encoding: "koi8-u" , labels: ["koi8-u" ] },
{
encoding: "macintosh" ,
labels: ["csmacintosh" , "mac" , "macintosh" , "x-mac-roman" ],
},
{
encoding: "windows-874" ,
labels: [
"dos-874" ,
"iso-8859-11" ,
"iso8859-11" ,
"iso885911" ,
"tis-620" ,
"windows-874" ,
],
},
{
encoding: "windows-1250" ,
labels: ["cp1250" , "windows-1250" , "x-cp1250" ],
},
{
encoding: "windows-1251" ,
labels: ["cp1251" , "windows-1251" , "x-cp1251" ],
},
{
encoding: "windows-1252" ,
labels: [
"ansi_x3.4-1968" ,
"ascii" ,
"cp1252" ,
"cp819" ,
"csisolatin1" ,
"ibm819" ,
"iso-8859-1" ,
"iso-ir-100" ,
"iso8859-1" ,
"iso88591" ,
"iso_8859-1" ,
"iso_8859-1:1987" ,
"l1" ,
"latin1" ,
"us-ascii" ,
"windows-1252" ,
"x-cp1252" ,
],
},
{
encoding: "windows-1253" ,
labels: ["cp1253" , "windows-1253" , "x-cp1253" ],
},
{
encoding: "windows-1254" ,
labels: [
"cp1254" ,
"csisolatin5" ,
"iso-8859-9" ,
"iso-ir-148" ,
"iso8859-9" ,
"iso88599" ,
"iso_8859-9" ,
"iso_8859-9:1989" ,
"l5" ,
"latin5" ,
"windows-1254" ,
"x-cp1254" ,
],
},
{
encoding: "windows-1255" ,
labels: ["cp1255" , "windows-1255" , "x-cp1255" ],
},
{
encoding: "windows-1256" ,
labels: ["cp1256" , "windows-1256" , "x-cp1256" ],
},
{
encoding: "windows-1257" ,
labels: ["cp1257" , "windows-1257" , "x-cp1257" ],
},
{
encoding: "windows-1258" ,
labels: ["cp1258" , "windows-1258" , "x-cp1258" ],
},
{
encoding: "x-mac-cyrillic" ,
labels: ["x-mac-cyrillic" , "x-mac-ukrainian" ],
},
{
encoding: "gbk" ,
labels: [
"chinese" ,
"csgb2312" ,
"csiso58gb231280" ,
"gb2312" ,
"gb_2312" ,
"gb_2312-80" ,
"gbk" ,
"iso-ir-58" ,
"x-gbk" ,
],
},
{ encoding: "gb18030" , labels: ["gb18030" ] },
{
encoding: "big5" ,
labels: ["big5" , "cn-big5" , "csbig5" , "x-x-big5" , "big5-hkscs" ],
},
{
encoding: "euc-jp" ,
labels: ["cseucpkdfmtjapanese" , "euc-jp" , "x-euc-jp" ],
},
{ encoding: "iso-2022-jp" , labels: ["csiso2022jp" , "iso-2022-jp" ] },
{
encoding: "shift_jis" ,
labels: [
"csshiftjis" ,
"ms932" ,
"ms_kanji" ,
"shift-jis" ,
"shift_jis" ,
"sjis" ,
"windows-31j" ,
"x-sjis" ,
],
},
{
encoding: "euc-kr" ,
labels: [
"cseuckr" ,
"csksc56011987" ,
"euc-kr" ,
"iso-ir-149" ,
"korean" ,
"ks_c_5601-1987" ,
"ks_c_5601-1989" ,
"ksc5601" ,
"ksc_5601" ,
"windows-949" ,
],
},
{ encoding: "utf-16le" , labels: ["utf-16" , "utf-16le" ] },
{ encoding: "utf-16be" , labels: ["utf-16be" ] },
{ encoding: "x-user-defined" , labels: ["x-user-defined" ] },
{
error: "RangeError" ,
labels: [
"x-windows-949" ,
"\u0130SO-8859-1" ,
"csiso2022kr" ,
"iso-2022-kr" ,
"iso-2022-cn" ,
"iso-2022-cn-ext" ,
"replacement" ,
"hz-gb-2312" ,
],
},
];
for (var le of labelEncodings) {
for (var label of le.labels) {
try {
var decoder = new TextDecoder(label);
} catch (e) {
assert_true(!!le.error, label + " shoud not throw " + e.name);
assert_equals(
e.name,
le.error,
label + " label encoding unsupported test."
);
continue ;
}
assert_true(!le.error, label + " shoud throw " + le.error);
assert_equals(
decoder.encoding,
le.encoding,
label + " label encoding test."
);
}
}
}
function testCharset(test) {
try {
var fatal = test.fatal ? { fatal: test.fatal } : null ;
var decoder = new TextDecoder(test.encoding, fatal);
} catch (e) {
assert_equals(
e.name,
test.error,
test.msg + " error thrown from the constructor."
);
if (test.errorMessage) {
assert_equals(
e.message,
test.errorMessage,
test.msg + " error thrown from the constructor."
);
}
return ;
}
var array = test.array || [test];
var num_strings = array.length;
for (var i = 0; i < num_strings; i++) {
var decodeView =
array[i].input !== null ? new Uint8Array(array[i].input) : null ;
var stream = array[i].stream ? { stream: array[i].stream } : null ;
var outText;
try {
outText = decoder.decode(decodeView, stream);
} catch (e) {
assert_equals(
e.name,
array[i].error,
test.msg + " error thrown from decode()."
);
return ;
}
var expected = array[i].expected;
if (outText !== expected) {
assert_equals(
escape(outText),
escape(expected),
test.msg + " Code points do not match expected code points."
);
break ;
}
}
assert_true(!test.error, test.msg);
}
function testInvalid2022JP() {
var inputs = [
[0x80],
[0x1b, 0xff],
[0x1b, 0x28, 0xff],
[0x1b, 0x24, 0x80],
[0x1b, 0x24, 0x28, 0x80],
[0x1b, 0x28, 0x4a, 0xff],
[0x1b, 0x28, 0x49, 0xff],
[0x1b, 0x24, 0x40, 0x20],
[0x1b, 0x24, 0x41, 0x20],
[0x1b, 0x24, 0x42, 0x20],
[0x1b, 0x24, 0x28, 0x43, 0x20],
[0x1b, 0x24, 0x28, 0x44, 0x20],
[0x1b, 0x24, 0x40, 0x80, 0x21],
[0x1b, 0x24, 0x41, 0xff, 0x21],
[0x1b, 0x24, 0x42, 0x80, 0x21],
[0x1b, 0x24, 0x28, 0x43, 0xff, 0x21],
[0x1b, 0x24, 0x28, 0x44, 0x80, 0x21],
[0x1b, 0x24, 0x40, 0x21, 0x20],
[0x1b, 0x24, 0x41, 0x21, 0x20],
[0x1b, 0x24, 0x42, 0x21, 0x20],
[0x1b, 0x24, 0x28, 0x43, 0x21, 0x20],
[0x1b, 0x24, 0x28, 0x44, 0x21, 0x20],
[0x1b, 0x2e, 0xff],
[0x1b, 0x4e, 0x20],
[0x1b, 0x4e, 0x7f],
[0x1b, 0x2e, 0x41, 0x1b, 0x4e, 0x80],
[0x1b, 0x2e, 0x41, 0x1b, 0x4e, 0xff],
];
var failureCount = 0;
inputs.forEach(function (input) {
try {
// decode() should never throw unless {fatal: true} is specified
new TextDecoder("iso-2022-jp" ).decode(new Uint8Array(input));
} catch (e) {
if (e.name !== "TypeError" ) {
throw e;
}
failureCount++;
}
});
assert_equals(
failureCount,
0,
failureCount + " of " + inputs.length + " tests failed"
);
}
function testDecoderForBig5() {
const inputs = [
[0x61, 0x62],
[0x87, 0x40],
[0xfe, 0xfe],
[0xfe, 0xfd],
[0x88, 0x62],
[0x88, 0x64],
[0x88, 0x66],
[0x88, 0xa3],
[0x88, 0xa5],
[0x88, 0xa7],
[0x99, 0xd4],
[0x99, 0xd5],
[0x99, 0xd6],
[0x61, 0x87, 0x40, 0x62],
[0x61, 0xfe, 0xfe, 0x62],
[0x61, 0xfe, 0xfd, 0x62],
[0x61, 0x88, 0x62, 0x62],
[0x61, 0x88, 0x64, 0x62],
[0x61, 0x88, 0x66, 0x62],
[0x61, 0x88, 0xa3, 0x62],
[0x61, 0x88, 0xa5, 0x62],
[0x61, 0x88, 0xa7, 0x62],
[0x61, 0x99, 0xd4, 0x62],
[0x61, 0x99, 0xd5, 0x62],
[0x61, 0x99, 0xd6, 0x62],
[0x80, 0x61],
[0xff, 0x61],
[0xfe, 0x39],
[0x87, 0x66],
[0x81, 0x40],
[0x61, 0x81],
];
const expectations = [
"\u0061\u0062" ,
"\u43F0" ,
"\u79D4" ,
"\uD864\uDD0D" ,
"\u00CA\u0304" ,
"\u00CA\u030C" ,
"\u00CA" ,
"\u00EA\u0304" ,
"\u00EA\u030C" ,
"\u00EA" ,
"\u8991" ,
"\uD85E\uDD67" ,
"\u8A29" ,
"\u0061\u43F0\u0062" ,
"\u0061\u79D4\u0062" ,
"\u0061\uD864\uDD0D\u0062" ,
"\u0061\u00CA\u0304\u0062" ,
"\u0061\u00CA\u030C\u0062" ,
"\u0061\u00CA\u0062" ,
"\u0061\u00EA\u0304\u0062" ,
"\u0061\u00EA\u030C\u0062" ,
"\u0061\u00EA\u0062" ,
"\u0061\u8991\u0062" ,
"\u0061\uD85E\uDD67\u0062" ,
"\u0061\u8A29\u0062" ,
"\uFFFD\u0061" ,
"\uFFFD\u0061" ,
"\uFFFD\u0039" ,
"\uFFFD\u0066" ,
"\uFFFD\u0040" ,
"\u0061\uFFFD" ,
];
for (var i = 0; i < inputs.length; i++) {
testCharset({
encoding: "big5" ,
input: inputs[i],
expected: expectations[i],
msg: "decoder test #" + i + " for big5." ,
});
}
}
quality 83%
¤ Dauer der Verarbeitung: 0.20 Sekunden
(vorverarbeitet)
¤
*© Formatika GbR, Deutschland