123 lines
5.2 KiB
JavaScript
123 lines
5.2 KiB
JavaScript
/* Test case for bug 340714
|
||
*
|
||
* Uses nsIConverterInputStream to decode UTF-16 text with all combinations
|
||
* of UTF-16BE and UTF-16LE with and without BOM.
|
||
*
|
||
* Sample text is: "Все счастливые семьи похожи друг на друга, каждая несчастливая семья несчастлива по-своему."
|
||
*
|
||
* The enclosing quotation marks are included in the sample text to test that
|
||
* UTF-16LE is recognized even when there is no BOM and the UTF-16LE decoder is
|
||
* not explicitly called. This only works when the first character of the text
|
||
* is an eight-bit character.
|
||
*/
|
||
|
||
const { NetUtil } = ChromeUtils.importESModule(
|
||
"resource://gre/modules/NetUtil.sys.mjs"
|
||
);
|
||
|
||
const beBOM = "%FE%FF";
|
||
const leBOM = "%FF%FE";
|
||
const sampleUTF16BE =
|
||
"%00%22%04%12%04%41%04%35%00%20%04%41%04%47%04%30%04%41%04%42%04%3B%04%38%04%32%04%4B%04%35%00%20%04%41%04%35%04%3C%04%4C%04%38%00%20%04%3F%04%3E%04%45%04%3E%04%36%04%38%00%20%04%34%04%40%04%43%04%33%00%20%04%3D%04%30%00%20%04%34%04%40%04%43%04%33%04%30%00%2C%00%20%04%3A%04%30%04%36%04%34%04%30%04%4F%00%20%04%3D%04%35%04%41%04%47%04%30%04%41%04%42%04%3B%04%38%04%32%04%30%04%4F%00%20%04%41%04%35%04%3C%04%4C%04%4F%00%20%04%3D%04%35%04%41%04%47%04%30%04%41%04%42%04%3B%04%38%04%32%04%30%00%20%04%3F%04%3E%00%2D%04%41%04%32%04%3E%04%35%04%3C%04%43%00%2E%00%22";
|
||
const sampleUTF16LE =
|
||
"%22%00%12%04%41%04%35%04%20%00%41%04%47%04%30%04%41%04%42%04%3B%04%38%04%32%04%4B%04%35%04%20%00%41%04%35%04%3C%04%4C%04%38%04%20%00%3F%04%3E%04%45%04%3E%04%36%04%38%04%20%00%34%04%40%04%43%04%33%04%20%00%3D%04%30%04%20%00%34%04%40%04%43%04%33%04%30%04%2C%00%20%00%3A%04%30%04%36%04%34%04%30%04%4F%04%20%00%3D%04%35%04%41%04%47%04%30%04%41%04%42%04%3B%04%38%04%32%04%30%04%4F%04%20%00%41%04%35%04%3C%04%4C%04%4F%04%20%00%3D%04%35%04%41%04%47%04%30%04%41%04%42%04%3B%04%38%04%32%04%30%04%20%00%3F%04%3E%04%2D%00%41%04%32%04%3E%04%35%04%3C%04%43%04%2E%00%22%00";
|
||
const expected =
|
||
'"\u0412\u0441\u0435 \u0441\u0447\u0430\u0441\u0442\u043B\u0438\u0432\u044B\u0435 \u0441\u0435\u043C\u044C\u0438 \u043F\u043E\u0445\u043E\u0436\u0438 \u0434\u0440\u0443\u0433 \u043D\u0430 \u0434\u0440\u0443\u0433\u0430, \u043A\u0430\u0436\u0434\u0430\u044F \u043D\u0435\u0441\u0447\u0430\u0441\u0442\u043B\u0438\u0432\u0430\u044F \u0441\u0435\u043C\u044C\u044F \u043D\u0435\u0441\u0447\u0430\u0441\u0442\u043B\u0438\u0432\u0430 \u043F\u043E-\u0441\u0432\u043E\u0435\u043C\u0443."';
|
||
|
||
Services.prefs.setBoolPref("security.allow_eval_with_system_principal", true);
|
||
registerCleanupFunction(() => {
|
||
Services.prefs.clearUserPref("security.allow_eval_with_system_principal");
|
||
});
|
||
|
||
function makeText(withBOM, charset) {
|
||
const isBE = charset === "UTF16BE";
|
||
const sampleText = isBE ? sampleUTF16BE : sampleUTF16LE;
|
||
const bom = isBE ? beBOM : leBOM;
|
||
return withBOM ? bom + sampleText : sampleText;
|
||
}
|
||
|
||
function testCase(withBOM, charset, charsetDec, decoder, bufferLength) {
|
||
var dataURI =
|
||
"data:text/plain;charset=" + charsetDec + "," + makeText(withBOM, charset);
|
||
|
||
var ConverterInputStream = Components.Constructor(
|
||
"@mozilla.org/intl/converter-input-stream;1",
|
||
"nsIConverterInputStream",
|
||
"init"
|
||
);
|
||
|
||
var channel = NetUtil.newChannel({
|
||
uri: dataURI,
|
||
loadUsingSystemPrincipal: true,
|
||
});
|
||
var testInputStream = channel.open();
|
||
var testConverter = new ConverterInputStream(
|
||
testInputStream,
|
||
decoder,
|
||
bufferLength,
|
||
0xfffd
|
||
);
|
||
|
||
if (!(testConverter instanceof Ci.nsIUnicharLineInputStream)) {
|
||
throw new Error("not line input stream");
|
||
}
|
||
|
||
var outStr = "";
|
||
var more;
|
||
do {
|
||
// read the line and check for eof
|
||
var line = {};
|
||
more = testConverter.readLine(line);
|
||
outStr += line.value;
|
||
} while (more);
|
||
|
||
if (outStr != expected) {
|
||
dump(
|
||
"Failed with BOM = " +
|
||
withBOM +
|
||
"; charset = " +
|
||
charset +
|
||
"; charset declaration = " +
|
||
charsetDec +
|
||
"; decoder = " +
|
||
decoder +
|
||
"; bufferLength = " +
|
||
bufferLength +
|
||
"\n"
|
||
);
|
||
if (outStr.length == expected.length) {
|
||
for (let i = 0; i < outStr.length; ++i) {
|
||
if (outStr.charCodeAt(i) != expected.charCodeAt(i)) {
|
||
dump(
|
||
i +
|
||
": " +
|
||
outStr.charCodeAt(i).toString(16) +
|
||
" != " +
|
||
expected.charCodeAt(i).toString(16) +
|
||
"\n"
|
||
);
|
||
}
|
||
}
|
||
}
|
||
}
|
||
|
||
// escape the strings before comparing for better readability
|
||
Assert.equal(escape(outStr), escape(expected));
|
||
}
|
||
|
||
function run_test() {
|
||
/* BOM charset charset decoder buffer
|
||
declaration length */
|
||
testCase(true, "UTF16LE", "UTF-16", "UTF-16BE", 64);
|
||
testCase(true, "UTF16BE", "UTF-16", "UTF-16LE", 64);
|
||
testCase(true, "UTF16LE", "UTF-16", "UTF-16LE", 64);
|
||
testCase(true, "UTF16BE", "UTF-16", "UTF-16BE", 64);
|
||
testCase(false, "UTF16LE", "UTF-16", "UTF-16LE", 64);
|
||
testCase(false, "UTF16BE", "UTF-16", "UTF-16BE", 64);
|
||
testCase(true, "UTF16LE", "UTF-16", "UTF-16BE", 65);
|
||
testCase(true, "UTF16BE", "UTF-16", "UTF-16LE", 65);
|
||
testCase(true, "UTF16LE", "UTF-16", "UTF-16LE", 65);
|
||
testCase(true, "UTF16BE", "UTF-16", "UTF-16BE", 65);
|
||
testCase(false, "UTF16LE", "UTF-16", "UTF-16LE", 65);
|
||
testCase(false, "UTF16BE", "UTF-16", "UTF-16BE", 65);
|
||
}
|