0
0
mirror of https://github.com/nodejs/node.git synced 2024-12-01 16:10:02 +01:00
nodejs/test/fixtures/wpt/encoding/legacy-mb-korean/euc-kr/euckr-encoder.js
Joyee Cheung 8906e5209b
test: pull enconding WPT test fixtures
PR-URL: https://github.com/nodejs/node/pull/25321
Reviewed-By: Rich Trott <rtrott@gmail.com>
Reviewed-By: James M Snell <jasnell@gmail.com>
Reviewed-By: Ruben Bridgewater <ruben@bridgewater.de>
2019-01-10 19:54:55 +08:00

106 lines
2.3 KiB
JavaScript

// Reverse lookup table used by euckrEncoder: maps a Unicode code point to the
// pointer (position) at which it appears in the `euckr` table.
// NOTE(review): `euckr` is not defined in this file; presumably it is the
// EUC-KR index (pointer -> code point) loaded by another script - confirm.
var euckrCPs = []; // index is unicode cp, value is pointer
// `p` is declared with `var` so the loop no longer relies on an implicit
// global, which throws a ReferenceError in strict mode / ES modules.
for (var p = 0; p < euckr.length; p++) {
  // Skip empty slots, and keep the first (lowest) pointer when a code point
  // occurs at more than one position in the table.
  if (euckr[p] != null && euckrCPs[euckr[p]] == null) {
    euckrCPs[euckr[p]] = p;
  }
}
function chars2cps(chars) {
  // JavaScript strings are sequences of UTF-16 code units, so supplementary
  // characters arrive as surrogate pairs. This walks the string and folds
  // each pair back into a single code point.
  // chars: a string of unicode characters
  // returns an array of decimal code point values
  // A high surrogate that is the last unit of the string is never emitted.
  var codePoints = [];
  var pendingHigh = 0; // high surrogate waiting for its low half, 0 if none
  var idx = 0;
  while (idx < chars.length) {
    var unit = chars.charCodeAt(idx);
    idx += 1;
    if (unit > 0xffff || unit < 0) {
      alert("Error in chars2cps: byte out of range " + unit.toString(16) + "!");
    }
    var isLowSurrogate = unit >= 0xdc00 && unit <= 0xdfff;
    var isHighSurrogate = unit >= 0xd800 && unit <= 0xdbff;
    if (pendingHigh !== 0) {
      if (isLowSurrogate) {
        // Complete pair: combine both halves into one supplementary code point.
        codePoints.push(
          0x10000 + (pendingHigh - 0xd800) * 0x400 + (unit - 0xdc00)
        );
        pendingHigh = 0;
        continue;
      }
      // The pending high surrogate was not followed by a low surrogate:
      // report it, discard it, and handle the current unit normally below.
      alert(
        "Error in chars2cps: surrogate out of range " +
          pendingHigh.toString(16) +
          "!"
      );
      pendingHigh = 0;
    }
    if (isHighSurrogate) {
      pendingHigh = unit;
    } else {
      codePoints.push(unit);
    }
  }
  return codePoints;
}
function euckrEncoder(stream) {
  // Encodes a string as EUC-KR and returns the bytes as text.
  // stream: a string of unicode characters
  // returns a string of space-separated uppercase hex byte values (not
  // zero-padded) with no leading/trailing space, or null as soon as a
  // non-ASCII code point has no entry in euckrCPs.
  //
  // `cps` is a local variable: the previous undeclared assignment leaked a
  // global and throws a ReferenceError in strict mode / ES modules.
  var cps = chars2cps(stream);
  var out = "";
  for (var i = 0; i < cps.length; i++) {
    var cp = cps[i];
    if (cp >= 0x00 && cp <= 0x7f) {
      // ASCII is emitted as a single byte equal to the code point.
      out += " " + cp.toString(16).toUpperCase();
      continue;
    }
    var ptr = euckrCPs[cp];
    if (ptr == null) {
      // Unmappable code point: the whole encode is reported as a failure.
      return null;
    }
    // Split the pointer into a two-byte sequence: 190 trail positions per
    // lead byte, lead bytes starting at 0x81 and trail bytes at 0x41.
    var lead = Math.floor(ptr / 190) + 0x81;
    var trail = (ptr % 190) + 0x41;
    out +=
      " " +
      lead.toString(16).toUpperCase() +
      " " +
      trail.toString(16).toUpperCase();
  }
  return out.trim();
}
function convertToHex(str) {
  // Renders every UTF-16 code unit of str as uppercase hex (no zero padding),
  // each one followed by a single space, so a non-empty result always ends
  // with a trailing space.
  var pieces = [];
  var pos = 0;
  while (pos < str.length) {
    pieces.push(str.charCodeAt(pos).toString(16).toUpperCase() + " ");
    pos += 1;
  }
  return pieces.join("");
}
function normalizeStr(str) {
  // Brings a partially percent-encoded string into a fully percent-encoded
  // form: every "%XY" escape is first decoded to the character with that hex
  // value, then every code unit of the decoded text is written back as "%"
  // plus its uppercase hex value (no zero padding). A trailing "%1B%28%42"
  // sequence is removed from the result.
  var decoded = "";
  var pos = 0;
  while (pos < str.length) {
    var ch = str.charAt(pos);
    if (ch === "%") {
      // Consume the escape: the "%" plus the two characters after it.
      var hexPair = str.charAt(pos + 1) + str.charAt(pos + 2);
      decoded += String.fromCodePoint(parseInt(hexPair, 16));
      pos += 3;
    } else {
      decoded += ch;
      pos += 1;
    }
  }
  var encoded = [];
  for (var k = 0; k < decoded.length; k += 1) {
    encoded.push("%" + decoded.charCodeAt(k).toString(16).toUpperCase());
  }
  return encoded.join("").replace(/%1B%28%42$/, "");
}