зеркало из https://github.com/mozilla/gecko-dev.git
109 строки
2.9 KiB
JavaScript
109 строки
2.9 KiB
JavaScript
const encoders = {
|
|
xml: doc => {
|
|
let enc = Cu.createDocumentEncoder("text/xml");
|
|
enc.init(doc, "text/xml", Ci.nsIDocumentEncoder.OutputLFLineBreak);
|
|
return enc;
|
|
},
|
|
html: doc => {
|
|
let enc = Cu.createDocumentEncoder("text/html");
|
|
enc.init(doc, "text/html", Ci.nsIDocumentEncoder.OutputLFLineBreak);
|
|
return enc;
|
|
},
|
|
htmlBasic: doc => {
|
|
let enc = Cu.createDocumentEncoder("text/html");
|
|
enc.init(
|
|
doc,
|
|
"text/html",
|
|
Ci.nsIDocumentEncoder.OutputEncodeBasicEntities |
|
|
Ci.nsIDocumentEncoder.OutputLFLineBreak
|
|
);
|
|
return enc;
|
|
},
|
|
xhtml: doc => {
|
|
let enc = Cu.createDocumentEncoder("application/xhtml+xml");
|
|
enc.init(
|
|
doc,
|
|
"application/xhtml+xml",
|
|
Ci.nsIDocumentEncoder.OutputLFLineBreak
|
|
);
|
|
return enc;
|
|
},
|
|
};
|
|
|
|
// Which characters should we encode as entities? It depends on the serializer.
|
|
const encodeAll = { html: true, htmlBasic: true, xhtml: true, xml: true };
|
|
const encodeHTMLBasic = {
|
|
html: false,
|
|
htmlBasic: true,
|
|
xhtml: false,
|
|
xml: false,
|
|
};
|
|
const encodeXML = { html: false, htmlBasic: false, xhtml: true, xml: true };
|
|
const encodeNone = { html: false, htmlBasic: false, xhtml: false, xml: false };
|
|
const encodingInfoMap = new Map([
|
|
// Basic sanity chars '<', '>', '"', '&' get encoded in all cases.
|
|
["<", encodeAll],
|
|
[">", encodeAll],
|
|
['"', encodeAll],
|
|
["&", encodeAll],
|
|
// nbsp is only encoded with the HTML encoder when encoding basic entities.
|
|
["\xA0", encodeHTMLBasic],
|
|
// Whitespace bits are only encoded in XML.
|
|
["\n", encodeXML],
|
|
["\r", encodeXML],
|
|
["\t", encodeXML],
|
|
]);
|
|
|
|
const encodingMap = new Map([
|
|
["<", "<"],
|
|
[">", ">"],
|
|
['"', """],
|
|
["&", "&"],
|
|
["\xA0", " "],
|
|
["\n", "
"],
|
|
["\r", "
"],
|
|
["\t", "	"],
|
|
]);
|
|
|
|
function encodingInfoForChar(c) {
|
|
var info = encodingInfoMap.get(c);
|
|
if (info) {
|
|
return info;
|
|
}
|
|
return encodeNone;
|
|
}
|
|
|
|
function encodingForChar(c, type) {
|
|
var info = encodingInfoForChar(c);
|
|
if (!info[type]) {
|
|
return c;
|
|
}
|
|
return encodingMap.get(c);
|
|
}
|
|
|
|
const doc = new DOMParser().parseFromString("<root></root>", "text/xml");
|
|
const root = doc.documentElement;
|
|
for (let i = 0; i < 255; ++i) {
|
|
let el = doc.createElement("span");
|
|
el.setAttribute("x", String.fromCharCode(i));
|
|
el.textContent = " ";
|
|
root.appendChild(el);
|
|
}
|
|
for (let type of ["xml", "xhtml", "htmlBasic", "html"]) {
|
|
let str = encoders[type](doc).encodeToString();
|
|
const prefix = '<root><span x="';
|
|
const suffix = '"> </span></root>';
|
|
Assert.ok(str.startsWith(prefix), `${type} serialization starts correctly`);
|
|
Assert.ok(str.endsWith(suffix), `${type} serialization ends correctly`);
|
|
str = str.substring(prefix.length, str.length - suffix.length);
|
|
let encodings = str.split('"> </span><span x="');
|
|
for (let i = 0; i < 255; ++i) {
|
|
let c = String.fromCharCode(i);
|
|
Assert.equal(
|
|
encodingForChar(c, type),
|
|
encodings[i],
|
|
`${type} encoding of char ${i} is correct`
|
|
);
|
|
}
|
|
}
|