123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379 |
- "use strict";
- const DOMException = require("domexception");
- const xnv = require("xml-name-validator");
- const attributeUtils = require("./attributes");
- const { NAMESPACES, VOID_ELEMENTS, NODE_TYPES } = require("./constants");
- const XML_CHAR = /^(\x09|\x0A|\x0D|[\x20-\uD7FF]|[\uE000-\uFFFD]|(?:[\uD800-\uDBFF][\uDC00-\uDFFF]))*$/;
- const PUBID_CHAR = /^(\x20|\x0D|\x0A|[a-zA-Z0-9]|[-'()+,./:=?;!*#@$_%])*$/;
- function asciiCaseInsensitiveMatch(a, b) {
- if (a.length !== b.length) {
- return false;
- }
- for (let i = 0; i < a.length; ++i) {
- if ((a.charCodeAt(i) | 32) !== (b.charCodeAt(i) | 32)) {
- return false;
- }
- }
- return true;
- }
- function recordNamespaceInformation(element, map, prefixMap) {
- let defaultNamespaceAttrValue = null;
- for (let i = 0; i < element.attributes.length; ++i) {
- const attr = element.attributes[i];
- if (attr.namespaceURI === NAMESPACES.XMLNS) {
- if (attr.prefix === null) {
- defaultNamespaceAttrValue = attr.value;
- continue;
- }
- let namespaceDefinition = attr.value;
- if (namespaceDefinition === NAMESPACES.XML) {
- continue;
- }
- // This is exactly the other way than the spec says, but that's intended.
- // All the maps coalesce null to the empty string (explained in the
- // spec), so instead of doing that every time, just do it once here.
- if (namespaceDefinition === null) {
- namespaceDefinition = "";
- }
- if (
- namespaceDefinition in map &&
- map[namespaceDefinition].includes(attr.localName)
- ) {
- continue;
- }
- if (!(namespaceDefinition in map)) {
- map[namespaceDefinition] = [];
- }
- map[namespaceDefinition].push(attr.localName);
- prefixMap[attr.localName] = namespaceDefinition;
- }
- }
- return defaultNamespaceAttrValue;
- }
- function serializeDocumentType(node, namespace, prefixMap, requireWellFormed) {
- if (requireWellFormed && !PUBID_CHAR.test(node.publicId)) {
- throw new Error("Node publicId is not well formed");
- }
- if (
- requireWellFormed &&
- (!XML_CHAR.test(node.systemId) ||
- (node.systemId.includes('"') && node.systemId.includes("'")))
- ) {
- throw new Error("Node systemId is not well formed");
- }
- let markup = `<!DOCTYPE ${node.name}`;
- if (node.publicId !== "") {
- markup += ` PUBLIC "${node.publicId}"`;
- } else if (node.systemId !== "") {
- markup += " SYSTEM";
- }
- if (node.systemId !== "") {
- markup += ` "${node.systemId}"`;
- }
- return markup + ">";
- }
- function serializeProcessingInstruction(
- node,
- namespace,
- prefixMap,
- requireWellFormed
- ) {
- if (
- requireWellFormed &&
- (node.target.includes(":") || asciiCaseInsensitiveMatch(node.target, "xml"))
- ) {
- throw new Error("Node target is not well formed");
- }
- if (
- requireWellFormed &&
- (!XML_CHAR.test(node.data) || node.data.includes("?>"))
- ) {
- throw new Error("Node data is not well formed");
- }
- return `<?${node.target} ${node.data}?>`;
- }
- function serializeDocument(
- node,
- namespace,
- prefixMap,
- requireWellFormed,
- refs
- ) {
- if (requireWellFormed && node.documentElement === null) {
- throw new Error("Document does not have a document element");
- }
- let serializedDocument = "";
- for (const child of node.childNodes) {
- serializedDocument += xmlSerialization(
- child,
- namespace,
- prefixMap,
- requireWellFormed,
- refs
- );
- }
- return serializedDocument;
- }
- function serializeDocumentFragment(
- node,
- namespace,
- prefixMap,
- requireWellFormed,
- refs
- ) {
- let markup = "";
- for (const child of node.childNodes) {
- markup += xmlSerialization(
- child,
- namespace,
- prefixMap,
- requireWellFormed,
- refs
- );
- }
- return markup;
- }
- function serializeText(node, namespace, prefixMap, requireWellFormed) {
- if (requireWellFormed && !XML_CHAR.test(node.data)) {
- throw new Error("Node data is not well formed");
- }
- return node.data
- .replace(/&/g, "&")
- .replace(/</g, "<")
- .replace(/>/g, ">");
- }
- function serializeComment(node, namespace, prefixMap, requireWellFormed) {
- if (requireWellFormed && !XML_CHAR.test(node.data)) {
- throw new Error("Node data is not well formed");
- }
- if (
- requireWellFormed &&
- (node.data.includes("--") || node.data.endsWith("-"))
- ) {
- throw new Error("Found hyphens in illegal places");
- }
- return `<!--${node.data}-->`;
- }
- function serializeElement(node, namespace, prefixMap, requireWellFormed, refs) {
- if (
- requireWellFormed &&
- (node.localName.includes(":") || !xnv.name(node.localName))
- ) {
- throw new Error("localName is not a valid XML name");
- }
- let markup = "<";
- let qualifiedName = "";
- let skipEndTag = false;
- let ignoreNamespaceDefinitionAttr = false;
- const map = Object.assign({}, prefixMap);
- const localPrefixesMap = Object.create(null);
- const localDefaultNamespace = recordNamespaceInformation(
- node,
- map,
- localPrefixesMap
- );
- let inheritedNs = namespace;
- const ns = node.namespaceURI;
- if (inheritedNs === ns) {
- if (localDefaultNamespace !== null) {
- ignoreNamespaceDefinitionAttr = true;
- }
- if (ns === NAMESPACES.XML) {
- qualifiedName = "xml:" + node.localName;
- } else {
- qualifiedName = node.localName;
- }
- markup += qualifiedName;
- } else {
- let { prefix } = node;
- let candidatePrefix = attributeUtils.preferredPrefixString(map, ns, prefix);
- if (prefix === "xmlns") {
- if (requireWellFormed) {
- throw new Error("Elements can't have xmlns prefix");
- }
- candidatePrefix = "xmlns";
- }
- if (candidatePrefix !== null) {
- qualifiedName = candidatePrefix + ":" + node.localName;
- if (
- localDefaultNamespace !== null &&
- localDefaultNamespace !== NAMESPACES.XML
- ) {
- inheritedNs =
- localDefaultNamespace === "" ? null : localDefaultNamespace;
- }
- markup += qualifiedName;
- } else if (prefix !== null) {
- if (prefix in localPrefixesMap) {
- prefix = attributeUtils.generatePrefix(map, ns, refs.prefixIndex++);
- }
- if (map[ns]) {
- map[ns].push(prefix);
- } else {
- map[ns] = [prefix];
- }
- qualifiedName = prefix + ":" + node.localName;
- markup += `${qualifiedName} xmlns:${prefix}="${attributeUtils.serializeAttributeValue(
- ns,
- requireWellFormed
- )}"`;
- if (localDefaultNamespace !== null) {
- inheritedNs =
- localDefaultNamespace === "" ? null : localDefaultNamespace;
- }
- } else if (localDefaultNamespace === null || localDefaultNamespace !== ns) {
- ignoreNamespaceDefinitionAttr = true;
- qualifiedName = node.localName;
- inheritedNs = ns;
- markup += `${qualifiedName} xmlns="${attributeUtils.serializeAttributeValue(
- ns,
- requireWellFormed
- )}"`;
- } else {
- qualifiedName = node.localName;
- inheritedNs = ns;
- markup += qualifiedName;
- }
- }
- markup += attributeUtils.serializeAttributes(
- node,
- map,
- localPrefixesMap,
- ignoreNamespaceDefinitionAttr,
- requireWellFormed,
- refs
- );
- if (
- ns === NAMESPACES.HTML &&
- node.childNodes.length === 0 &&
- VOID_ELEMENTS.has(node.localName)
- ) {
- markup += " /";
- skipEndTag = true;
- } else if (ns !== NAMESPACES.HTML && node.childNodes.length === 0) {
- markup += "/";
- skipEndTag = true;
- }
- markup += ">";
- if (skipEndTag) {
- return markup;
- }
- if (ns === NAMESPACES.HTML && node.localName === "template") {
- markup += xmlSerialization(
- node.content,
- inheritedNs,
- map,
- requireWellFormed,
- refs
- );
- } else {
- for (const child of node.childNodes) {
- markup += xmlSerialization(
- child,
- inheritedNs,
- map,
- requireWellFormed,
- refs
- );
- }
- }
- markup += `</${qualifiedName}>`;
- return markup;
- }
- function serializeCDATASection(node) {
- return "<![CDATA[" + node.data + "]]>";
- }
- /**
- * @param {{prefixIndex: number}} refs
- */
- function xmlSerialization(node, namespace, prefixMap, requireWellFormed, refs) {
- switch (node.nodeType) {
- case NODE_TYPES.ELEMENT_NODE:
- return serializeElement(
- node,
- namespace,
- prefixMap,
- requireWellFormed,
- refs
- );
- case NODE_TYPES.DOCUMENT_NODE:
- return serializeDocument(
- node,
- namespace,
- prefixMap,
- requireWellFormed,
- refs
- );
- case NODE_TYPES.COMMENT_NODE:
- return serializeComment(node, namespace, prefixMap, requireWellFormed);
- case NODE_TYPES.TEXT_NODE:
- return serializeText(node, namespace, prefixMap, requireWellFormed);
- case NODE_TYPES.DOCUMENT_FRAGMENT_NODE:
- return serializeDocumentFragment(
- node,
- namespace,
- prefixMap,
- requireWellFormed,
- refs
- );
- case NODE_TYPES.DOCUMENT_TYPE_NODE:
- return serializeDocumentType(
- node,
- namespace,
- prefixMap,
- requireWellFormed
- );
- case NODE_TYPES.PROCESSING_INSTRUCTION_NODE:
- return serializeProcessingInstruction(
- node,
- namespace,
- prefixMap,
- requireWellFormed
- );
- case NODE_TYPES.ATTRIBUTE_NODE:
- return "";
- case NODE_TYPES.CDATA_SECTION_NODE:
- return serializeCDATASection(node);
- default:
- throw new TypeError("Only Nodes and Attr objects can be serialized");
- }
- }
- module.exports.produceXMLSerialization = (root, requireWellFormed) => {
- const namespacePrefixMap = Object.create(null);
- namespacePrefixMap["http://www.w3.org/XML/1998/namespace"] = ["xml"];
- try {
- return xmlSerialization(root, null, namespacePrefixMap, requireWellFormed, {
- prefixIndex: 1
- });
- } catch (e) {
- throw new DOMException(
- "Failed to serialize XML: " + e.message,
- "InvalidStateError"
- );
- }
- };
|