2020-12-18 22:06:30 +00:00
|
|
|
(function(f){if(typeof exports==="object"&&typeof module!=="undefined"){module.exports=f()}else if(typeof define==="function"&&define.amd){define([],f)}else{var g;if(typeof window!=="undefined"){g=window}else if(typeof global!=="undefined"){g=global}else if(typeof self!=="undefined"){g=self}else{g=this}g.parse5 = f()}})(function(){var define,module,exports;return (function(){function r(e,n,t){function o(i,f){if(!n[i]){if(!e[i]){var c="function"==typeof require&&require;if(!f&&c)return c(i,!0);if(u)return u(i,!0);var a=new Error("Cannot find module '"+i+"'");throw a.code="MODULE_NOT_FOUND",a}var p=n[i]={exports:{}};e[i][0].call(p.exports,function(r){var n=e[i][1][r];return o(n||r)},p,p.exports,r,e,n,t)}return n[i].exports}for(var u="function"==typeof require&&require,i=0;i<t.length;i++)o(t[i]);return o}return r})()({1:[function(require,module,exports){
|
2022-05-17 01:25:05 +00:00
|
|
|
"use strict";
|
|
|
|
Object.defineProperty(exports, "__esModule", { value: true });
|
|
|
|
exports.getDocumentMode = exports.isConforming = void 0;
|
|
|
|
const html_js_1 = require("./html.js");
|
2020-12-18 22:06:30 +00:00
|
|
|
//Const
|
|
|
|
// Doctype name that isConforming() and getDocumentMode() compare token.name against.
const VALID_DOCTYPE_NAME = 'html';
// The only non-null system identifier that isConforming() accepts.
const VALID_SYSTEM_ID = 'about:legacy-compat';
// System identifier (already lower-cased) that makes getDocumentMode() return quirks mode.
const QUIRKS_MODE_SYSTEM_ID = 'http://www.ibm.com/data/dtd/v11/ibmxhtml1-transitional.dtd';
|
|
|
|
// Lower-cased public identifier prefixes. getDocumentMode() returns quirks mode
// when the lower-cased public identifier starts with any of them; this list is
// used when the doctype token has a non-null system identifier.
const QUIRKS_MODE_PUBLIC_ID_PREFIXES = [
    '+//silmaril//dtd html pro v0r11 19970101//',
    '-//as//dtd html 3.0 aswedit + extensions//',
    '-//advasoft ltd//dtd html 3.0 aswedit + extensions//',
    '-//ietf//dtd html 2.0 level 1//',
    '-//ietf//dtd html 2.0 level 2//',
    '-//ietf//dtd html 2.0 strict level 1//',
    '-//ietf//dtd html 2.0 strict level 2//',
    '-//ietf//dtd html 2.0 strict//',
    '-//ietf//dtd html 2.0//',
    '-//ietf//dtd html 2.1e//',
    '-//ietf//dtd html 3.0//',
    '-//ietf//dtd html 3.2 final//',
    '-//ietf//dtd html 3.2//',
    '-//ietf//dtd html 3//',
    '-//ietf//dtd html level 0//',
    '-//ietf//dtd html level 1//',
    '-//ietf//dtd html level 2//',
    '-//ietf//dtd html level 3//',
    '-//ietf//dtd html strict level 0//',
    '-//ietf//dtd html strict level 1//',
    '-//ietf//dtd html strict level 2//',
    '-//ietf//dtd html strict level 3//',
    '-//ietf//dtd html strict//',
    '-//ietf//dtd html//',
    '-//metrius//dtd metrius presentational//',
    '-//microsoft//dtd internet explorer 2.0 html strict//',
    '-//microsoft//dtd internet explorer 2.0 html//',
    '-//microsoft//dtd internet explorer 2.0 tables//',
    '-//microsoft//dtd internet explorer 3.0 html strict//',
    '-//microsoft//dtd internet explorer 3.0 html//',
    '-//microsoft//dtd internet explorer 3.0 tables//',
    '-//netscape comm. corp.//dtd html//',
    '-//netscape comm. corp.//dtd strict html//',
    "-//o'reilly and associates//dtd html 2.0//",
    "-//o'reilly and associates//dtd html extended 1.0//",
    "-//o'reilly and associates//dtd html extended relaxed 1.0//",
    '-//sq//dtd html 2.0 hotmetal + extensions//',
    '-//softquad software//dtd hotmetal pro 6.0::19990601::extensions to html 4.0//',
    '-//softquad//dtd hotmetal pro 4.0::19971010::extensions to html 4.0//',
    '-//spyglass//dtd html 2.0 extended//',
    '-//sun microsystems corp.//dtd hotjava html//',
    '-//sun microsystems corp.//dtd hotjava strict html//',
    '-//w3c//dtd html 3 1995-03-24//',
    '-//w3c//dtd html 3.2 draft//',
    '-//w3c//dtd html 3.2 final//',
    '-//w3c//dtd html 3.2//',
    '-//w3c//dtd html 3.2s draft//',
    '-//w3c//dtd html 4.0 frameset//',
    '-//w3c//dtd html 4.0 transitional//',
    '-//w3c//dtd html experimental 19960712//',
    '-//w3c//dtd html experimental 970421//',
    '-//w3c//dtd w3 html//',
    '-//w3o//dtd w3 html 3.0//',
    '-//webtechs//dtd mozilla html 2.0//',
    '-//webtechs//dtd mozilla html//',
];
// Prefix list used instead when the system identifier is null: everything above
// plus the two HTML 4.01 frameset/transitional prefixes.
const QUIRKS_MODE_NO_SYSTEM_ID_PUBLIC_ID_PREFIXES = [
    ...QUIRKS_MODE_PUBLIC_ID_PREFIXES,
    '-//w3c//dtd html 4.01 frameset//',
    '-//w3c//dtd html 4.01 transitional//',
];
|
|
|
|
// Lower-cased public identifiers that getDocumentMode() matches exactly
// (not by prefix) to select quirks mode.
const QUIRKS_MODE_PUBLIC_IDS = new Set([
    '-//w3o//dtd w3 html strict 3.0//en//',
    '-/w3c/dtd html 4.0 transitional/en',
    'html',
]);
|
|
|
|
// Lower-cased public identifier prefixes that make getDocumentMode() return
// limited-quirks mode when the system identifier is null.
const LIMITED_QUIRKS_PUBLIC_ID_PREFIXES = [
    '-//w3c//dtd xhtml 1.0 frameset//',
    '-//w3c//dtd xhtml 1.0 transitional//',
];
// Prefix list used instead when the system identifier is not null: the two
// XHTML 1.0 prefixes plus the HTML 4.01 frameset/transitional prefixes.
const LIMITED_QUIRKS_WITH_SYSTEM_ID_PUBLIC_ID_PREFIXES = [
    ...LIMITED_QUIRKS_PUBLIC_ID_PREFIXES,
    '-//w3c//dtd html 4.01 frameset//',
    '-//w3c//dtd html 4.01 transitional//',
];
|
2020-12-18 22:06:30 +00:00
|
|
|
//Utils
|
|
|
|
/**
 * Tells whether `publicId` starts with at least one of the given prefixes.
 *
 * The comparison is case-sensitive; getDocumentMode() lower-cases the
 * identifier before calling this.
 *
 * @param {string} publicId Public identifier to test.
 * @param {string[]} prefixes Candidate prefixes.
 * @returns {boolean} `true` if any prefix matches, `false` otherwise (including for an empty list).
 */
function hasPrefix(publicId, prefixes) {
    return prefixes.some((prefix) => publicId.startsWith(prefix));
}
|
|
|
|
//API
|
2022-05-17 01:25:05 +00:00
|
|
|
/**
 * Checks whether a doctype token has the conforming shape: its name equals
 * VALID_DOCTYPE_NAME, it has no public identifier, and its system identifier
 * is either absent (`null`) or equal to VALID_SYSTEM_ID.
 *
 * @param {{name: ?string, publicId: ?string, systemId: ?string}} token Doctype token.
 * @returns {boolean} `true` when all three conditions hold.
 */
function isConforming(token) {
    return (token.name === VALID_DOCTYPE_NAME &&
        token.publicId === null &&
        (token.systemId === null || token.systemId === VALID_SYSTEM_ID));
}
|
|
|
|
exports.isConforming = isConforming;
|
|
|
|
/**
 * Derives the document mode from a doctype token.
 *
 * The checks run in this order, and the first match wins:
 *  1. name differs from VALID_DOCTYPE_NAME                      -> QUIRKS
 *  2. lower-cased system id equals QUIRKS_MODE_SYSTEM_ID        -> QUIRKS
 *  3. lower-cased public id is in QUIRKS_MODE_PUBLIC_IDS        -> QUIRKS
 *  4. lower-cased public id starts with a quirks prefix         -> QUIRKS
 *  5. lower-cased public id starts with a limited-quirks prefix -> LIMITED_QUIRKS
 *  6. otherwise                                                 -> NO_QUIRKS
 *
 * Which prefix lists are consulted in steps 4 and 5 depends on whether the
 * system identifier is `null`.
 *
 * @param {{name: ?string, publicId: ?string, systemId: ?string}} token Doctype token.
 * @returns {string} One of the `html_js_1.DOCUMENT_MODE` values.
 */
function getDocumentMode(token) {
    if (token.name !== VALID_DOCTYPE_NAME) {
        return html_js_1.DOCUMENT_MODE.QUIRKS;
    }
    const { systemId } = token;
    if (systemId && systemId.toLowerCase() === QUIRKS_MODE_SYSTEM_ID) {
        return html_js_1.DOCUMENT_MODE.QUIRKS;
    }
    // Without a public identifier none of the remaining rules can apply.
    if (token.publicId === null) {
        return html_js_1.DOCUMENT_MODE.NO_QUIRKS;
    }
    // All lookup tables hold lower-cased identifiers.
    const publicId = token.publicId.toLowerCase();
    if (QUIRKS_MODE_PUBLIC_IDS.has(publicId)) {
        return html_js_1.DOCUMENT_MODE.QUIRKS;
    }
    const hasNoSystemId = systemId === null;
    const quirksPrefixes = hasNoSystemId
        ? QUIRKS_MODE_NO_SYSTEM_ID_PUBLIC_ID_PREFIXES
        : QUIRKS_MODE_PUBLIC_ID_PREFIXES;
    if (hasPrefix(publicId, quirksPrefixes)) {
        return html_js_1.DOCUMENT_MODE.QUIRKS;
    }
    const limitedQuirksPrefixes = hasNoSystemId
        ? LIMITED_QUIRKS_PUBLIC_ID_PREFIXES
        : LIMITED_QUIRKS_WITH_SYSTEM_ID_PUBLIC_ID_PREFIXES;
    if (hasPrefix(publicId, limitedQuirksPrefixes)) {
        return html_js_1.DOCUMENT_MODE.LIMITED_QUIRKS;
    }
    return html_js_1.DOCUMENT_MODE.NO_QUIRKS;
}
|
|
|
|
exports.getDocumentMode = getDocumentMode;
|
|
|
|
|
|
|
|
},{"./html.js":4}],2:[function(require,module,exports){
|
|
|
|
"use strict";
|
|
|
|
Object.defineProperty(exports, "__esModule", { value: true });
|
|
|
|
exports.ERR = void 0;
|
|
|
|
// Error-code constants: each camelCase key maps to a kebab-case code string.
// The object is also published as `exports.ERR`; an existing `exports.ERR`
// object is reused if one is already present.
var ERR;
(function (ERR) {
    ERR["controlCharacterInInputStream"] = "control-character-in-input-stream";
    ERR["noncharacterInInputStream"] = "noncharacter-in-input-stream";
    ERR["surrogateInInputStream"] = "surrogate-in-input-stream";
    ERR["nonVoidHtmlElementStartTagWithTrailingSolidus"] = "non-void-html-element-start-tag-with-trailing-solidus";
    ERR["endTagWithAttributes"] = "end-tag-with-attributes";
    ERR["endTagWithTrailingSolidus"] = "end-tag-with-trailing-solidus";
    ERR["unexpectedSolidusInTag"] = "unexpected-solidus-in-tag";
    ERR["unexpectedNullCharacter"] = "unexpected-null-character";
    ERR["unexpectedQuestionMarkInsteadOfTagName"] = "unexpected-question-mark-instead-of-tag-name";
    ERR["invalidFirstCharacterOfTagName"] = "invalid-first-character-of-tag-name";
    ERR["unexpectedEqualsSignBeforeAttributeName"] = "unexpected-equals-sign-before-attribute-name";
    ERR["missingEndTagName"] = "missing-end-tag-name";
    ERR["unexpectedCharacterInAttributeName"] = "unexpected-character-in-attribute-name";
    ERR["unknownNamedCharacterReference"] = "unknown-named-character-reference";
    ERR["missingSemicolonAfterCharacterReference"] = "missing-semicolon-after-character-reference";
    ERR["unexpectedCharacterAfterDoctypeSystemIdentifier"] = "unexpected-character-after-doctype-system-identifier";
    ERR["unexpectedCharacterInUnquotedAttributeValue"] = "unexpected-character-in-unquoted-attribute-value";
    ERR["eofBeforeTagName"] = "eof-before-tag-name";
    ERR["eofInTag"] = "eof-in-tag";
    ERR["missingAttributeValue"] = "missing-attribute-value";
    ERR["missingWhitespaceBetweenAttributes"] = "missing-whitespace-between-attributes";
    ERR["missingWhitespaceAfterDoctypePublicKeyword"] = "missing-whitespace-after-doctype-public-keyword";
    ERR["missingWhitespaceBetweenDoctypePublicAndSystemIdentifiers"] = "missing-whitespace-between-doctype-public-and-system-identifiers";
    ERR["missingWhitespaceAfterDoctypeSystemKeyword"] = "missing-whitespace-after-doctype-system-keyword";
    ERR["missingQuoteBeforeDoctypePublicIdentifier"] = "missing-quote-before-doctype-public-identifier";
    ERR["missingQuoteBeforeDoctypeSystemIdentifier"] = "missing-quote-before-doctype-system-identifier";
    ERR["missingDoctypePublicIdentifier"] = "missing-doctype-public-identifier";
    ERR["missingDoctypeSystemIdentifier"] = "missing-doctype-system-identifier";
    ERR["abruptDoctypePublicIdentifier"] = "abrupt-doctype-public-identifier";
    ERR["abruptDoctypeSystemIdentifier"] = "abrupt-doctype-system-identifier";
    ERR["cdataInHtmlContent"] = "cdata-in-html-content";
    ERR["incorrectlyOpenedComment"] = "incorrectly-opened-comment";
    ERR["eofInScriptHtmlCommentLikeText"] = "eof-in-script-html-comment-like-text";
    ERR["eofInDoctype"] = "eof-in-doctype";
    ERR["nestedComment"] = "nested-comment";
    ERR["abruptClosingOfEmptyComment"] = "abrupt-closing-of-empty-comment";
    ERR["eofInComment"] = "eof-in-comment";
    ERR["incorrectlyClosedComment"] = "incorrectly-closed-comment";
    ERR["eofInCdata"] = "eof-in-cdata";
    ERR["absenceOfDigitsInNumericCharacterReference"] = "absence-of-digits-in-numeric-character-reference";
    ERR["nullCharacterReference"] = "null-character-reference";
    ERR["surrogateCharacterReference"] = "surrogate-character-reference";
    ERR["characterReferenceOutsideUnicodeRange"] = "character-reference-outside-unicode-range";
    ERR["controlCharacterReference"] = "control-character-reference";
    ERR["noncharacterCharacterReference"] = "noncharacter-character-reference";
    ERR["missingWhitespaceBeforeDoctypeName"] = "missing-whitespace-before-doctype-name";
    ERR["missingDoctypeName"] = "missing-doctype-name";
    ERR["invalidCharacterSequenceAfterDoctypeName"] = "invalid-character-sequence-after-doctype-name";
    ERR["duplicateAttribute"] = "duplicate-attribute";
    ERR["nonConformingDoctype"] = "non-conforming-doctype";
    ERR["missingDoctype"] = "missing-doctype";
    ERR["misplacedDoctype"] = "misplaced-doctype";
    ERR["endTagWithoutMatchingOpenElement"] = "end-tag-without-matching-open-element";
    ERR["closingOfElementWithOpenChildElements"] = "closing-of-element-with-open-child-elements";
    ERR["disallowedContentInNoscriptInHead"] = "disallowed-content-in-noscript-in-head";
    ERR["openElementsLeftAfterEof"] = "open-elements-left-after-eof";
    ERR["abandonedHeadElementChild"] = "abandoned-head-element-child";
    ERR["misplacedStartTagForHeadElement"] = "misplaced-start-tag-for-head-element";
    ERR["nestedNoscriptInHead"] = "nested-noscript-in-head";
    ERR["eofInElementThatCanContainOnlyText"] = "eof-in-element-that-can-contain-only-text";
})(ERR = exports.ERR || (exports.ERR = {}));
|
2020-12-18 22:06:30 +00:00
|
|
|
|
|
|
|
},{}],3:[function(require,module,exports){
|
2022-05-17 01:25:05 +00:00
|
|
|
"use strict";
|
|
|
|
Object.defineProperty(exports, "__esModule", { value: true });
|
|
|
|
exports.isIntegrationPoint = exports.adjustTokenSVGTagName = exports.adjustTokenXMLAttrs = exports.adjustTokenSVGAttrs = exports.adjustTokenMathMLAttrs = exports.causesExit = exports.SVG_TAG_NAMES_ADJUSTMENT_MAP = void 0;
|
|
|
|
const html_js_1 = require("./html.js");
|
2020-12-18 22:06:30 +00:00
|
|
|
//MIME types
|
|
|
|
// Lower-case MIME types that isHtmlIntegrationPoint() accepts as the value of
// an `encoding` attribute.
const MIME_TYPES = {
    TEXT_HTML: 'text/html',
    APPLICATION_XML: 'application/xhtml+xml',
};
|
|
|
|
//Attributes
|
|
|
|
// Attribute name as adjustTokenMathMLAttrs() expects to find it on the token...
const DEFINITION_URL_ATTR = 'definitionurl';
// ...and the mixed-case spelling it is renamed to.
const ADJUSTED_DEFINITION_URL_ATTR = 'definitionURL';
|
2022-05-17 01:25:05 +00:00
|
|
|
// Maps the all-lower-case spelling of each listed attribute name to its
// mixed-case spelling. The keys are derived from the list itself, so only the
// mixed-case names have to be maintained. Used by adjustTokenSVGAttrs().
const SVG_ATTRS_ADJUSTMENT_MAP = new Map([
    'attributeName',
    'attributeType',
    'baseFrequency',
    'baseProfile',
    'calcMode',
    'clipPathUnits',
    'diffuseConstant',
    'edgeMode',
    'filterUnits',
    'glyphRef',
    'gradientTransform',
    'gradientUnits',
    'kernelMatrix',
    'kernelUnitLength',
    'keyPoints',
    'keySplines',
    'keyTimes',
    'lengthAdjust',
    'limitingConeAngle',
    'markerHeight',
    'markerUnits',
    'markerWidth',
    'maskContentUnits',
    'maskUnits',
    'numOctaves',
    'pathLength',
    'patternContentUnits',
    'patternTransform',
    'patternUnits',
    'pointsAtX',
    'pointsAtY',
    'pointsAtZ',
    'preserveAlpha',
    'preserveAspectRatio',
    'primitiveUnits',
    'refX',
    'refY',
    'repeatCount',
    'repeatDur',
    'requiredExtensions',
    'requiredFeatures',
    'specularConstant',
    'specularExponent',
    'spreadMethod',
    'startOffset',
    'stdDeviation',
    'stitchTiles',
    'surfaceScale',
    'systemLanguage',
    'tableValues',
    'targetX',
    'targetY',
    'textLength',
    'viewBox',
    'viewTarget',
    'xChannelSelector',
    'yChannelSelector',
    'zoomAndPan',
].map((attr) => [attr.toLowerCase(), attr]));
|
|
|
|
// Maps a qualified attribute name as it appears on a token to the
// { prefix, name, namespace } triple that adjustTokenXMLAttrs() writes back
// onto the attribute. Plain `xmlns` gets an empty prefix.
const XML_ATTRS_ADJUSTMENT_MAP = new Map([
    ['xlink:actuate', { prefix: 'xlink', name: 'actuate', namespace: html_js_1.NS.XLINK }],
    ['xlink:arcrole', { prefix: 'xlink', name: 'arcrole', namespace: html_js_1.NS.XLINK }],
    ['xlink:href', { prefix: 'xlink', name: 'href', namespace: html_js_1.NS.XLINK }],
    ['xlink:role', { prefix: 'xlink', name: 'role', namespace: html_js_1.NS.XLINK }],
    ['xlink:show', { prefix: 'xlink', name: 'show', namespace: html_js_1.NS.XLINK }],
    ['xlink:title', { prefix: 'xlink', name: 'title', namespace: html_js_1.NS.XLINK }],
    ['xlink:type', { prefix: 'xlink', name: 'type', namespace: html_js_1.NS.XLINK }],
    ['xml:base', { prefix: 'xml', name: 'base', namespace: html_js_1.NS.XML }],
    ['xml:lang', { prefix: 'xml', name: 'lang', namespace: html_js_1.NS.XML }],
    ['xml:space', { prefix: 'xml', name: 'space', namespace: html_js_1.NS.XML }],
    ['xmlns', { prefix: '', name: 'xmlns', namespace: html_js_1.NS.XMLNS }],
    ['xmlns:xlink', { prefix: 'xmlns', name: 'xlink', namespace: html_js_1.NS.XMLNS }],
]);
|
2020-12-18 22:06:30 +00:00
|
|
|
//SVG tag names adjustment map
|
2022-05-17 01:25:05 +00:00
|
|
|
exports.SVG_TAG_NAMES_ADJUSTMENT_MAP = new Map([
|
|
|
|
'altGlyph',
|
|
|
|
'altGlyphDef',
|
|
|
|
'altGlyphItem',
|
|
|
|
'animateColor',
|
|
|
|
'animateMotion',
|
|
|
|
'animateTransform',
|
|
|
|
'clipPath',
|
|
|
|
'feBlend',
|
|
|
|
'feColorMatrix',
|
|
|
|
'feComponentTransfer',
|
|
|
|
'feComposite',
|
|
|
|
'feConvolveMatrix',
|
|
|
|
'feDiffuseLighting',
|
|
|
|
'feDisplacementMap',
|
|
|
|
'feDistantLight',
|
|
|
|
'feFlood',
|
|
|
|
'feFuncA',
|
|
|
|
'feFuncB',
|
|
|
|
'feFuncG',
|
|
|
|
'feFuncR',
|
|
|
|
'feGaussianBlur',
|
|
|
|
'feImage',
|
|
|
|
'feMerge',
|
|
|
|
'feMergeNode',
|
|
|
|
'feMorphology',
|
|
|
|
'feOffset',
|
|
|
|
'fePointLight',
|
|
|
|
'feSpecularLighting',
|
|
|
|
'feSpotLight',
|
|
|
|
'feTile',
|
|
|
|
'feTurbulence',
|
|
|
|
'foreignObject',
|
|
|
|
'glyphRef',
|
|
|
|
'linearGradient',
|
|
|
|
'radialGradient',
|
|
|
|
'textPath',
|
|
|
|
].map((tn) => [tn.toLowerCase(), tn]));
|
2020-12-18 22:06:30 +00:00
|
|
|
//Tags that causes exit from foreign content
|
2022-05-17 01:25:05 +00:00
|
|
|
// Tag IDs for which causesExit() returns true unconditionally.
// FONT is deliberately absent: causesExit() handles it separately because it
// only counts when it carries a color, size or face attribute.
const EXITS_FOREIGN_CONTENT = new Set([
    html_js_1.TAG_ID.B,
    html_js_1.TAG_ID.BIG,
    html_js_1.TAG_ID.BLOCKQUOTE,
    html_js_1.TAG_ID.BODY,
    html_js_1.TAG_ID.BR,
    html_js_1.TAG_ID.CENTER,
    html_js_1.TAG_ID.CODE,
    html_js_1.TAG_ID.DD,
    html_js_1.TAG_ID.DIV,
    html_js_1.TAG_ID.DL,
    html_js_1.TAG_ID.DT,
    html_js_1.TAG_ID.EM,
    html_js_1.TAG_ID.EMBED,
    html_js_1.TAG_ID.H1,
    html_js_1.TAG_ID.H2,
    html_js_1.TAG_ID.H3,
    html_js_1.TAG_ID.H4,
    html_js_1.TAG_ID.H5,
    html_js_1.TAG_ID.H6,
    html_js_1.TAG_ID.HEAD,
    html_js_1.TAG_ID.HR,
    html_js_1.TAG_ID.I,
    html_js_1.TAG_ID.IMG,
    html_js_1.TAG_ID.LI,
    html_js_1.TAG_ID.LISTING,
    html_js_1.TAG_ID.MENU,
    html_js_1.TAG_ID.META,
    html_js_1.TAG_ID.NOBR,
    html_js_1.TAG_ID.OL,
    html_js_1.TAG_ID.P,
    html_js_1.TAG_ID.PRE,
    html_js_1.TAG_ID.RUBY,
    html_js_1.TAG_ID.S,
    html_js_1.TAG_ID.SMALL,
    html_js_1.TAG_ID.SPAN,
    html_js_1.TAG_ID.STRONG,
    html_js_1.TAG_ID.STRIKE,
    html_js_1.TAG_ID.SUB,
    html_js_1.TAG_ID.SUP,
    html_js_1.TAG_ID.TABLE,
    html_js_1.TAG_ID.TT,
    html_js_1.TAG_ID.U,
    html_js_1.TAG_ID.UL,
    html_js_1.TAG_ID.VAR,
]);
|
2020-12-18 22:06:30 +00:00
|
|
|
//Check exit from foreign content
|
2022-05-17 01:25:05 +00:00
|
|
|
/**
 * Decides whether a start tag token is one of the tags that cause an exit
 * from foreign content.
 *
 * That is the case when the token's tag ID is in EXITS_FOREIGN_CONTENT, or
 * when it is a FONT tag carrying at least one `color`, `size` or `face`
 * attribute.
 *
 * @param {{tagID: number, attrs: Array<{name: string}>}} startTagToken Start tag token.
 * @returns {boolean} `true` if the tag causes an exit.
 */
function causesExit(startTagToken) {
    const tn = startTagToken.tagID;
    // `attrs` is only inspected for FONT tags.
    const isFontWithAttrs = tn === html_js_1.TAG_ID.FONT &&
        startTagToken.attrs.some(({ name }) => name === html_js_1.ATTRS.COLOR || name === html_js_1.ATTRS.SIZE || name === html_js_1.ATTRS.FACE);
    return isFontWithAttrs || EXITS_FOREIGN_CONTENT.has(tn);
}
|
|
|
|
exports.causesExit = causesExit;
|
2020-12-18 22:06:30 +00:00
|
|
|
//Token adjustments
|
2022-05-17 01:25:05 +00:00
|
|
|
/**
 * Renames the first attribute called DEFINITION_URL_ATTR to
 * ADJUSTED_DEFINITION_URL_ATTR. The token is modified in place; later
 * attributes with the same name are left untouched.
 *
 * @param {{attrs: Array<{name: string}>}} token Tag token whose attributes are adjusted.
 * @returns {void}
 */
function adjustTokenMathMLAttrs(token) {
    const definitionUrlAttr = token.attrs.find((attr) => attr.name === DEFINITION_URL_ATTR);
    if (definitionUrlAttr !== undefined) {
        definitionUrlAttr.name = ADJUSTED_DEFINITION_URL_ATTR;
    }
}
|
|
|
|
exports.adjustTokenMathMLAttrs = adjustTokenMathMLAttrs;
|
|
|
|
/**
 * Replaces the name of every attribute that has an entry in
 * SVG_ATTRS_ADJUSTMENT_MAP with the mapped spelling. The token is modified
 * in place; attributes without an entry are left untouched.
 *
 * @param {{attrs: Array<{name: string}>}} token Tag token whose attributes are adjusted.
 * @returns {void}
 */
function adjustTokenSVGAttrs(token) {
    for (const attr of token.attrs) {
        const adjustedAttrName = SVG_ATTRS_ADJUSTMENT_MAP.get(attr.name);
        if (adjustedAttrName != null) {
            attr.name = adjustedAttrName;
        }
    }
}
|
|
|
|
exports.adjustTokenSVGAttrs = adjustTokenSVGAttrs;
|
|
|
|
/**
 * For every attribute whose name has an entry in XML_ATTRS_ADJUSTMENT_MAP,
 * overwrites the attribute's `prefix`, `name` and `namespace` with the values
 * from that entry. The token is modified in place; other attributes are left
 * untouched.
 *
 * @param {{attrs: Array<{name: string, prefix?: string, namespace?: string}>}} token Tag token whose attributes are adjusted.
 * @returns {void}
 */
function adjustTokenXMLAttrs(token) {
    for (const attr of token.attrs) {
        // Look up by the qualified name before it is replaced by the local name.
        const adjustedAttrEntry = XML_ATTRS_ADJUSTMENT_MAP.get(attr.name);
        if (adjustedAttrEntry) {
            attr.prefix = adjustedAttrEntry.prefix;
            attr.name = adjustedAttrEntry.name;
            attr.namespace = adjustedAttrEntry.namespace;
        }
    }
}
|
|
|
|
exports.adjustTokenXMLAttrs = adjustTokenXMLAttrs;
|
|
|
|
/**
 * If the token's tag name has an entry in `exports.SVG_TAG_NAMES_ADJUSTMENT_MAP`,
 * replaces `token.tagName` with the mapped spelling and recomputes
 * `token.tagID` from the new name. The token is modified in place; tokens
 * without an entry are left untouched.
 *
 * @param {{tagName: string, tagID: number}} token Tag token to adjust.
 * @returns {void}
 */
function adjustTokenSVGTagName(token) {
    const adjustedTagName = exports.SVG_TAG_NAMES_ADJUSTMENT_MAP.get(token.tagName);
    if (adjustedTagName != null) {
        token.tagName = adjustedTagName;
        // `(0, fn)(...)` calls getTagID without binding `this` to html_js_1.
        token.tagID = (0, html_js_1.getTagID)(token.tagName);
    }
}
|
|
|
|
exports.adjustTokenSVGTagName = adjustTokenSVGTagName;
|
2020-12-18 22:06:30 +00:00
|
|
|
//Integration points
|
|
|
|
/**
 * Tells whether an element is a MathML text integration point: an element in
 * the MathML namespace whose tag ID is MI, MO, MN, MS or MTEXT.
 *
 * @param {number} tn Tag ID of the element.
 * @param {string} ns Namespace of the element.
 * @returns {boolean} `true` for the five listed MathML elements.
 */
function isMathMLTextIntegrationPoint(tn, ns) {
    return ns === html_js_1.NS.MATHML && (tn === html_js_1.TAG_ID.MI || tn === html_js_1.TAG_ID.MO || tn === html_js_1.TAG_ID.MN || tn === html_js_1.TAG_ID.MS || tn === html_js_1.TAG_ID.MTEXT);
}
|
|
|
|
/**
 * Tells whether an element is an HTML integration point.
 *
 * Two kinds of element qualify:
 *  - a MathML ANNOTATION_XML element whose first `encoding` attribute equals,
 *    case-insensitively, one of the MIME_TYPES values;
 *  - an SVG FOREIGN_OBJECT, DESC or TITLE element.
 *
 * @param {number} tn Tag ID of the element.
 * @param {string} ns Namespace of the element.
 * @param {Array<{name: string, value: string}>} attrs Attributes of the element; only read for MathML ANNOTATION_XML.
 * @returns {boolean} `true` if the element is an HTML integration point.
 */
function isHtmlIntegrationPoint(tn, ns, attrs) {
    if (ns === html_js_1.NS.MATHML && tn === html_js_1.TAG_ID.ANNOTATION_XML) {
        // Only the first `encoding` attribute decides the outcome.
        const encodingAttr = attrs.find((attr) => attr.name === html_js_1.ATTRS.ENCODING);
        if (encodingAttr !== undefined) {
            const value = encodingAttr.value.toLowerCase();
            return value === MIME_TYPES.TEXT_HTML || value === MIME_TYPES.APPLICATION_XML;
        }
    }
    return ns === html_js_1.NS.SVG && (tn === html_js_1.TAG_ID.FOREIGN_OBJECT || tn === html_js_1.TAG_ID.DESC || tn === html_js_1.TAG_ID.TITLE);
}
|
|
|
|
/**
 * Tells whether an element is an integration point, optionally restricted to
 * one kind.
 *
 * When `foreignNS` is falsy both kinds are checked. When it equals the HTML
 * namespace only HTML integration points count; when it equals the MathML
 * namespace only MathML text integration points count. Any other truthy
 * value yields `false`.
 *
 * @param {number} tn Tag ID of the element.
 * @param {string} ns Namespace of the element.
 * @param {Array<{name: string, value: string}>} attrs Attributes of the element.
 * @param {string} [foreignNS] Namespace selecting which kind of integration point to test for.
 * @returns {boolean} `true` if the element is an integration point of a requested kind.
 */
function isIntegrationPoint(tn, ns, attrs, foreignNS) {
    return (((!foreignNS || foreignNS === html_js_1.NS.HTML) && isHtmlIntegrationPoint(tn, ns, attrs)) ||
        ((!foreignNS || foreignNS === html_js_1.NS.MATHML) && isMathMLTextIntegrationPoint(tn, ns)));
}
|
|
|
|
exports.isIntegrationPoint = isIntegrationPoint;
|
|
|
|
|
|
|
|
},{"./html.js":4}],4:[function(require,module,exports){
|
|
|
|
"use strict";
|
|
|
|
Object.defineProperty(exports, "__esModule", { value: true });
|
|
|
|
exports.hasUnescapedText = exports.isNumberedHeader = exports.SPECIAL_ELEMENTS = exports.getTagID = exports.TAG_ID = exports.TAG_NAMES = exports.DOCUMENT_MODE = exports.ATTRS = exports.NS = void 0;
|
|
|
|
/** All valid namespaces in HTML. */
var NS;
(function (NS) {
    NS["HTML"] = "http://www.w3.org/1999/xhtml";
    NS["MATHML"] = "http://www.w3.org/1998/Math/MathML";
    NS["SVG"] = "http://www.w3.org/2000/svg";
    NS["XLINK"] = "http://www.w3.org/1999/xlink";
    NS["XML"] = "http://www.w3.org/XML/1998/namespace";
    NS["XMLNS"] = "http://www.w3.org/2000/xmlns/";
})(NS = exports.NS || (exports.NS = {}));
|
|
|
|
// Attribute-name constants, also published as `exports.ATTRS`.
var ATTRS;
(function (ATTRS) {
    ATTRS["TYPE"] = "type";
    ATTRS["ACTION"] = "action";
    ATTRS["ENCODING"] = "encoding";
    ATTRS["PROMPT"] = "prompt";
    ATTRS["NAME"] = "name";
    ATTRS["COLOR"] = "color";
    ATTRS["FACE"] = "face";
    ATTRS["SIZE"] = "size";
})(ATTRS = exports.ATTRS || (exports.ATTRS = {}));
|
|
|
|
/**
 * The mode of the document.
 *
 * @see {@link https://dom.spec.whatwg.org/#concept-document-limited-quirks}
 */
var DOCUMENT_MODE;
(function (DOCUMENT_MODE) {
    DOCUMENT_MODE["NO_QUIRKS"] = "no-quirks";
    DOCUMENT_MODE["QUIRKS"] = "quirks";
    DOCUMENT_MODE["LIMITED_QUIRKS"] = "limited-quirks";
})(DOCUMENT_MODE = exports.DOCUMENT_MODE || (exports.DOCUMENT_MODE = {}));
|
|
|
|
// Tag-name constants, also published as `exports.TAG_NAMES`. Every value is
// the lower-cased key, except ANNOTATION_XML ("annotation-xml") and
// FOREIGN_OBJECT ("foreignObject").
var TAG_NAMES;
(function (TAG_NAMES) {
    TAG_NAMES["A"] = "a";
    TAG_NAMES["ADDRESS"] = "address";
    TAG_NAMES["ANNOTATION_XML"] = "annotation-xml";
    TAG_NAMES["APPLET"] = "applet";
    TAG_NAMES["AREA"] = "area";
    TAG_NAMES["ARTICLE"] = "article";
    TAG_NAMES["ASIDE"] = "aside";
    TAG_NAMES["B"] = "b";
    TAG_NAMES["BASE"] = "base";
    TAG_NAMES["BASEFONT"] = "basefont";
    TAG_NAMES["BGSOUND"] = "bgsound";
    TAG_NAMES["BIG"] = "big";
    TAG_NAMES["BLOCKQUOTE"] = "blockquote";
    TAG_NAMES["BODY"] = "body";
    TAG_NAMES["BR"] = "br";
    TAG_NAMES["BUTTON"] = "button";
    TAG_NAMES["CAPTION"] = "caption";
    TAG_NAMES["CENTER"] = "center";
    TAG_NAMES["CODE"] = "code";
    TAG_NAMES["COL"] = "col";
    TAG_NAMES["COLGROUP"] = "colgroup";
    TAG_NAMES["DD"] = "dd";
    TAG_NAMES["DESC"] = "desc";
    TAG_NAMES["DETAILS"] = "details";
    TAG_NAMES["DIALOG"] = "dialog";
    TAG_NAMES["DIR"] = "dir";
    TAG_NAMES["DIV"] = "div";
    TAG_NAMES["DL"] = "dl";
    TAG_NAMES["DT"] = "dt";
    TAG_NAMES["EM"] = "em";
    TAG_NAMES["EMBED"] = "embed";
    TAG_NAMES["FIELDSET"] = "fieldset";
    TAG_NAMES["FIGCAPTION"] = "figcaption";
    TAG_NAMES["FIGURE"] = "figure";
    TAG_NAMES["FONT"] = "font";
    TAG_NAMES["FOOTER"] = "footer";
    TAG_NAMES["FOREIGN_OBJECT"] = "foreignObject";
    TAG_NAMES["FORM"] = "form";
    TAG_NAMES["FRAME"] = "frame";
    TAG_NAMES["FRAMESET"] = "frameset";
    TAG_NAMES["H1"] = "h1";
    TAG_NAMES["H2"] = "h2";
    TAG_NAMES["H3"] = "h3";
    TAG_NAMES["H4"] = "h4";
    TAG_NAMES["H5"] = "h5";
    TAG_NAMES["H6"] = "h6";
    TAG_NAMES["HEAD"] = "head";
    TAG_NAMES["HEADER"] = "header";
    TAG_NAMES["HGROUP"] = "hgroup";
    TAG_NAMES["HR"] = "hr";
    TAG_NAMES["HTML"] = "html";
    TAG_NAMES["I"] = "i";
    TAG_NAMES["IMG"] = "img";
    TAG_NAMES["IMAGE"] = "image";
    TAG_NAMES["INPUT"] = "input";
    TAG_NAMES["IFRAME"] = "iframe";
    TAG_NAMES["KEYGEN"] = "keygen";
    TAG_NAMES["LABEL"] = "label";
    TAG_NAMES["LI"] = "li";
    TAG_NAMES["LINK"] = "link";
    TAG_NAMES["LISTING"] = "listing";
    TAG_NAMES["MAIN"] = "main";
    TAG_NAMES["MALIGNMARK"] = "malignmark";
    TAG_NAMES["MARQUEE"] = "marquee";
    TAG_NAMES["MATH"] = "math";
    TAG_NAMES["MENU"] = "menu";
    TAG_NAMES["META"] = "meta";
    TAG_NAMES["MGLYPH"] = "mglyph";
    TAG_NAMES["MI"] = "mi";
    TAG_NAMES["MO"] = "mo";
    TAG_NAMES["MN"] = "mn";
    TAG_NAMES["MS"] = "ms";
    TAG_NAMES["MTEXT"] = "mtext";
    TAG_NAMES["NAV"] = "nav";
    TAG_NAMES["NOBR"] = "nobr";
    TAG_NAMES["NOFRAMES"] = "noframes";
    TAG_NAMES["NOEMBED"] = "noembed";
    TAG_NAMES["NOSCRIPT"] = "noscript";
    TAG_NAMES["OBJECT"] = "object";
    TAG_NAMES["OL"] = "ol";
    TAG_NAMES["OPTGROUP"] = "optgroup";
    TAG_NAMES["OPTION"] = "option";
    TAG_NAMES["P"] = "p";
    TAG_NAMES["PARAM"] = "param";
    TAG_NAMES["PLAINTEXT"] = "plaintext";
    TAG_NAMES["PRE"] = "pre";
    TAG_NAMES["RB"] = "rb";
    TAG_NAMES["RP"] = "rp";
    TAG_NAMES["RT"] = "rt";
    TAG_NAMES["RTC"] = "rtc";
    TAG_NAMES["RUBY"] = "ruby";
    TAG_NAMES["S"] = "s";
    TAG_NAMES["SCRIPT"] = "script";
    TAG_NAMES["SECTION"] = "section";
    TAG_NAMES["SELECT"] = "select";
    TAG_NAMES["SOURCE"] = "source";
    TAG_NAMES["SMALL"] = "small";
    TAG_NAMES["SPAN"] = "span";
    TAG_NAMES["STRIKE"] = "strike";
    TAG_NAMES["STRONG"] = "strong";
    TAG_NAMES["STYLE"] = "style";
    TAG_NAMES["SUB"] = "sub";
    TAG_NAMES["SUMMARY"] = "summary";
    TAG_NAMES["SUP"] = "sup";
    TAG_NAMES["TABLE"] = "table";
    TAG_NAMES["TBODY"] = "tbody";
    TAG_NAMES["TEMPLATE"] = "template";
    TAG_NAMES["TEXTAREA"] = "textarea";
    TAG_NAMES["TFOOT"] = "tfoot";
    TAG_NAMES["TD"] = "td";
    TAG_NAMES["TH"] = "th";
    TAG_NAMES["THEAD"] = "thead";
    TAG_NAMES["TITLE"] = "title";
    TAG_NAMES["TR"] = "tr";
    TAG_NAMES["TRACK"] = "track";
    TAG_NAMES["TT"] = "tt";
    TAG_NAMES["U"] = "u";
    TAG_NAMES["UL"] = "ul";
    TAG_NAMES["SVG"] = "svg";
    TAG_NAMES["VAR"] = "var";
    TAG_NAMES["WBR"] = "wbr";
    TAG_NAMES["XMP"] = "xmp";
})(TAG_NAMES = exports.TAG_NAMES || (exports.TAG_NAMES = {}));
|
|
|
|
/**
 * Tag IDs are numeric IDs for known tag names.
 *
 * We use tag IDs to improve the performance of tag name comparisons.
 *
 * Each entry is stored in both directions (name -> ID and ID -> name);
 * 0 is reserved for UNKNOWN.
 */
var TAG_ID;
(function (TAG_ID) {
    TAG_ID[TAG_ID["UNKNOWN"] = 0] = "UNKNOWN";
    TAG_ID[TAG_ID["A"] = 1] = "A";
    TAG_ID[TAG_ID["ADDRESS"] = 2] = "ADDRESS";
    TAG_ID[TAG_ID["ANNOTATION_XML"] = 3] = "ANNOTATION_XML";
    TAG_ID[TAG_ID["APPLET"] = 4] = "APPLET";
    TAG_ID[TAG_ID["AREA"] = 5] = "AREA";
    TAG_ID[TAG_ID["ARTICLE"] = 6] = "ARTICLE";
    TAG_ID[TAG_ID["ASIDE"] = 7] = "ASIDE";
    TAG_ID[TAG_ID["B"] = 8] = "B";
    TAG_ID[TAG_ID["BASE"] = 9] = "BASE";
    TAG_ID[TAG_ID["BASEFONT"] = 10] = "BASEFONT";
    TAG_ID[TAG_ID["BGSOUND"] = 11] = "BGSOUND";
    TAG_ID[TAG_ID["BIG"] = 12] = "BIG";
    TAG_ID[TAG_ID["BLOCKQUOTE"] = 13] = "BLOCKQUOTE";
    TAG_ID[TAG_ID["BODY"] = 14] = "BODY";
    TAG_ID[TAG_ID["BR"] = 15] = "BR";
    TAG_ID[TAG_ID["BUTTON"] = 16] = "BUTTON";
    TAG_ID[TAG_ID["CAPTION"] = 17] = "CAPTION";
    TAG_ID[TAG_ID["CENTER"] = 18] = "CENTER";
    TAG_ID[TAG_ID["CODE"] = 19] = "CODE";
    TAG_ID[TAG_ID["COL"] = 20] = "COL";
    TAG_ID[TAG_ID["COLGROUP"] = 21] = "COLGROUP";
    TAG_ID[TAG_ID["DD"] = 22] = "DD";
    TAG_ID[TAG_ID["DESC"] = 23] = "DESC";
    TAG_ID[TAG_ID["DETAILS"] = 24] = "DETAILS";
    TAG_ID[TAG_ID["DIALOG"] = 25] = "DIALOG";
    TAG_ID[TAG_ID["DIR"] = 26] = "DIR";
    TAG_ID[TAG_ID["DIV"] = 27] = "DIV";
    TAG_ID[TAG_ID["DL"] = 28] = "DL";
    TAG_ID[TAG_ID["DT"] = 29] = "DT";
    TAG_ID[TAG_ID["EM"] = 30] = "EM";
    TAG_ID[TAG_ID["EMBED"] = 31] = "EMBED";
    TAG_ID[TAG_ID["FIELDSET"] = 32] = "FIELDSET";
    TAG_ID[TAG_ID["FIGCAPTION"] = 33] = "FIGCAPTION";
    TAG_ID[TAG_ID["FIGURE"] = 34] = "FIGURE";
    TAG_ID[TAG_ID["FONT"] = 35] = "FONT";
    TAG_ID[TAG_ID["FOOTER"] = 36] = "FOOTER";
    TAG_ID[TAG_ID["FOREIGN_OBJECT"] = 37] = "FOREIGN_OBJECT";
    TAG_ID[TAG_ID["FORM"] = 38] = "FORM";
    TAG_ID[TAG_ID["FRAME"] = 39] = "FRAME";
    TAG_ID[TAG_ID["FRAMESET"] = 40] = "FRAMESET";
    TAG_ID[TAG_ID["H1"] = 41] = "H1";
    TAG_ID[TAG_ID["H2"] = 42] = "H2";
    TAG_ID[TAG_ID["H3"] = 43] = "H3";
    TAG_ID[TAG_ID["H4"] = 44] = "H4";
    TAG_ID[TAG_ID["H5"] = 45] = "H5";
    TAG_ID[TAG_ID["H6"] = 46] = "H6";
    TAG_ID[TAG_ID["HEAD"] = 47] = "HEAD";
    TAG_ID[TAG_ID["HEADER"] = 48] = "HEADER";
    TAG_ID[TAG_ID["HGROUP"] = 49] = "HGROUP";
    TAG_ID[TAG_ID["HR"] = 50] = "HR";
    TAG_ID[TAG_ID["HTML"] = 51] = "HTML";
    TAG_ID[TAG_ID["I"] = 52] = "I";
    TAG_ID[TAG_ID["IMG"] = 53] = "IMG";
    TAG_ID[TAG_ID["IMAGE"] = 54] = "IMAGE";
    TAG_ID[TAG_ID["INPUT"] = 55] = "INPUT";
    TAG_ID[TAG_ID["IFRAME"] = 56] = "IFRAME";
    TAG_ID[TAG_ID["KEYGEN"] = 57] = "KEYGEN";
    TAG_ID[TAG_ID["LABEL"] = 58] = "LABEL";
    TAG_ID[TAG_ID["LI"] = 59] = "LI";
    TAG_ID[TAG_ID["LINK"] = 60] = "LINK";
    TAG_ID[TAG_ID["LISTING"] = 61] = "LISTING";
    TAG_ID[TAG_ID["MAIN"] = 62] = "MAIN";
    TAG_ID[TAG_ID["MALIGNMARK"] = 63] = "MALIGNMARK";
    TAG_ID[TAG_ID["MARQUEE"] = 64] = "MARQUEE";
    TAG_ID[TAG_ID["MATH"] = 65] = "MATH";
    TAG_ID[TAG_ID["MENU"] = 66] = "MENU";
    TAG_ID[TAG_ID["META"] = 67] = "META";
    TAG_ID[TAG_ID["MGLYPH"] = 68] = "MGLYPH";
    TAG_ID[TAG_ID["MI"] = 69] = "MI";
    TAG_ID[TAG_ID["MO"] = 70] = "MO";
    TAG_ID[TAG_ID["MN"] = 71] = "MN";
    TAG_ID[TAG_ID["MS"] = 72] = "MS";
    TAG_ID[TAG_ID["MTEXT"] = 73] = "MTEXT";
    TAG_ID[TAG_ID["NAV"] = 74] = "NAV";
    TAG_ID[TAG_ID["NOBR"] = 75] = "NOBR";
    TAG_ID[TAG_ID["NOFRAMES"] = 76] = "NOFRAMES";
    TAG_ID[TAG_ID["NOEMBED"] = 77] = "NOEMBED";
    TAG_ID[TAG_ID["NOSCRIPT"] = 78] = "NOSCRIPT";
    TAG_ID[TAG_ID["OBJECT"] = 79] = "OBJECT";
    TAG_ID[TAG_ID["OL"] = 80] = "OL";
    TAG_ID[TAG_ID["OPTGROUP"] = 81] = "OPTGROUP";
    TAG_ID[TAG_ID["OPTION"] = 82] = "OPTION";
    TAG_ID[TAG_ID["P"] = 83] = "P";
    TAG_ID[TAG_ID["PARAM"] = 84] = "PARAM";
    TAG_ID[TAG_ID["PLAINTEXT"] = 85] = "PLAINTEXT";
    TAG_ID[TAG_ID["PRE"] = 86] = "PRE";
    TAG_ID[TAG_ID["RB"] = 87] = "RB";
    TAG_ID[TAG_ID["RP"] = 88] = "RP";
    TAG_ID[TAG_ID["RT"] = 89] = "RT";
    TAG_ID[TAG_ID["RTC"] = 90] = "RTC";
    TAG_ID[TAG_ID["RUBY"] = 91] = "RUBY";
    TAG_ID[TAG_ID["S"] = 92] = "S";
    TAG_ID[TAG_ID["SCRIPT"] = 93] = "SCRIPT";
    TAG_ID[TAG_ID["SECTION"] = 94] = "SECTION";
    TAG_ID[TAG_ID["SELECT"] = 95] = "SELECT";
    TAG_ID[TAG_ID["SOURCE"] = 96] = "SOURCE";
    TAG_ID[TAG_ID["SMALL"] = 97] = "SMALL";
    TAG_ID[TAG_ID["SPAN"] = 98] = "SPAN";
    TAG_ID[TAG_ID["STRIKE"] = 99] = "STRIKE";
    TAG_ID[TAG_ID["STRONG"] = 100] = "STRONG";
    TAG_ID[TAG_ID["STYLE"] = 101] = "STYLE";
    TAG_ID[TAG_ID["SUB"] = 102] = "SUB";
    TAG_ID[TAG_ID["SUMMARY"] = 103] = "SUMMARY";
    TAG_ID[TAG_ID["SUP"] = 104] = "SUP";
    TAG_ID[TAG_ID["TABLE"] = 105] = "TABLE";
    TAG_ID[TAG_ID["TBODY"] = 106] = "TBODY";
    TAG_ID[TAG_ID["TEMPLATE"] = 107] = "TEMPLATE";
    TAG_ID[TAG_ID["TEXTAREA"] = 108] = "TEXTAREA";
    TAG_ID[TAG_ID["TFOOT"] = 109] = "TFOOT";
    TAG_ID[TAG_ID["TD"] = 110] = "TD";
    TAG_ID[TAG_ID["TH"] = 111] = "TH";
    TAG_ID[TAG_ID["THEAD"] = 112] = "THEAD";
    TAG_ID[TAG_ID["TITLE"] = 113] = "TITLE";
    TAG_ID[TAG_ID["TR"] = 114] = "TR";
    TAG_ID[TAG_ID["TRACK"] = 115] = "TRACK";
    TAG_ID[TAG_ID["TT"] = 116] = "TT";
    TAG_ID[TAG_ID["U"] = 117] = "U";
    TAG_ID[TAG_ID["UL"] = 118] = "UL";
    TAG_ID[TAG_ID["SVG"] = 119] = "SVG";
    TAG_ID[TAG_ID["VAR"] = 120] = "VAR";
    TAG_ID[TAG_ID["WBR"] = 121] = "WBR";
    TAG_ID[TAG_ID["XMP"] = 122] = "XMP";
})(TAG_ID = exports.TAG_ID || (exports.TAG_ID = {}));
|
|
|
|
// Lookup table from a tag-name string (TAG_NAMES.<KEY>) to its numeric ID (TAG_ID.<KEY>).
// Every key below is read from both TAG_NAMES and TAG_ID; entries are inserted in the listed order.
const TAG_NAME_TO_ID = new Map([
    'A', 'ADDRESS', 'ANNOTATION_XML', 'APPLET', 'AREA', 'ARTICLE', 'ASIDE',
    'B', 'BASE', 'BASEFONT', 'BGSOUND', 'BIG', 'BLOCKQUOTE', 'BODY', 'BR', 'BUTTON',
    'CAPTION', 'CENTER', 'CODE', 'COL', 'COLGROUP',
    'DD', 'DESC', 'DETAILS', 'DIALOG', 'DIR', 'DIV', 'DL', 'DT',
    'EM', 'EMBED',
    'FIELDSET', 'FIGCAPTION', 'FIGURE', 'FONT', 'FOOTER', 'FOREIGN_OBJECT', 'FORM', 'FRAME', 'FRAMESET',
    'H1', 'H2', 'H3', 'H4', 'H5', 'H6', 'HEAD', 'HEADER', 'HGROUP', 'HR', 'HTML',
    'I', 'IMG', 'IMAGE', 'INPUT', 'IFRAME',
    'KEYGEN',
    'LABEL', 'LI', 'LINK', 'LISTING',
    'MAIN', 'MALIGNMARK', 'MARQUEE', 'MATH', 'MENU', 'META', 'MGLYPH', 'MI', 'MO', 'MN', 'MS', 'MTEXT',
    'NAV', 'NOBR', 'NOFRAMES', 'NOEMBED', 'NOSCRIPT',
    'OBJECT', 'OL', 'OPTGROUP', 'OPTION',
    'P', 'PARAM', 'PLAINTEXT', 'PRE',
    'RB', 'RP', 'RT', 'RTC', 'RUBY',
    'S', 'SCRIPT', 'SECTION', 'SELECT', 'SOURCE', 'SMALL', 'SPAN', 'STRIKE', 'STRONG', 'STYLE', 'SUB', 'SUMMARY', 'SUP',
    'TABLE', 'TBODY', 'TEMPLATE', 'TEXTAREA', 'TFOOT', 'TD', 'TH', 'THEAD', 'TITLE', 'TR', 'TRACK', 'TT',
    'U', 'UL',
    'SVG',
    'VAR',
    'WBR',
    'XMP',
].map((key) => [TAG_NAMES[key], TAG_ID[key]]));
|
|
|
|
/**
 * Resolves a tag name to its numeric tag ID.
 *
 * @param tagName Tag name to look up in `TAG_NAME_TO_ID`.
 * @returns The mapped ID, or `TAG_ID.UNKNOWN` when the lookup yields `null`/`undefined`.
 */
function getTagID(tagName) {
    const knownId = TAG_NAME_TO_ID.get(tagName);
    // Only a missing entry falls back; a mapped ID of 0 is returned as-is.
    if (knownId === null || knownId === undefined) {
        return TAG_ID.UNKNOWN;
    }
    return knownId;
}
|
2022-05-17 01:25:05 +00:00
|
|
|
exports.getTagID = getTagID;
|
|
|
|
const $ = TAG_ID;
|
2020-12-18 22:06:30 +00:00
|
|
|
exports.SPECIAL_ELEMENTS = {
|
2022-05-17 01:25:05 +00:00
|
|
|
[NS.HTML]: new Set([
|
|
|
|
$.ADDRESS,
|
|
|
|
$.APPLET,
|
|
|
|
$.AREA,
|
|
|
|
$.ARTICLE,
|
|
|
|
$.ASIDE,
|
|
|
|
$.BASE,
|
|
|
|
$.BASEFONT,
|
|
|
|
$.BGSOUND,
|
|
|
|
$.BLOCKQUOTE,
|
|
|
|
$.BODY,
|
|
|
|
$.BR,
|
|
|
|
$.BUTTON,
|
|
|
|
$.CAPTION,
|
|
|
|
$.CENTER,
|
|
|
|
$.COL,
|
|
|
|
$.COLGROUP,
|
|
|
|
$.DD,
|
|
|
|
$.DETAILS,
|
|
|
|
$.DIR,
|
|
|
|
$.DIV,
|
|
|
|
$.DL,
|
|
|
|
$.DT,
|
|
|
|
$.EMBED,
|
|
|
|
$.FIELDSET,
|
|
|
|
$.FIGCAPTION,
|
|
|
|
$.FIGURE,
|
|
|
|
$.FOOTER,
|
|
|
|
$.FORM,
|
|
|
|
$.FRAME,
|
|
|
|
$.FRAMESET,
|
|
|
|
$.H1,
|
|
|
|
$.H2,
|
|
|
|
$.H3,
|
|
|
|
$.H4,
|
|
|
|
$.H5,
|
|
|
|
$.H6,
|
|
|
|
$.HEAD,
|
|
|
|
$.HEADER,
|
|
|
|
$.HGROUP,
|
|
|
|
$.HR,
|
|
|
|
$.HTML,
|
|
|
|
$.IFRAME,
|
|
|
|
$.IMG,
|
|
|
|
$.INPUT,
|
|
|
|
$.LI,
|
|
|
|
$.LINK,
|
|
|
|
$.LISTING,
|
|
|
|
$.MAIN,
|
|
|
|
$.MARQUEE,
|
|
|
|
$.MENU,
|
|
|
|
$.META,
|
|
|
|
$.NAV,
|
|
|
|
$.NOEMBED,
|
|
|
|
$.NOFRAMES,
|
|
|
|
$.NOSCRIPT,
|
|
|
|
$.OBJECT,
|
|
|
|
$.OL,
|
|
|
|
$.P,
|
|
|
|
$.PARAM,
|
|
|
|
$.PLAINTEXT,
|
|
|
|
$.PRE,
|
|
|
|
$.SCRIPT,
|
|
|
|
$.SECTION,
|
|
|
|
$.SELECT,
|
|
|
|
$.SOURCE,
|
|
|
|
$.STYLE,
|
|
|
|
$.SUMMARY,
|
|
|
|
$.TABLE,
|
|
|
|
$.TBODY,
|
|
|
|
$.TD,
|
|
|
|
$.TEMPLATE,
|
|
|
|
$.TEXTAREA,
|
|
|
|
$.TFOOT,
|
|
|
|
$.TH,
|
|
|
|
$.THEAD,
|
|
|
|
$.TITLE,
|
|
|
|
$.TR,
|
|
|
|
$.TRACK,
|
|
|
|
$.UL,
|
|
|
|
$.WBR,
|
|
|
|
$.XMP,
|
|
|
|
]),
|
|
|
|
[NS.MATHML]: new Set([$.MI, $.MO, $.MN, $.MS, $.MTEXT, $.ANNOTATION_XML]),
|
|
|
|
[NS.SVG]: new Set([$.TITLE, $.FOREIGN_OBJECT, $.DESC]),
|
|
|
|
[NS.XLINK]: new Set(),
|
|
|
|
[NS.XML]: new Set(),
|
|
|
|
[NS.XMLNS]: new Set(),
|
2020-12-18 22:06:30 +00:00
|
|
|
};
|
2022-05-17 01:25:05 +00:00
|
|
|
/**
 * Tells whether a tag ID is one of the numbered headings H1 through H6.
 *
 * @param tn Tag ID to test (compared with strict equality).
 * @returns `true` for H1..H6, `false` otherwise.
 */
function isNumberedHeader(tn) {
    switch (tn) {
        case $.H1:
        case $.H2:
        case $.H3:
        case $.H4:
        case $.H5:
        case $.H6:
            return true;
        default:
            return false;
    }
}
|
|
|
|
exports.isNumberedHeader = isNumberedHeader;
|
|
|
|
// Tag names consulted by hasUnescapedText(); NOSCRIPT is handled there separately
// because it additionally depends on the scripting flag.
const UNESCAPED_TEXT = new Set()
    .add(TAG_NAMES.STYLE)
    .add(TAG_NAMES.SCRIPT)
    .add(TAG_NAMES.XMP)
    .add(TAG_NAMES.IFRAME)
    .add(TAG_NAMES.NOEMBED)
    .add(TAG_NAMES.NOFRAMES)
    .add(TAG_NAMES.PLAINTEXT);
|
|
|
|
/**
 * Checks whether a tag name is in `UNESCAPED_TEXT`, or is `noscript` while scripting is enabled.
 *
 * @param tn Tag name to test.
 * @param scriptingEnabled Scripting flag; only consulted when `tn` is not in `UNESCAPED_TEXT`.
 * @returns `true` when `tn` is in the set; otherwise the result of
 *   `scriptingEnabled && tn === TAG_NAMES.NOSCRIPT` (a falsy `scriptingEnabled` is returned unchanged).
 */
function hasUnescapedText(tn, scriptingEnabled) {
    if (UNESCAPED_TEXT.has(tn)) {
        return true;
    }
    return scriptingEnabled && tn === TAG_NAMES.NOSCRIPT;
}
|
|
|
|
exports.hasUnescapedText = hasUnescapedText;
|
2020-12-18 22:06:30 +00:00
|
|
|
|
|
|
|
},{}],5:[function(require,module,exports){
|
2022-05-17 01:25:05 +00:00
|
|
|
"use strict";
|
|
|
|
Object.defineProperty(exports, "__esModule", { value: true });
|
|
|
|
exports.getTokenAttr = exports.TokenType = void 0;
|
|
|
|
// Numeric token type identifiers, with a reverse (number -> name) mapping on the same object.
var TokenType;
(function (TokenType) {
    // The array position of each name is its numeric value.
    const names = [
        'CHARACTER',
        'NULL_CHARACTER',
        'WHITESPACE_CHARACTER',
        'START_TAG',
        'END_TAG',
        'COMMENT',
        'DOCTYPE',
        'EOF',
        'HIBERNATION',
    ];
    names.forEach((name, ordinal) => {
        TokenType[name] = ordinal;
        TokenType[ordinal] = name;
    });
})(TokenType = exports.TokenType || (exports.TokenType = {}));
|
|
|
|
/**
 * Looks up an attribute value on a token by attribute name.
 *
 * The attribute list is scanned from the end, so if the same name occurs
 * more than once the last occurrence wins.
 *
 * @param token Token whose `attrs` array (`{ name, value }` items) is searched.
 * @param attrName Attribute name to match exactly.
 * @returns The matching attribute's value, or `null` when there is no match.
 */
function getTokenAttr(token, attrName) {
    const { attrs } = token;
    let idx = attrs.length;
    while (idx-- > 0) {
        const attr = attrs[idx];
        if (attr.name === attrName) {
            return attr.value;
        }
    }
    return null;
}
|
|
|
|
exports.getTokenAttr = getTokenAttr;
|
2020-12-18 22:06:30 +00:00
|
|
|
|
2022-05-17 01:25:05 +00:00
|
|
|
},{}],6:[function(require,module,exports){
|
|
|
|
"use strict";
|
|
|
|
Object.defineProperty(exports, "__esModule", { value: true });
|
|
|
|
exports.isUndefinedCodePoint = exports.isControlCodePoint = exports.getSurrogatePairCodePoint = exports.isSurrogatePair = exports.isSurrogate = exports.SEQUENCES = exports.CODE_POINTS = exports.REPLACEMENT_CHARACTER = void 0;
|
|
|
|
// The last two code points (xxFFFE and xxFFFF) of each of the 17 planes 0x00..0x10,
// inserted plane by plane in ascending order: 0xFFFE, 0xFFFF, 0x1FFFE, ... 0x10FFFF.
const UNDEFINED_CODE_POINTS = new Set();
for (let plane = 0; plane <= 0x10; plane++) {
    const planeStart = plane * 0x10000;
    UNDEFINED_CODE_POINTS.add(planeStart + 0xfffe);
    UNDEFINED_CODE_POINTS.add(planeStart + 0xffff);
}
|
2020-12-18 22:06:30 +00:00
|
|
|
exports.REPLACEMENT_CHARACTER = '\uFFFD';
|
2022-05-17 01:25:05 +00:00
|
|
|
// Named code point constants, with a reverse (number -> name) mapping on the same object.
var CODE_POINTS;
(function (CODE_POINTS) {
    const table = [
        ['EOF', -1],
        ['NULL', 0],
        ['TABULATION', 9],
        ['CARRIAGE_RETURN', 13],
        ['LINE_FEED', 10],
        ['FORM_FEED', 12],
        ['SPACE', 32],
        ['EXCLAMATION_MARK', 33],
        ['QUOTATION_MARK', 34],
        ['NUMBER_SIGN', 35],
        ['AMPERSAND', 38],
        ['APOSTROPHE', 39],
        ['HYPHEN_MINUS', 45],
        ['SOLIDUS', 47],
        ['DIGIT_0', 48],
        ['DIGIT_9', 57],
        ['SEMICOLON', 59],
        ['LESS_THAN_SIGN', 60],
        ['EQUALS_SIGN', 61],
        ['GREATER_THAN_SIGN', 62],
        ['QUESTION_MARK', 63],
        ['LATIN_CAPITAL_A', 65],
        ['LATIN_CAPITAL_F', 70],
        ['LATIN_CAPITAL_X', 88],
        ['LATIN_CAPITAL_Z', 90],
        ['RIGHT_SQUARE_BRACKET', 93],
        ['GRAVE_ACCENT', 96],
        ['LATIN_SMALL_A', 97],
        ['LATIN_SMALL_F', 102],
        ['LATIN_SMALL_X', 120],
        ['LATIN_SMALL_Z', 122],
        ['REPLACEMENT_CHARACTER', 65533],
    ];
    for (const [name, codePoint] of table) {
        CODE_POINTS[name] = codePoint;
        CODE_POINTS[codePoint] = name;
    }
})(CODE_POINTS = exports.CODE_POINTS || (exports.CODE_POINTS = {}));
|
|
|
|
exports.SEQUENCES = {
|
|
|
|
DASH_DASH: '--',
|
|
|
|
CDATA_START: '[CDATA[',
|
|
|
|
DOCTYPE: 'doctype',
|
|
|
|
SCRIPT: 'script',
|
|
|
|
PUBLIC: 'public',
|
|
|
|
SYSTEM: 'system',
|
2020-12-18 22:06:30 +00:00
|
|
|
};
|
|
|
|
//Surrogates
|
2022-05-17 01:25:05 +00:00
|
|
|
/**
 * Tells whether a code point lies in the surrogate range 0xD800..0xDFFF (inclusive).
 *
 * @param cp Code point to test.
 * @returns `true` when `cp` is within the range.
 */
function isSurrogate(cp) {
    const FIRST_SURROGATE = 0xd800;
    const LAST_SURROGATE = 0xdfff;
    return cp >= FIRST_SURROGATE && cp <= LAST_SURROGATE;
}
|
|
|
|
exports.isSurrogate = isSurrogate;
|
|
|
|
/**
 * Tells whether a code point lies in the range 0xDC00..0xDFFF (inclusive),
 * i.e. the upper half of the surrogate range.
 *
 * @param cp Code point to test.
 * @returns `true` when `cp` is within the range.
 */
function isSurrogatePair(cp) {
    const RANGE_START = 0xdc00;
    const RANGE_END = 0xdfff;
    return cp >= RANGE_START && cp <= RANGE_END;
}
|
|
|
|
exports.isSurrogatePair = isSurrogatePair;
|
|
|
|
/**
 * Combines two surrogate code units into a single code point.
 *
 * Computes `(cp1 - 0xD800) * 0x400 + 0x2400 + cp2`, where 0x2400 equals
 * `0x10000 - 0xDC00`.
 *
 * @param cp1 First code unit of the pair.
 * @param cp2 Second code unit of the pair.
 * @returns The combined code point.
 */
function getSurrogatePairCodePoint(cp1, cp2) {
    const leadContribution = (cp1 - 0xd800) * 0x400;
    return leadContribution + 0x2400 + cp2;
}
|
|
|
|
exports.getSurrogatePairCodePoint = getSurrogatePairCodePoint;
|
2020-12-18 22:06:30 +00:00
|
|
|
/**
 * Tells whether a code point is a control character.
 *
 * NOTE: NULL and ASCII whitespace are excluded. The accepted values are
 * 0x01..0x1F minus TAB (0x09), LF (0x0A), FF (0x0C) and CR (0x0D), plus 0x7F..0x9F.
 *
 * @param cp Code point to test.
 * @returns `true` for an accepted control code point.
 */
function isControlCodePoint(cp) {
    if (cp >= 0x7f && cp <= 0x9f) {
        return true;
    }
    const inLowControlRange = cp >= 0x01 && cp <= 0x1f;
    if (!inLowControlRange) {
        // Covers NULL, SPACE (0x20) and everything else outside both ranges.
        return false;
    }
    switch (cp) {
        case 0x09:
        case 0x0a:
        case 0x0c:
        case 0x0d:
            return false;
        default:
            return true;
    }
}
|
|
|
|
exports.isControlCodePoint = isControlCodePoint;
|
|
|
|
/**
 * Tells whether a code point is in 0xFDD0..0xFDEF (inclusive) or is a member
 * of `UNDEFINED_CODE_POINTS`.
 *
 * @param cp Code point to test.
 * @returns `true` when either condition holds.
 */
function isUndefinedCodePoint(cp) {
    if (cp >= 0xfdd0 && cp <= 0xfdef) {
        return true;
    }
    return UNDEFINED_CODE_POINTS.has(cp);
}
|
|
|
|
exports.isUndefinedCodePoint = isUndefinedCodePoint;
|
|
|
|
|
|
|
|
},{}],7:[function(require,module,exports){
|
|
|
|
"use strict";
|
|
|
|
Object.defineProperty(exports, "__esModule", { value: true });
|
|
|
|
exports.parseFragment = exports.parse = exports.TokenizerMode = exports.Tokenizer = exports.Token = exports.html = exports.foreignContent = exports.serializeOuter = exports.serialize = exports.Parser = exports.defaultTreeAdapter = void 0;
|
|
|
|
const index_js_1 = require("./parser/index.js");
|
|
|
|
var default_js_1 = require("./tree-adapters/default.js");
|
|
|
|
Object.defineProperty(exports, "defaultTreeAdapter", { enumerable: true, get: function () { return default_js_1.defaultTreeAdapter; } });
|
|
|
|
var index_js_2 = require("./parser/index.js");
|
|
|
|
Object.defineProperty(exports, "Parser", { enumerable: true, get: function () { return index_js_2.Parser; } });
|
|
|
|
var index_js_3 = require("./serializer/index.js");
|
|
|
|
Object.defineProperty(exports, "serialize", { enumerable: true, get: function () { return index_js_3.serialize; } });
|
|
|
|
Object.defineProperty(exports, "serializeOuter", { enumerable: true, get: function () { return index_js_3.serializeOuter; } });
|
|
|
|
/** @internal */
|
|
|
|
exports.foreignContent = require("./common/foreign-content.js");
|
|
|
|
/** @internal */
|
|
|
|
exports.html = require("./common/html.js");
|
|
|
|
/** @internal */
|
|
|
|
exports.Token = require("./common/token.js");
|
|
|
|
/** @internal */
|
|
|
|
var index_js_4 = require("./tokenizer/index.js");
|
|
|
|
Object.defineProperty(exports, "Tokenizer", { enumerable: true, get: function () { return index_js_4.Tokenizer; } });
|
|
|
|
Object.defineProperty(exports, "TokenizerMode", { enumerable: true, get: function () { return index_js_4.TokenizerMode; } });
|
|
|
|
// Shorthands
|
|
|
|
/**
 * Parses an HTML string into a document by delegating to `Parser.parse`.
 *
 * @param html Input HTML string.
 * @param options Parsing options, passed through unchanged.
 * @returns Document
 *
 * @example
 *
 * ```js
 * const parse5 = require('parse5');
 *
 * const document = parse5.parse('<!DOCTYPE html><html><head></head><body>Hi there!</body></html>');
 *
 * console.log(document.childNodes[1].tagName); //> 'html'
 * ```
 */
function parse(html, options) {
    const { Parser } = index_js_1;
    return Parser.parse(html, options);
}
|
|
|
|
exports.parse = parse;
|
|
|
|
/**
 * Parses an HTML fragment.
 *
 * Two call shapes are accepted:
 *  - `parseFragment(fragmentContext, html, options)`
 *  - `parseFragment(html, options)` — detected by the first argument being a string,
 *    in which case `null` is used as the fragment context.
 *
 * @param fragmentContext Context element, or the HTML string when the context is omitted.
 * @param html HTML string, or the options object when the context is omitted.
 * @param options Parsing options (only read in the three-argument form).
 * @returns Whatever the fragment parser's `getFragment()` returns.
 */
function parseFragment(fragmentContext, html, options) {
    const contextOmitted = typeof fragmentContext === 'string';
    const context = contextOmitted ? null : fragmentContext;
    const source = contextOmitted ? fragmentContext : html;
    const parserOptions = contextOmitted ? html : options;
    const fragmentParser = index_js_1.Parser.getFragmentParser(context, parserOptions);
    // `true` marks this chunk as the last one.
    fragmentParser.tokenizer.write(source, true);
    return fragmentParser.getFragment();
}
|
2022-05-17 01:25:05 +00:00
|
|
|
exports.parseFragment = parseFragment;
|
2020-12-18 22:06:30 +00:00
|
|
|
|
2022-05-17 01:25:05 +00:00
|
|
|
},{"./common/foreign-content.js":3,"./common/html.js":4,"./common/token.js":5,"./parser/index.js":9,"./serializer/index.js":11,"./tokenizer/index.js":12,"./tree-adapters/default.js":14}],8:[function(require,module,exports){
|
|
|
|
"use strict";
|
|
|
|
Object.defineProperty(exports, "__esModule", { value: true });
|
|
|
|
exports.FormattingElementList = exports.EntryType = void 0;
|
|
|
|
//Const
|
|
|
|
const NOAH_ARK_CAPACITY = 3;
|
|
|
|
// Kinds of entries held by FormattingElementList, with a reverse (number -> name) mapping.
var EntryType;
(function (EntryType) {
    ['Marker', 'Element'].forEach((name, ordinal) => {
        EntryType[name] = ordinal;
        EntryType[ordinal] = name;
    });
})(EntryType = exports.EntryType || (exports.EntryType = {}));
|
|
|
|
const MARKER = { type: EntryType.Marker };
|
|
|
|
//List of formatting elements
|
|
|
|
/**
 * List of active formatting elements.
 *
 * Entries are kept newest-first: `pushElement()` and `insertMarker()` add at
 * index 0. An entry is either the shared `MARKER` object or an object of the
 * form `{ type: EntryType.Element, element, token }`.
 */
class FormattingElementList {
    /**
     * @param treeAdapter Adapter used to read tag names, namespaces and attribute lists of elements.
     */
    constructor(treeAdapter) {
        this.treeAdapter = treeAdapter;
        this.entries = [];
        // Entry used as the insertion point by insertElementAfterBookmark(); set by callers.
        this.bookmark = null;
    }
    //Noah's Ark condition
    //OPTIMIZATION: at first we try to find possible candidates for exclusion using
    //lightweight heuristics without thorough attributes check.
    /**
     * Collects entries, from the newest down to the first marker, whose element has the
     * same tag name, namespace and attribute count as `newElement`.
     *
     * @param newElement Element about to be pushed.
     * @param neAttrs Attribute list of `newElement`.
     * @returns Array of `{ idx, attrs }` in ascending `idx` order, where `idx` is the
     *   entry's position in `this.entries` at the time of the call.
     */
    _getNoahArkConditionCandidates(newElement, neAttrs) {
        const candidates = [];
        const neAttrsLength = neAttrs.length;
        const neTagName = this.treeAdapter.getTagName(newElement);
        const neNamespaceURI = this.treeAdapter.getNamespaceURI(newElement);
        for (let i = 0; i < this.entries.length; i++) {
            const entry = this.entries[i];
            // Only entries after the last marker take part in the check.
            if (entry.type === EntryType.Marker) {
                break;
            }
            const { element } = entry;
            if (this.treeAdapter.getTagName(element) === neTagName &&
                this.treeAdapter.getNamespaceURI(element) === neNamespaceURI) {
                const elementAttrs = this.treeAdapter.getAttrList(element);
                if (elementAttrs.length === neAttrsLength) {
                    candidates.push({ idx: i, attrs: elementAttrs });
                }
            }
        }
        return candidates;
    }
    /**
     * Enforces the Noah's Ark condition before `newElement` is pushed: among the entries
     * after the last marker that match `newElement` (tag name, namespace and attributes),
     * only the `NOAH_ARK_CAPACITY - 1` newest are kept; every older match is removed.
     *
     * @param newElement Element about to be pushed.
     */
    _ensureNoahArkCondition(newElement) {
        if (this.entries.length < NOAH_ARK_CAPACITY)
            return;
        const neAttrs = this.treeAdapter.getAttrList(newElement);
        const candidates = this._getNoahArkConditionCandidates(newElement, neAttrs);
        if (candidates.length < NOAH_ARK_CAPACITY)
            return;
        //NOTE: build attrs map for the new element, so we can perform fast lookups
        const neAttrsMap = new Map(neAttrs.map((neAttr) => [neAttr.name, neAttr.value]));
        let validCandidates = 0;
        let removedCount = 0;
        //NOTE: remove bottommost candidates until the Noah's Ark condition is no longer met
        for (let i = 0; i < candidates.length; i++) {
            const candidate = candidates[i];
            // We know that `candidate.attrs.length === neAttrs.length`
            if (candidate.attrs.every((cAttr) => neAttrsMap.get(cAttr.name) === cAttr.value)) {
                validCandidates += 1;
                if (validCandidates >= NOAH_ARK_CAPACITY) {
                    // `candidate.idx` was recorded before any removal. Candidates are visited in
                    // ascending index order, so every earlier removal happened at a lower index
                    // and shifted this entry down by one.
                    this.entries.splice(candidate.idx - removedCount, 1);
                    removedCount += 1;
                }
            }
        }
    }
    //Mutations
    /** Adds the shared marker entry at the front of the list. */
    insertMarker() {
        this.entries.unshift(MARKER);
    }
    /**
     * Adds an element entry at the front of the list, first enforcing the Noah's Ark condition.
     *
     * @param element Element to record.
     * @param token Token stored alongside the element.
     */
    pushElement(element, token) {
        this._ensureNoahArkCondition(element);
        this.entries.unshift({
            type: EntryType.Element,
            element,
            token,
        });
    }
    /**
     * Inserts an element entry at the array index currently held by `this.bookmark`;
     * the bookmark entry and everything after it shift one position toward the end.
     * No Noah's Ark check is performed here.
     *
     * NOTE(review): if `this.bookmark` is not in the list, `indexOf` yields -1 and `splice`
     * inserts before the last entry — callers presumably guarantee the bookmark is present.
     *
     * @param element Element to record.
     * @param token Token stored alongside the element.
     */
    insertElementAfterBookmark(element, token) {
        const bookmarkIdx = this.entries.indexOf(this.bookmark);
        this.entries.splice(bookmarkIdx, 0, {
            type: EntryType.Element,
            element,
            token,
        });
    }
    /**
     * Removes the given entry object (matched by identity); does nothing when it is absent.
     *
     * @param entry Entry to remove.
     */
    removeEntry(entry) {
        const entryIndex = this.entries.indexOf(entry);
        if (entryIndex >= 0) {
            this.entries.splice(entryIndex, 1);
        }
    }
    /**
     * Removes every entry from the front of the list up to and including the first marker.
     * When the list holds no marker, it is emptied.
     */
    clearToLastMarker() {
        const markerIdx = this.entries.indexOf(MARKER);
        if (markerIdx >= 0) {
            this.entries.splice(0, markerIdx + 1);
        }
        else {
            this.entries.length = 0;
        }
    }
    //Search
    /**
     * Finds the newest element entry with the given tag name that is not hidden behind a marker.
     *
     * @param tagName Tag name to match.
     * @returns The element entry, or `null` when a marker is met first or nothing matches.
     */
    getElementEntryInScopeWithTagName(tagName) {
        // The search stops at the first marker OR the first tag-name match, whichever comes first.
        const entry = this.entries.find((entry) => entry.type === EntryType.Marker || this.treeAdapter.getTagName(entry.element) === tagName);
        return entry && entry.type === EntryType.Element ? entry : null;
    }
    /**
     * Finds the entry that records the given element (matched by identity).
     *
     * @param element Element to look for.
     * @returns The entry, or `undefined` when the element is not in the list.
     */
    getElementEntry(element) {
        return this.entries.find((entry) => entry.type === EntryType.Element && entry.element === element);
    }
}
|
|
|
|
exports.FormattingElementList = FormattingElementList;
|
|
|
|
|
|
|
|
},{}],9:[function(require,module,exports){
|
|
|
|
"use strict";
|
|
|
|
Object.defineProperty(exports, "__esModule", { value: true });
|
|
|
|
exports.Parser = void 0;
|
|
|
|
const index_js_1 = require("../tokenizer/index.js");
|
|
|
|
const open_element_stack_js_1 = require("./open-element-stack.js");
|
|
|
|
const formatting_element_list_js_1 = require("./formatting-element-list.js");
|
|
|
|
const default_js_1 = require("../tree-adapters/default.js");
|
|
|
|
const doctype = require("../common/doctype.js");
|
|
|
|
const foreignContent = require("../common/foreign-content.js");
|
|
|
|
const error_codes_js_1 = require("../common/error-codes.js");
|
|
|
|
const unicode = require("../common/unicode.js");
|
|
|
|
const html_js_1 = require("../common/html.js");
|
|
|
|
const token_js_1 = require("../common/token.js");
|
2020-12-18 22:06:30 +00:00
|
|
|
//Misc constants
|
|
|
|
const HIDDEN_INPUT_TYPE = 'hidden';
|
|
|
|
//Adoption agency loops iteration count
|
|
|
|
const AA_OUTER_LOOP_ITER = 8;
|
|
|
|
const AA_INNER_LOOP_ITER = 3;
|
|
|
|
//Insertion modes
|
2022-05-17 01:25:05 +00:00
|
|
|
// Insertion modes as numeric constants, with a reverse (number -> name) mapping on the same object.
var InsertionMode;
(function (InsertionMode) {
    // The array position of each name is its numeric value (0..22).
    const modeNames = [
        'INITIAL',
        'BEFORE_HTML',
        'BEFORE_HEAD',
        'IN_HEAD',
        'IN_HEAD_NO_SCRIPT',
        'AFTER_HEAD',
        'IN_BODY',
        'TEXT',
        'IN_TABLE',
        'IN_TABLE_TEXT',
        'IN_CAPTION',
        'IN_COLUMN_GROUP',
        'IN_TABLE_BODY',
        'IN_ROW',
        'IN_CELL',
        'IN_SELECT',
        'IN_SELECT_IN_TABLE',
        'IN_TEMPLATE',
        'AFTER_BODY',
        'IN_FRAMESET',
        'AFTER_FRAMESET',
        'AFTER_AFTER_BODY',
        'AFTER_AFTER_FRAMESET',
    ];
    modeNames.forEach((name, ordinal) => {
        InsertionMode[name] = ordinal;
        InsertionMode[ordinal] = name;
    });
})(InsertionMode || (InsertionMode = {}));
|
|
|
|
// Placeholder location with every field set to -1; used by _err() when a token carries no location.
const BASE_LOC = {
    startLine: -1, startCol: -1, startOffset: -1,
    endLine: -1, endCol: -1, endOffset: -1,
};
|
2022-05-17 01:25:05 +00:00
|
|
|
// Tag IDs of TABLE, TBODY, TFOOT, THEAD and TR.
const TABLE_STRUCTURE_TAGS = new Set(['TABLE', 'TBODY', 'TFOOT', 'THEAD', 'TR'].map((key) => html_js_1.TAG_ID[key]));
// Option values used for anything the caller does not specify.
const defaultParserOptions = {
    scriptingEnabled: true, // scripting flag on by default
    sourceCodeLocationInfo: false, // the Parser constructor forces this on when onParseError is set
    treeAdapter: default_js_1.defaultTreeAdapter,
    onParseError: null, // no error callback by default
};
|
|
|
|
//Parser
|
|
|
|
class Parser {
|
2022-05-17 01:25:05 +00:00
|
|
|
constructor(options, document, fragmentContext = null, scriptHandler = null) {
|
2020-12-18 22:06:30 +00:00
|
|
|
this.fragmentContext = fragmentContext;
|
2022-05-17 01:25:05 +00:00
|
|
|
this.scriptHandler = scriptHandler;
|
|
|
|
this.currentToken = null;
|
|
|
|
this.stopped = false;
|
|
|
|
this.insertionMode = InsertionMode.INITIAL;
|
|
|
|
this.originalInsertionMode = InsertionMode.INITIAL;
|
2020-12-18 22:06:30 +00:00
|
|
|
this.headElement = null;
|
|
|
|
this.formElement = null;
|
2022-05-17 01:25:05 +00:00
|
|
|
/** Indicates that the current node is not an element in the HTML namespace */
|
|
|
|
this.currentNotInHTML = false;
|
|
|
|
/**
|
|
|
|
* The template insertion mode stack is maintained from the left.
|
|
|
|
* Ie. the topmost element will always have index 0.
|
|
|
|
*/
|
2020-12-18 22:06:30 +00:00
|
|
|
this.tmplInsertionModeStack = [];
|
|
|
|
this.pendingCharacterTokens = [];
|
|
|
|
this.hasNonWhitespacePendingCharacterToken = false;
|
|
|
|
this.framesetOk = true;
|
|
|
|
this.skipNextNewLine = false;
|
|
|
|
this.fosterParentingEnabled = false;
|
2022-05-17 01:25:05 +00:00
|
|
|
this.options = Object.assign(Object.assign({}, defaultParserOptions), options);
|
|
|
|
this.treeAdapter = this.options.treeAdapter;
|
|
|
|
this.onParseError = this.options.onParseError;
|
|
|
|
// Always enable location info if we report parse errors.
|
|
|
|
if (this.onParseError) {
|
|
|
|
this.options.sourceCodeLocationInfo = true;
|
|
|
|
}
|
|
|
|
this.document = document !== null && document !== void 0 ? document : this.treeAdapter.createDocument();
|
|
|
|
this.tokenizer = new index_js_1.Tokenizer(this.options, this);
|
|
|
|
this.activeFormattingElements = new formatting_element_list_js_1.FormattingElementList(this.treeAdapter);
|
|
|
|
this.fragmentContextID = fragmentContext ? (0, html_js_1.getTagID)(this.treeAdapter.getTagName(fragmentContext)) : html_js_1.TAG_ID.UNKNOWN;
|
|
|
|
this._setContextModes(fragmentContext !== null && fragmentContext !== void 0 ? fragmentContext : this.document, this.fragmentContextID);
|
|
|
|
this.openElements = new open_element_stack_js_1.OpenElementStack(this.document, this.treeAdapter, this);
|
|
|
|
}
|
|
|
|
// API
|
|
|
|
static parse(html, options) {
|
|
|
|
const parser = new this(options);
|
|
|
|
parser.tokenizer.write(html, true);
|
|
|
|
return parser.document;
|
|
|
|
}
|
|
|
|
static getFragmentParser(fragmentContext, options) {
|
|
|
|
const opts = Object.assign(Object.assign({}, defaultParserOptions), options);
|
|
|
|
//NOTE: use a <template> element as the fragment context if no context element was provided,
|
|
|
|
//so we will parse in a "forgiving" manner
|
|
|
|
fragmentContext !== null && fragmentContext !== void 0 ? fragmentContext : (fragmentContext = opts.treeAdapter.createElement(html_js_1.TAG_NAMES.TEMPLATE, html_js_1.NS.HTML, []));
|
|
|
|
//NOTE: create a fake element which will be used as the `document` for fragment parsing.
|
|
|
|
//This is important for jsdom, where a new `document` cannot be created. This led to
|
|
|
|
//fragment parsing messing with the main `document`.
|
|
|
|
const documentMock = opts.treeAdapter.createElement('documentmock', html_js_1.NS.HTML, []);
|
|
|
|
const parser = new this(opts, documentMock, fragmentContext);
|
|
|
|
if (parser.fragmentContextID === html_js_1.TAG_ID.TEMPLATE) {
|
|
|
|
parser.tmplInsertionModeStack.unshift(InsertionMode.IN_TEMPLATE);
|
|
|
|
}
|
|
|
|
parser._initTokenizerForFragmentParsing();
|
|
|
|
parser._insertFakeRootElement();
|
|
|
|
parser._resetInsertionMode();
|
|
|
|
parser._findFormInFragmentContext();
|
|
|
|
return parser;
|
|
|
|
}
|
|
|
|
getFragment() {
|
|
|
|
const rootElement = this.treeAdapter.getFirstChild(this.document);
|
|
|
|
const fragment = this.treeAdapter.createDocumentFragment();
|
|
|
|
this._adoptNodes(rootElement, fragment);
|
|
|
|
return fragment;
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
//Errors
|
2022-05-17 01:25:05 +00:00
|
|
|
_err(token, code, beforeToken) {
|
|
|
|
var _a;
|
|
|
|
if (!this.onParseError)
|
|
|
|
return;
|
|
|
|
const loc = (_a = token.location) !== null && _a !== void 0 ? _a : BASE_LOC;
|
|
|
|
const err = {
|
|
|
|
code,
|
|
|
|
startLine: loc.startLine,
|
|
|
|
startCol: loc.startCol,
|
|
|
|
startOffset: loc.startOffset,
|
|
|
|
endLine: beforeToken ? loc.startLine : loc.endLine,
|
|
|
|
endCol: beforeToken ? loc.startCol : loc.endCol,
|
|
|
|
endOffset: beforeToken ? loc.startOffset : loc.endOffset,
|
|
|
|
};
|
|
|
|
this.onParseError(err);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
//Stack events
|
|
|
|
onItemPush(node, tid, isTop) {
|
|
|
|
var _a, _b;
|
|
|
|
(_b = (_a = this.treeAdapter).onItemPush) === null || _b === void 0 ? void 0 : _b.call(_a, node);
|
|
|
|
if (isTop && this.openElements.stackTop > 0)
|
|
|
|
this._setContextModes(node, tid);
|
|
|
|
}
|
|
|
|
onItemPop(node, isTop) {
|
|
|
|
var _a, _b;
|
|
|
|
if (this.options.sourceCodeLocationInfo) {
|
|
|
|
this._setEndLocation(node, this.currentToken);
|
|
|
|
}
|
|
|
|
(_b = (_a = this.treeAdapter).onItemPop) === null || _b === void 0 ? void 0 : _b.call(_a, node, this.openElements.current);
|
|
|
|
if (isTop) {
|
|
|
|
let current;
|
|
|
|
let currentTagId;
|
|
|
|
if (this.openElements.stackTop === 0 && this.fragmentContext) {
|
|
|
|
current = this.fragmentContext;
|
|
|
|
currentTagId = this.fragmentContextID;
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
else {
|
|
|
|
({ current, currentTagId } = this.openElements);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
this._setContextModes(current, currentTagId);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
_setContextModes(current, tid) {
|
|
|
|
const isHTML = current === this.document || this.treeAdapter.getNamespaceURI(current) === html_js_1.NS.HTML;
|
|
|
|
this.currentNotInHTML = !isHTML;
|
|
|
|
this.tokenizer.inForeignNode = !isHTML && !this._isIntegrationPoint(tid, current);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
_switchToTextParsing(currentToken, nextTokenizerState) {
|
2022-05-17 01:25:05 +00:00
|
|
|
this._insertElement(currentToken, html_js_1.NS.HTML);
|
2020-12-18 22:06:30 +00:00
|
|
|
this.tokenizer.state = nextTokenizerState;
|
|
|
|
this.originalInsertionMode = this.insertionMode;
|
2022-05-17 01:25:05 +00:00
|
|
|
this.insertionMode = InsertionMode.TEXT;
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
switchToPlaintextParsing() {
|
2022-05-17 01:25:05 +00:00
|
|
|
this.insertionMode = InsertionMode.TEXT;
|
|
|
|
this.originalInsertionMode = InsertionMode.IN_BODY;
|
|
|
|
this.tokenizer.state = index_js_1.TokenizerMode.PLAINTEXT;
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
//Fragment parsing
|
|
|
|
_getAdjustedCurrentElement() {
|
|
|
|
return this.openElements.stackTop === 0 && this.fragmentContext
|
|
|
|
? this.fragmentContext
|
|
|
|
: this.openElements.current;
|
|
|
|
}
|
|
|
|
_findFormInFragmentContext() {
|
|
|
|
let node = this.fragmentContext;
|
2022-05-17 01:25:05 +00:00
|
|
|
while (node) {
|
|
|
|
if (this.treeAdapter.getTagName(node) === html_js_1.TAG_NAMES.FORM) {
|
2020-12-18 22:06:30 +00:00
|
|
|
this.formElement = node;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
node = this.treeAdapter.getParentNode(node);
|
2022-05-17 01:25:05 +00:00
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
_initTokenizerForFragmentParsing() {
|
2022-05-17 01:25:05 +00:00
|
|
|
if (!this.fragmentContext || this.treeAdapter.getNamespaceURI(this.fragmentContext) !== html_js_1.NS.HTML) {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
switch (this.fragmentContextID) {
|
|
|
|
case html_js_1.TAG_ID.TITLE:
|
|
|
|
case html_js_1.TAG_ID.TEXTAREA: {
|
|
|
|
this.tokenizer.state = index_js_1.TokenizerMode.RCDATA;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case html_js_1.TAG_ID.STYLE:
|
|
|
|
case html_js_1.TAG_ID.XMP:
|
|
|
|
case html_js_1.TAG_ID.IFRAME:
|
|
|
|
case html_js_1.TAG_ID.NOEMBED:
|
|
|
|
case html_js_1.TAG_ID.NOFRAMES:
|
|
|
|
case html_js_1.TAG_ID.NOSCRIPT: {
|
|
|
|
this.tokenizer.state = index_js_1.TokenizerMode.RAWTEXT;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case html_js_1.TAG_ID.SCRIPT: {
|
|
|
|
this.tokenizer.state = index_js_1.TokenizerMode.SCRIPT_DATA;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case html_js_1.TAG_ID.PLAINTEXT: {
|
|
|
|
this.tokenizer.state = index_js_1.TokenizerMode.PLAINTEXT;
|
|
|
|
break;
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
default:
|
|
|
|
// Do nothing
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
//Tree mutation
|
|
|
|
_setDocumentType(token) {
|
|
|
|
const name = token.name || '';
|
|
|
|
const publicId = token.publicId || '';
|
|
|
|
const systemId = token.systemId || '';
|
|
|
|
this.treeAdapter.setDocumentType(this.document, name, publicId, systemId);
|
2022-05-17 01:25:05 +00:00
|
|
|
if (token.location) {
|
|
|
|
const documentChildren = this.treeAdapter.getChildNodes(this.document);
|
|
|
|
const docTypeNode = documentChildren.find((node) => this.treeAdapter.isDocumentTypeNode(node));
|
|
|
|
if (docTypeNode) {
|
|
|
|
this.treeAdapter.setNodeSourceCodeLocation(docTypeNode, token.location);
|
|
|
|
}
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
_attachElementToTree(element, location) {
|
|
|
|
if (this.options.sourceCodeLocationInfo) {
|
|
|
|
const loc = location && Object.assign(Object.assign({}, location), { startTag: location });
|
|
|
|
this.treeAdapter.setNodeSourceCodeLocation(element, loc);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
if (this._shouldFosterParentOnInsertion()) {
|
|
|
|
this._fosterParentElement(element);
|
2022-05-17 01:25:05 +00:00
|
|
|
}
|
|
|
|
else {
|
|
|
|
const parent = this.openElements.currentTmplContentOrNode;
|
2020-12-18 22:06:30 +00:00
|
|
|
this.treeAdapter.appendChild(parent, element);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
_appendElement(token, namespaceURI) {
|
|
|
|
const element = this.treeAdapter.createElement(token.tagName, namespaceURI, token.attrs);
|
2022-05-17 01:25:05 +00:00
|
|
|
this._attachElementToTree(element, token.location);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
_insertElement(token, namespaceURI) {
|
|
|
|
const element = this.treeAdapter.createElement(token.tagName, namespaceURI, token.attrs);
|
2022-05-17 01:25:05 +00:00
|
|
|
this._attachElementToTree(element, token.location);
|
|
|
|
this.openElements.push(element, token.tagID);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
_insertFakeElement(tagName, tagID) {
|
|
|
|
const element = this.treeAdapter.createElement(tagName, html_js_1.NS.HTML, []);
|
|
|
|
this._attachElementToTree(element, null);
|
|
|
|
this.openElements.push(element, tagID);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
_insertTemplate(token) {
|
2022-05-17 01:25:05 +00:00
|
|
|
const tmpl = this.treeAdapter.createElement(token.tagName, html_js_1.NS.HTML, token.attrs);
|
2020-12-18 22:06:30 +00:00
|
|
|
const content = this.treeAdapter.createDocumentFragment();
|
|
|
|
this.treeAdapter.setTemplateContent(tmpl, content);
|
2022-05-17 01:25:05 +00:00
|
|
|
this._attachElementToTree(tmpl, token.location);
|
|
|
|
this.openElements.push(tmpl, token.tagID);
|
|
|
|
if (this.options.sourceCodeLocationInfo)
|
|
|
|
this.treeAdapter.setNodeSourceCodeLocation(content, null);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
_insertFakeRootElement() {
|
2022-05-17 01:25:05 +00:00
|
|
|
const element = this.treeAdapter.createElement(html_js_1.TAG_NAMES.HTML, html_js_1.NS.HTML, []);
|
|
|
|
if (this.options.sourceCodeLocationInfo)
|
|
|
|
this.treeAdapter.setNodeSourceCodeLocation(element, null);
|
2020-12-18 22:06:30 +00:00
|
|
|
this.treeAdapter.appendChild(this.openElements.current, element);
|
2022-05-17 01:25:05 +00:00
|
|
|
this.openElements.push(element, html_js_1.TAG_ID.HTML);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
_appendCommentNode(token, parent) {
|
|
|
|
const commentNode = this.treeAdapter.createCommentNode(token.data);
|
|
|
|
this.treeAdapter.appendChild(parent, commentNode);
|
2022-05-17 01:25:05 +00:00
|
|
|
if (this.options.sourceCodeLocationInfo) {
|
|
|
|
this.treeAdapter.setNodeSourceCodeLocation(commentNode, token.location);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
_insertCharacters(token) {
|
2022-05-17 01:25:05 +00:00
|
|
|
let parent;
|
|
|
|
let beforeElement;
|
2020-12-18 22:06:30 +00:00
|
|
|
if (this._shouldFosterParentOnInsertion()) {
|
2022-05-17 01:25:05 +00:00
|
|
|
({ parent, beforeElement } = this._findFosterParentingLocation());
|
|
|
|
if (beforeElement) {
|
|
|
|
this.treeAdapter.insertTextBefore(parent, token.chars, beforeElement);
|
|
|
|
}
|
|
|
|
else {
|
|
|
|
this.treeAdapter.insertText(parent, token.chars);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
else {
|
|
|
|
parent = this.openElements.currentTmplContentOrNode;
|
2020-12-18 22:06:30 +00:00
|
|
|
this.treeAdapter.insertText(parent, token.chars);
|
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
if (!token.location)
|
|
|
|
return;
|
|
|
|
const siblings = this.treeAdapter.getChildNodes(parent);
|
|
|
|
const textNodeIdx = beforeElement ? siblings.lastIndexOf(beforeElement) : siblings.length;
|
|
|
|
const textNode = siblings[textNodeIdx - 1];
|
|
|
|
//NOTE: if we have a location assigned by another token, then just update the end position
|
|
|
|
const tnLoc = this.treeAdapter.getNodeSourceCodeLocation(textNode);
|
|
|
|
if (tnLoc) {
|
|
|
|
const { endLine, endCol, endOffset } = token.location;
|
|
|
|
this.treeAdapter.updateNodeSourceCodeLocation(textNode, { endLine, endCol, endOffset });
|
|
|
|
}
|
|
|
|
else if (this.options.sourceCodeLocationInfo) {
|
|
|
|
this.treeAdapter.setNodeSourceCodeLocation(textNode, token.location);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
_adoptNodes(donor, recipient) {
|
|
|
|
for (let child = this.treeAdapter.getFirstChild(donor); child; child = this.treeAdapter.getFirstChild(donor)) {
|
|
|
|
this.treeAdapter.detachNode(child);
|
|
|
|
this.treeAdapter.appendChild(recipient, child);
|
|
|
|
}
|
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
_setEndLocation(element, closingToken) {
|
|
|
|
if (this.treeAdapter.getNodeSourceCodeLocation(element) && closingToken.location) {
|
|
|
|
const ctLoc = closingToken.location;
|
|
|
|
const tn = this.treeAdapter.getTagName(element);
|
|
|
|
const endLoc =
|
|
|
|
// NOTE: For cases like <p> <p> </p> - First 'p' closes without a closing
|
|
|
|
// tag and for cases like <td> <p> </td> - 'p' closes without a closing tag.
|
|
|
|
closingToken.type === token_js_1.TokenType.END_TAG && tn === closingToken.tagName
|
|
|
|
? {
|
|
|
|
endTag: Object.assign({}, ctLoc),
|
|
|
|
endLine: ctLoc.endLine,
|
|
|
|
endCol: ctLoc.endCol,
|
|
|
|
endOffset: ctLoc.endOffset,
|
|
|
|
}
|
|
|
|
: {
|
|
|
|
endLine: ctLoc.startLine,
|
|
|
|
endCol: ctLoc.startCol,
|
|
|
|
endOffset: ctLoc.startOffset,
|
|
|
|
};
|
|
|
|
this.treeAdapter.updateNodeSourceCodeLocation(element, endLoc);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
}
|
|
|
|
//Token processing
|
|
|
|
shouldProcessStartTagTokenInForeignContent(token) {
|
|
|
|
// Check that neither current === document, or ns === NS.HTML
|
|
|
|
if (!this.currentNotInHTML)
|
2020-12-18 22:06:30 +00:00
|
|
|
return false;
|
2022-05-17 01:25:05 +00:00
|
|
|
let current;
|
|
|
|
let currentTagId;
|
|
|
|
if (this.openElements.stackTop === 0 && this.fragmentContext) {
|
|
|
|
current = this.fragmentContext;
|
|
|
|
currentTagId = this.fragmentContextID;
|
|
|
|
}
|
|
|
|
else {
|
|
|
|
({ current, currentTagId } = this.openElements);
|
|
|
|
}
|
|
|
|
if (token.tagID === html_js_1.TAG_ID.SVG &&
|
|
|
|
this.treeAdapter.getTagName(current) === html_js_1.TAG_NAMES.ANNOTATION_XML &&
|
|
|
|
this.treeAdapter.getNamespaceURI(current) === html_js_1.NS.MATHML) {
|
2020-12-18 22:06:30 +00:00
|
|
|
return false;
|
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
return (
|
|
|
|
// Check that `current` is not an integration point for HTML or MathML elements.
|
|
|
|
this.tokenizer.inForeignNode ||
|
|
|
|
// If it _is_ an integration point, then we might have to check that it is not an HTML
|
|
|
|
// integration point.
|
|
|
|
((token.tagID === html_js_1.TAG_ID.MGLYPH || token.tagID === html_js_1.TAG_ID.MALIGNMARK) &&
|
|
|
|
!this._isIntegrationPoint(currentTagId, current, html_js_1.NS.HTML)));
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
_processToken(token) {
|
2022-05-17 01:25:05 +00:00
|
|
|
switch (token.type) {
|
|
|
|
case token_js_1.TokenType.CHARACTER: {
|
|
|
|
this.onCharacter(token);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case token_js_1.TokenType.NULL_CHARACTER: {
|
|
|
|
this.onNullCharacter(token);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case token_js_1.TokenType.COMMENT: {
|
|
|
|
this.onComment(token);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case token_js_1.TokenType.DOCTYPE: {
|
|
|
|
this.onDoctype(token);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case token_js_1.TokenType.START_TAG: {
|
|
|
|
this._processStartTag(token);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case token_js_1.TokenType.END_TAG: {
|
|
|
|
this.onEndTag(token);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case token_js_1.TokenType.EOF: {
|
|
|
|
this.onEof(token);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case token_js_1.TokenType.WHITESPACE_CHARACTER: {
|
|
|
|
this.onWhitespaceCharacter(token);
|
|
|
|
break;
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
//Integration points
|
2022-05-17 01:25:05 +00:00
|
|
|
_isIntegrationPoint(tid, element, foreignNS) {
|
2020-12-18 22:06:30 +00:00
|
|
|
const ns = this.treeAdapter.getNamespaceURI(element);
|
|
|
|
const attrs = this.treeAdapter.getAttrList(element);
|
2022-05-17 01:25:05 +00:00
|
|
|
return foreignContent.isIntegrationPoint(tid, ns, attrs, foreignNS);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
//Active formatting elements reconstruction
|
|
|
|
_reconstructActiveFormattingElements() {
|
2022-05-17 01:25:05 +00:00
|
|
|
const listLength = this.activeFormattingElements.entries.length;
|
2020-12-18 22:06:30 +00:00
|
|
|
if (listLength) {
|
2022-05-17 01:25:05 +00:00
|
|
|
const endIndex = this.activeFormattingElements.entries.findIndex((entry) => entry.type === formatting_element_list_js_1.EntryType.Marker || this.openElements.contains(entry.element));
|
|
|
|
const unopenIdx = endIndex < 0 ? listLength - 1 : endIndex - 1;
|
|
|
|
for (let i = unopenIdx; i >= 0; i--) {
|
|
|
|
const entry = this.activeFormattingElements.entries[i];
|
2020-12-18 22:06:30 +00:00
|
|
|
this._insertElement(entry.token, this.treeAdapter.getNamespaceURI(entry.element));
|
|
|
|
entry.element = this.openElements.current;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
//Close elements
|
|
|
|
_closeTableCell() {
|
|
|
|
this.openElements.generateImpliedEndTags();
|
|
|
|
this.openElements.popUntilTableCellPopped();
|
|
|
|
this.activeFormattingElements.clearToLastMarker();
|
2022-05-17 01:25:05 +00:00
|
|
|
this.insertionMode = InsertionMode.IN_ROW;
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
_closePElement() {
|
2022-05-17 01:25:05 +00:00
|
|
|
this.openElements.generateImpliedEndTagsWithExclusion(html_js_1.TAG_ID.P);
|
|
|
|
this.openElements.popUntilTagNamePopped(html_js_1.TAG_ID.P);
|
|
|
|
}
|
|
|
|
//Insertion modes
|
|
|
|
_resetInsertionMode() {
|
|
|
|
for (let i = this.openElements.stackTop; i >= 0; i--) {
|
|
|
|
//Insertion mode reset map
|
|
|
|
switch (i === 0 && this.fragmentContext ? this.fragmentContextID : this.openElements.tagIDs[i]) {
|
|
|
|
case html_js_1.TAG_ID.TR:
|
|
|
|
this.insertionMode = InsertionMode.IN_ROW;
|
|
|
|
return;
|
|
|
|
case html_js_1.TAG_ID.TBODY:
|
|
|
|
case html_js_1.TAG_ID.THEAD:
|
|
|
|
case html_js_1.TAG_ID.TFOOT:
|
|
|
|
this.insertionMode = InsertionMode.IN_TABLE_BODY;
|
|
|
|
return;
|
|
|
|
case html_js_1.TAG_ID.CAPTION:
|
|
|
|
this.insertionMode = InsertionMode.IN_CAPTION;
|
|
|
|
return;
|
|
|
|
case html_js_1.TAG_ID.COLGROUP:
|
|
|
|
this.insertionMode = InsertionMode.IN_COLUMN_GROUP;
|
|
|
|
return;
|
|
|
|
case html_js_1.TAG_ID.TABLE:
|
|
|
|
this.insertionMode = InsertionMode.IN_TABLE;
|
|
|
|
return;
|
|
|
|
case html_js_1.TAG_ID.BODY:
|
|
|
|
this.insertionMode = InsertionMode.IN_BODY;
|
|
|
|
return;
|
|
|
|
case html_js_1.TAG_ID.FRAMESET:
|
|
|
|
this.insertionMode = InsertionMode.IN_FRAMESET;
|
|
|
|
return;
|
|
|
|
case html_js_1.TAG_ID.SELECT:
|
|
|
|
this._resetInsertionModeForSelect(i);
|
|
|
|
return;
|
|
|
|
case html_js_1.TAG_ID.TEMPLATE:
|
|
|
|
this.insertionMode = this.tmplInsertionModeStack[0];
|
|
|
|
return;
|
|
|
|
case html_js_1.TAG_ID.HTML:
|
|
|
|
this.insertionMode = this.headElement ? InsertionMode.AFTER_HEAD : InsertionMode.BEFORE_HEAD;
|
|
|
|
return;
|
|
|
|
case html_js_1.TAG_ID.TD:
|
|
|
|
case html_js_1.TAG_ID.TH:
|
|
|
|
if (i > 0) {
|
|
|
|
this.insertionMode = InsertionMode.IN_CELL;
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
case html_js_1.TAG_ID.HEAD:
|
|
|
|
if (i > 0) {
|
|
|
|
this.insertionMode = InsertionMode.IN_HEAD;
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
break;
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
this.insertionMode = InsertionMode.IN_BODY;
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
_resetInsertionModeForSelect(selectIdx) {
|
|
|
|
if (selectIdx > 0) {
|
|
|
|
for (let i = selectIdx - 1; i > 0; i--) {
|
2022-05-17 01:25:05 +00:00
|
|
|
const tn = this.openElements.tagIDs[i];
|
|
|
|
if (tn === html_js_1.TAG_ID.TEMPLATE) {
|
2020-12-18 22:06:30 +00:00
|
|
|
break;
|
2022-05-17 01:25:05 +00:00
|
|
|
}
|
|
|
|
else if (tn === html_js_1.TAG_ID.TABLE) {
|
|
|
|
this.insertionMode = InsertionMode.IN_SELECT_IN_TABLE;
|
2020-12-18 22:06:30 +00:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
this.insertionMode = InsertionMode.IN_SELECT;
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
//Foster parenting
|
2022-05-17 01:25:05 +00:00
|
|
|
_isElementCausesFosterParenting(tn) {
|
|
|
|
return TABLE_STRUCTURE_TAGS.has(tn);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
_shouldFosterParentOnInsertion() {
|
2022-05-17 01:25:05 +00:00
|
|
|
return this.fosterParentingEnabled && this._isElementCausesFosterParenting(this.openElements.currentTagId);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
_findFosterParentingLocation() {
|
|
|
|
for (let i = this.openElements.stackTop; i >= 0; i--) {
|
|
|
|
const openElement = this.openElements.items[i];
|
2022-05-17 01:25:05 +00:00
|
|
|
switch (this.openElements.tagIDs[i]) {
|
|
|
|
case html_js_1.TAG_ID.TEMPLATE:
|
|
|
|
if (this.treeAdapter.getNamespaceURI(openElement) === html_js_1.NS.HTML) {
|
|
|
|
return { parent: this.treeAdapter.getTemplateContent(openElement), beforeElement: null };
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
case html_js_1.TAG_ID.TABLE: {
|
|
|
|
const parent = this.treeAdapter.getParentNode(openElement);
|
|
|
|
if (parent) {
|
|
|
|
return { parent, beforeElement: openElement };
|
|
|
|
}
|
|
|
|
return { parent: this.openElements.items[i - 1], beforeElement: null };
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
default:
|
|
|
|
// Do nothing
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
return { parent: this.openElements.items[0], beforeElement: null };
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
_fosterParentElement(element) {
|
|
|
|
const location = this._findFosterParentingLocation();
|
|
|
|
if (location.beforeElement) {
|
|
|
|
this.treeAdapter.insertBefore(location.parent, element, location.beforeElement);
|
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
else {
|
|
|
|
this.treeAdapter.appendChild(location.parent, element);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
//Special elements
|
2022-05-17 01:25:05 +00:00
|
|
|
_isSpecialElement(element, id) {
|
2020-12-18 22:06:30 +00:00
|
|
|
const ns = this.treeAdapter.getNamespaceURI(element);
|
2022-05-17 01:25:05 +00:00
|
|
|
return html_js_1.SPECIAL_ELEMENTS[ns].has(id);
|
|
|
|
}
|
|
|
|
onCharacter(token) {
|
|
|
|
this.skipNextNewLine = false;
|
|
|
|
if (this.tokenizer.inForeignNode) {
|
|
|
|
characterInForeignContent(this, token);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
switch (this.insertionMode) {
|
|
|
|
case InsertionMode.INITIAL:
|
|
|
|
tokenInInitialMode(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.BEFORE_HTML:
|
|
|
|
tokenBeforeHtml(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.BEFORE_HEAD:
|
|
|
|
tokenBeforeHead(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_HEAD:
|
|
|
|
tokenInHead(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_HEAD_NO_SCRIPT:
|
|
|
|
tokenInHeadNoScript(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.AFTER_HEAD:
|
|
|
|
tokenAfterHead(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_BODY:
|
|
|
|
case InsertionMode.IN_CAPTION:
|
|
|
|
case InsertionMode.IN_CELL:
|
|
|
|
case InsertionMode.IN_TEMPLATE:
|
|
|
|
characterInBody(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.TEXT:
|
|
|
|
case InsertionMode.IN_SELECT:
|
|
|
|
case InsertionMode.IN_SELECT_IN_TABLE:
|
|
|
|
this._insertCharacters(token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_TABLE:
|
|
|
|
case InsertionMode.IN_TABLE_BODY:
|
|
|
|
case InsertionMode.IN_ROW:
|
|
|
|
characterInTable(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_TABLE_TEXT:
|
|
|
|
characterInTableText(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_COLUMN_GROUP:
|
|
|
|
tokenInColumnGroup(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.AFTER_BODY:
|
|
|
|
tokenAfterBody(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.AFTER_AFTER_BODY:
|
|
|
|
tokenAfterAfterBody(this, token);
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
// Do nothing
|
|
|
|
}
|
|
|
|
}
|
|
|
|
onNullCharacter(token) {
|
|
|
|
this.skipNextNewLine = false;
|
|
|
|
if (this.tokenizer.inForeignNode) {
|
|
|
|
nullCharacterInForeignContent(this, token);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
switch (this.insertionMode) {
|
|
|
|
case InsertionMode.INITIAL:
|
|
|
|
tokenInInitialMode(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.BEFORE_HTML:
|
|
|
|
tokenBeforeHtml(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.BEFORE_HEAD:
|
|
|
|
tokenBeforeHead(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_HEAD:
|
|
|
|
tokenInHead(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_HEAD_NO_SCRIPT:
|
|
|
|
tokenInHeadNoScript(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.AFTER_HEAD:
|
|
|
|
tokenAfterHead(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.TEXT:
|
|
|
|
this._insertCharacters(token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_TABLE:
|
|
|
|
case InsertionMode.IN_TABLE_BODY:
|
|
|
|
case InsertionMode.IN_ROW:
|
|
|
|
characterInTable(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_COLUMN_GROUP:
|
|
|
|
tokenInColumnGroup(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.AFTER_BODY:
|
|
|
|
tokenAfterBody(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.AFTER_AFTER_BODY:
|
|
|
|
tokenAfterAfterBody(this, token);
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
// Do nothing
|
|
|
|
}
|
|
|
|
}
|
|
|
|
onComment(token) {
|
|
|
|
this.skipNextNewLine = false;
|
|
|
|
if (this.currentNotInHTML) {
|
|
|
|
appendComment(this, token);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
switch (this.insertionMode) {
|
|
|
|
case InsertionMode.INITIAL:
|
|
|
|
case InsertionMode.BEFORE_HTML:
|
|
|
|
case InsertionMode.BEFORE_HEAD:
|
|
|
|
case InsertionMode.IN_HEAD:
|
|
|
|
case InsertionMode.IN_HEAD_NO_SCRIPT:
|
|
|
|
case InsertionMode.AFTER_HEAD:
|
|
|
|
case InsertionMode.IN_BODY:
|
|
|
|
case InsertionMode.IN_TABLE:
|
|
|
|
case InsertionMode.IN_CAPTION:
|
|
|
|
case InsertionMode.IN_COLUMN_GROUP:
|
|
|
|
case InsertionMode.IN_TABLE_BODY:
|
|
|
|
case InsertionMode.IN_ROW:
|
|
|
|
case InsertionMode.IN_CELL:
|
|
|
|
case InsertionMode.IN_SELECT:
|
|
|
|
case InsertionMode.IN_SELECT_IN_TABLE:
|
|
|
|
case InsertionMode.IN_TEMPLATE:
|
|
|
|
case InsertionMode.IN_FRAMESET:
|
|
|
|
case InsertionMode.AFTER_FRAMESET:
|
|
|
|
appendComment(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_TABLE_TEXT:
|
|
|
|
tokenInTableText(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.AFTER_BODY:
|
|
|
|
appendCommentToRootHtmlElement(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.AFTER_AFTER_BODY:
|
|
|
|
case InsertionMode.AFTER_AFTER_FRAMESET:
|
|
|
|
appendCommentToDocument(this, token);
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
// Do nothing
|
|
|
|
}
|
|
|
|
}
|
|
|
|
onDoctype(token) {
|
|
|
|
this.skipNextNewLine = false;
|
|
|
|
switch (this.insertionMode) {
|
|
|
|
case InsertionMode.INITIAL:
|
|
|
|
doctypeInInitialMode(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.BEFORE_HEAD:
|
|
|
|
case InsertionMode.IN_HEAD:
|
|
|
|
case InsertionMode.IN_HEAD_NO_SCRIPT:
|
|
|
|
case InsertionMode.AFTER_HEAD:
|
|
|
|
this._err(token, error_codes_js_1.ERR.misplacedDoctype);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_TABLE_TEXT:
|
|
|
|
tokenInTableText(this, token);
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
// Do nothing
|
|
|
|
}
|
|
|
|
}
|
|
|
|
onStartTag(token) {
|
|
|
|
this.skipNextNewLine = false;
|
|
|
|
this.currentToken = token;
|
|
|
|
this._processStartTag(token);
|
|
|
|
if (token.selfClosing && !token.ackSelfClosing) {
|
|
|
|
this._err(token, error_codes_js_1.ERR.nonVoidHtmlElementStartTagWithTrailingSolidus);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
/**
|
|
|
|
* Processes a given start tag.
|
|
|
|
*
|
|
|
|
* `onStartTag` checks if a self-closing tag was recognized. When a token
|
|
|
|
* is moved inbetween multiple insertion modes, this check for self-closing
|
|
|
|
* could lead to false positives. To avoid this, `_processStartTag` is used
|
|
|
|
* for nested calls.
|
|
|
|
*
|
|
|
|
* @param token The token to process.
|
|
|
|
*/
|
|
|
|
_processStartTag(token) {
|
|
|
|
if (this.shouldProcessStartTagTokenInForeignContent(token)) {
|
|
|
|
startTagInForeignContent(this, token);
|
|
|
|
}
|
|
|
|
else {
|
|
|
|
this._startTagOutsideForeignContent(token);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
_startTagOutsideForeignContent(token) {
|
|
|
|
switch (this.insertionMode) {
|
|
|
|
case InsertionMode.INITIAL:
|
|
|
|
tokenInInitialMode(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.BEFORE_HTML:
|
|
|
|
startTagBeforeHtml(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.BEFORE_HEAD:
|
|
|
|
startTagBeforeHead(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_HEAD:
|
|
|
|
startTagInHead(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_HEAD_NO_SCRIPT:
|
|
|
|
startTagInHeadNoScript(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.AFTER_HEAD:
|
|
|
|
startTagAfterHead(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_BODY:
|
|
|
|
startTagInBody(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_TABLE:
|
|
|
|
startTagInTable(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_TABLE_TEXT:
|
|
|
|
tokenInTableText(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_CAPTION:
|
|
|
|
startTagInCaption(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_COLUMN_GROUP:
|
|
|
|
startTagInColumnGroup(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_TABLE_BODY:
|
|
|
|
startTagInTableBody(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_ROW:
|
|
|
|
startTagInRow(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_CELL:
|
|
|
|
startTagInCell(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_SELECT:
|
|
|
|
startTagInSelect(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_SELECT_IN_TABLE:
|
|
|
|
startTagInSelectInTable(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_TEMPLATE:
|
|
|
|
startTagInTemplate(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.AFTER_BODY:
|
|
|
|
startTagAfterBody(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_FRAMESET:
|
|
|
|
startTagInFrameset(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.AFTER_FRAMESET:
|
|
|
|
startTagAfterFrameset(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.AFTER_AFTER_BODY:
|
|
|
|
startTagAfterAfterBody(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.AFTER_AFTER_FRAMESET:
|
|
|
|
startTagAfterAfterFrameset(this, token);
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
// Do nothing
|
|
|
|
}
|
|
|
|
}
|
|
|
|
onEndTag(token) {
|
|
|
|
this.skipNextNewLine = false;
|
|
|
|
this.currentToken = token;
|
|
|
|
if (this.currentNotInHTML) {
|
|
|
|
endTagInForeignContent(this, token);
|
|
|
|
}
|
|
|
|
else {
|
|
|
|
this._endTagOutsideForeignContent(token);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
_endTagOutsideForeignContent(token) {
|
|
|
|
switch (this.insertionMode) {
|
|
|
|
case InsertionMode.INITIAL:
|
|
|
|
tokenInInitialMode(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.BEFORE_HTML:
|
|
|
|
endTagBeforeHtml(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.BEFORE_HEAD:
|
|
|
|
endTagBeforeHead(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_HEAD:
|
|
|
|
endTagInHead(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_HEAD_NO_SCRIPT:
|
|
|
|
endTagInHeadNoScript(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.AFTER_HEAD:
|
|
|
|
endTagAfterHead(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_BODY:
|
|
|
|
endTagInBody(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.TEXT:
|
|
|
|
endTagInText(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_TABLE:
|
|
|
|
endTagInTable(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_TABLE_TEXT:
|
|
|
|
tokenInTableText(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_CAPTION:
|
|
|
|
endTagInCaption(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_COLUMN_GROUP:
|
|
|
|
endTagInColumnGroup(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_TABLE_BODY:
|
|
|
|
endTagInTableBody(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_ROW:
|
|
|
|
endTagInRow(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_CELL:
|
|
|
|
endTagInCell(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_SELECT:
|
|
|
|
endTagInSelect(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_SELECT_IN_TABLE:
|
|
|
|
endTagInSelectInTable(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_TEMPLATE:
|
|
|
|
endTagInTemplate(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.AFTER_BODY:
|
|
|
|
endTagAfterBody(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_FRAMESET:
|
|
|
|
endTagInFrameset(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.AFTER_FRAMESET:
|
|
|
|
endTagAfterFrameset(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.AFTER_AFTER_BODY:
|
|
|
|
tokenAfterAfterBody(this, token);
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
// Do nothing
|
|
|
|
}
|
|
|
|
}
|
|
|
|
onEof(token) {
|
|
|
|
switch (this.insertionMode) {
|
|
|
|
case InsertionMode.INITIAL:
|
|
|
|
tokenInInitialMode(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.BEFORE_HTML:
|
|
|
|
tokenBeforeHtml(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.BEFORE_HEAD:
|
|
|
|
tokenBeforeHead(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_HEAD:
|
|
|
|
tokenInHead(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_HEAD_NO_SCRIPT:
|
|
|
|
tokenInHeadNoScript(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.AFTER_HEAD:
|
|
|
|
tokenAfterHead(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_BODY:
|
|
|
|
case InsertionMode.IN_TABLE:
|
|
|
|
case InsertionMode.IN_CAPTION:
|
|
|
|
case InsertionMode.IN_COLUMN_GROUP:
|
|
|
|
case InsertionMode.IN_TABLE_BODY:
|
|
|
|
case InsertionMode.IN_ROW:
|
|
|
|
case InsertionMode.IN_CELL:
|
|
|
|
case InsertionMode.IN_SELECT:
|
|
|
|
case InsertionMode.IN_SELECT_IN_TABLE:
|
|
|
|
eofInBody(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.TEXT:
|
|
|
|
eofInText(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_TABLE_TEXT:
|
|
|
|
tokenInTableText(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_TEMPLATE:
|
|
|
|
eofInTemplate(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.AFTER_BODY:
|
|
|
|
case InsertionMode.IN_FRAMESET:
|
|
|
|
case InsertionMode.AFTER_FRAMESET:
|
|
|
|
case InsertionMode.AFTER_AFTER_BODY:
|
|
|
|
case InsertionMode.AFTER_AFTER_FRAMESET:
|
|
|
|
stopParsing(this, token);
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
// Do nothing
|
|
|
|
}
|
|
|
|
}
|
|
|
|
onWhitespaceCharacter(token) {
|
|
|
|
if (this.skipNextNewLine) {
|
|
|
|
this.skipNextNewLine = false;
|
|
|
|
if (token.chars.charCodeAt(0) === unicode.CODE_POINTS.LINE_FEED) {
|
|
|
|
if (token.chars.length === 1) {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
token.chars = token.chars.substr(1);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if (this.tokenizer.inForeignNode) {
|
|
|
|
this._insertCharacters(token);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
switch (this.insertionMode) {
|
|
|
|
case InsertionMode.IN_HEAD:
|
|
|
|
case InsertionMode.IN_HEAD_NO_SCRIPT:
|
|
|
|
case InsertionMode.AFTER_HEAD:
|
|
|
|
case InsertionMode.TEXT:
|
|
|
|
case InsertionMode.IN_COLUMN_GROUP:
|
|
|
|
case InsertionMode.IN_SELECT:
|
|
|
|
case InsertionMode.IN_SELECT_IN_TABLE:
|
|
|
|
case InsertionMode.IN_FRAMESET:
|
|
|
|
case InsertionMode.AFTER_FRAMESET:
|
|
|
|
this._insertCharacters(token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_BODY:
|
|
|
|
case InsertionMode.IN_CAPTION:
|
|
|
|
case InsertionMode.IN_CELL:
|
|
|
|
case InsertionMode.IN_TEMPLATE:
|
|
|
|
case InsertionMode.AFTER_BODY:
|
|
|
|
case InsertionMode.AFTER_AFTER_BODY:
|
|
|
|
case InsertionMode.AFTER_AFTER_FRAMESET:
|
|
|
|
whitespaceCharacterInBody(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_TABLE:
|
|
|
|
case InsertionMode.IN_TABLE_BODY:
|
|
|
|
case InsertionMode.IN_ROW:
|
|
|
|
characterInTable(this, token);
|
|
|
|
break;
|
|
|
|
case InsertionMode.IN_TABLE_TEXT:
|
|
|
|
whitespaceCharacterInTableText(this, token);
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
// Do nothing
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
exports.Parser = Parser;
|
2020-12-18 22:06:30 +00:00
|
|
|
//Adoption agency algorithm
|
|
|
|
//(see: http://www.whatwg.org/specs/web-apps/current-work/multipage/tree-construction.html#adoptionAgency)
|
|
|
|
//------------------------------------------------------------------
|
|
|
|
//Steps 5-8 of the algorithm
|
|
|
|
/**
 * Looks up the active-formatting entry an end tag token refers to.
 *
 * - No entry for the tag name: the token is handled by
 *   `genericEndTagInBody` and `null` is returned.
 * - Entry whose element is no longer on the open-element stack: the entry is
 *   removed from the active formatting list and `null` is returned.
 * - Entry whose tag is not in scope: `null` is returned, the list is left
 *   unchanged.
 * - Otherwise the entry is returned.
 *
 * @param p The parser.
 * @param token The end tag token.
 * @returns The formatting element entry to operate on, or `null`.
 */
function aaObtainFormattingElementEntry(p, token) {
    let formattingElementEntry = p.activeFormattingElements.getElementEntryInScopeWithTagName(token.tagName);
    if (formattingElementEntry) {
        if (!p.openElements.contains(formattingElementEntry.element)) {
            p.activeFormattingElements.removeEntry(formattingElementEntry);
            formattingElementEntry = null;
        }
        else if (!p.openElements.hasInScope(token.tagID)) {
            formattingElementEntry = null;
        }
    }
    else {
        genericEndTagInBody(p, token);
    }
    return formattingElementEntry;
}
|
|
|
|
//Steps 9 and 10 of the algorithm
|
|
|
|
// Walks the open element stack from the top down to the formatting element and returns
// the last "special" element seen on the way (i.e. the one closest to the formatting element).
// When none is found, the stack is shortened to the index where the walk stopped (0 if the
// formatting element was never met), the entry is dropped from the active formatting
// elements list, and null is returned.
function aaObtainFurthestBlock(p, formattingElementEntry) {
    let furthestBlock = null;
    let idx = p.openElements.stackTop;
    while (idx >= 0) {
        const candidate = p.openElements.items[idx];
        if (candidate === formattingElementEntry.element) {
            break;
        }
        if (p._isSpecialElement(candidate, p.openElements.tagIDs[idx])) {
            furthestBlock = candidate;
        }
        idx--;
    }
    if (furthestBlock) {
        return furthestBlock;
    }
    p.openElements.shortenToLength(idx < 0 ? 0 : idx);
    p.activeFormattingElements.removeEntry(formattingElementEntry);
    return furthestBlock;
}
|
|
|
|
//Step 13 of the algorithm
|
|
|
|
// Climbs from the furthest block towards the formatting element via getCommonAncestor.
// Nodes without an active formatting entry (or visited after AA_INNER_LOOP_ITER iterations)
// are removed from the open element stack; the others are recreated and the previously
// handled node is re-parented under the fresh copy. Returns the last node handled this way
// (the furthest block itself when nothing was recreated).
function aaInnerLoop(p, furthestBlock, formattingElement) {
    let lastElement = furthestBlock;
    let upcoming = p.openElements.getCommonAncestor(furthestBlock);
    let node = upcoming;
    let iteration = 0;
    while (node !== formattingElement) {
        //NOTE: look up the following node before touching the stack, since the current
        //node may be removed from it below.
        upcoming = p.openElements.getCommonAncestor(node);
        const entry = p.activeFormattingElements.getElementEntry(node);
        const counterOverflow = entry && iteration >= AA_INNER_LOOP_ITER;
        if (!entry || counterOverflow) {
            if (counterOverflow) {
                p.activeFormattingElements.removeEntry(entry);
            }
            p.openElements.remove(node);
        }
        else {
            node = aaRecreateElementFromEntry(p, entry);
            if (lastElement === furthestBlock) {
                p.activeFormattingElements.bookmark = entry;
            }
            p.treeAdapter.detachNode(lastElement);
            p.treeAdapter.appendChild(node, lastElement);
            lastElement = node;
        }
        iteration++;
        node = upcoming;
    }
    return lastElement;
}
|
|
|
|
//Step 13.7 of the algorithm
|
|
|
|
// Builds a new element from the entry's token (same tag name and attributes, in the namespace
// of the entry's current element), swaps it in for the old element on the open element stack,
// points the entry at it and returns it.
function aaRecreateElementFromEntry(p, elementEntry) {
    const staleElement = elementEntry.element;
    const namespace = p.treeAdapter.getNamespaceURI(staleElement);
    const { tagName, attrs } = elementEntry.token;
    const freshElement = p.treeAdapter.createElement(tagName, namespace, attrs);
    p.openElements.replace(staleElement, freshElement);
    elementEntry.element = freshElement;
    return freshElement;
}
|
|
|
|
//Step 14 of the algorithm
|
|
|
|
// Places `lastElement` relative to `commonAncestor`: foster-parents it when the ancestor's tag
// causes foster parenting, otherwise appends it to the ancestor (or to the template content
// when the ancestor is an HTML-namespace <template>).
function aaInsertLastNodeInCommonAncestor(p, commonAncestor, lastElement) {
    const ancestorTagName = p.treeAdapter.getTagName(commonAncestor);
    const ancestorTagId = (0, html_js_1.getTagID)(ancestorTagName);
    if (p._isElementCausesFosterParenting(ancestorTagId)) {
        p._fosterParentElement(lastElement);
        return;
    }
    const ancestorNs = p.treeAdapter.getNamespaceURI(commonAncestor);
    const isHtmlTemplate = ancestorTagId === html_js_1.TAG_ID.TEMPLATE && ancestorNs === html_js_1.NS.HTML;
    const parent = isHtmlTemplate ? p.treeAdapter.getTemplateContent(commonAncestor) : commonAncestor;
    p.treeAdapter.appendChild(parent, lastElement);
}
|
|
|
|
//Steps 15-19 of the algorithm
|
|
|
|
// Creates a replacement for the formatting element, moves the furthest block's children into
// it, appends it to the furthest block, and then swaps old for new in both the active
// formatting elements list (at the bookmark) and the open element stack (right after the
// furthest block).
function aaReplaceFormattingElement(p, furthestBlock, formattingElementEntry) {
    const namespace = p.treeAdapter.getNamespaceURI(formattingElementEntry.element);
    const entryToken = formattingElementEntry.token;
    const replacement = p.treeAdapter.createElement(entryToken.tagName, namespace, entryToken.attrs);
    // Re-home the furthest block's children under the replacement, then attach it.
    p._adoptNodes(furthestBlock, replacement);
    p.treeAdapter.appendChild(furthestBlock, replacement);
    // Active formatting elements: new entry in, old entry out.
    p.activeFormattingElements.insertElementAfterBookmark(replacement, entryToken);
    p.activeFormattingElements.removeEntry(formattingElementEntry);
    // Open element stack: old element out, replacement in after the furthest block.
    p.openElements.remove(formattingElementEntry.element);
    p.openElements.insertAfter(furthestBlock, replacement, entryToken.tagID);
}
|
|
|
|
//Algorithm entry point
|
|
|
|
// Runs the adoption agency steps at most AA_OUTER_LOOP_ITER times, stopping early as soon as
// there is no formatting element entry or no furthest block to work with.
function callAdoptionAgency(p, token) {
    for (let pass = 0; pass < AA_OUTER_LOOP_ITER; pass++) {
        const entry = aaObtainFormattingElementEntry(p, token);
        if (!entry) {
            return;
        }
        const furthestBlock = aaObtainFurthestBlock(p, entry);
        if (!furthestBlock) {
            return;
        }
        p.activeFormattingElements.bookmark = entry;
        const lastElement = aaInnerLoop(p, furthestBlock, entry.element);
        const commonAncestor = p.openElements.getCommonAncestor(entry.element);
        p.treeAdapter.detachNode(lastElement);
        if (commonAncestor) {
            aaInsertLastNodeInCommonAncestor(p, commonAncestor, lastElement);
        }
        aaReplaceFormattingElement(p, furthestBlock, entry);
    }
}
|
|
|
|
//Generic token handlers
|
|
|
|
//------------------------------------------------------------------
|
|
|
|
// Appends the comment to the open element stack's current node (or its template content).
function appendComment(p, token) {
    const parent = p.openElements.currentTmplContentOrNode;
    p._appendCommentNode(token, parent);
}
|
|
|
|
// Appends the comment to the bottom-most entry (index 0) of the open element stack.
function appendCommentToRootHtmlElement(p, token) {
    const [rootElement] = [p.openElements.items[0]];
    p._appendCommentNode(token, rootElement);
}
|
|
|
|
// Appends the comment directly to the parser's document node.
function appendCommentToDocument(p, token) {
    const { document: documentNode } = p;
    p._appendCommentNode(token, documentNode);
}
|
2022-05-17 01:25:05 +00:00
|
|
|
// Marks the parser as stopped and, when the token carries location info, records end
// locations for the elements still on the open element stack.
function stopParsing(p, token) {
    p.stopped = true;
    if (!token.location) {
        return;
    }
    // NOTE: Outside of fragment parsing the two bottom stack entries (`html` and `body`)
    // are skipped here so an end position they already have is not overwritten.
    const lowestIndex = p.fragmentContext ? 0 : 2;
    for (let i = p.openElements.stackTop; i >= lowestIndex; i--) {
        p._setEndLocation(p.openElements.items[i], token);
    }
    // `html` and `body` only get an end location if they have none yet.
    if (p.fragmentContext || !(p.openElements.stackTop >= 0)) {
        return;
    }
    const htmlElement = p.openElements.items[0];
    const htmlLocation = p.treeAdapter.getNodeSourceCodeLocation(htmlElement);
    if (!htmlLocation || htmlLocation.endTag) {
        return;
    }
    p._setEndLocation(htmlElement, token);
    if (!(p.openElements.stackTop >= 1)) {
        return;
    }
    const bodyElement = p.openElements.items[1];
    const bodyLocation = p.treeAdapter.getNodeSourceCodeLocation(bodyElement);
    if (bodyLocation && !bodyLocation.endTag) {
        p._setEndLocation(bodyElement, token);
    }
}
|
|
|
|
// The "initial" insertion mode
|
|
|
|
//------------------------------------------------------------------
|
|
|
|
// Records the DOCTYPE on the document, reports a non-conforming DOCTYPE, sets the document
// mode (quirks when the token forces it, otherwise whatever `doctype.getDocumentMode` says)
// and moves on to the "before html" insertion mode.
function doctypeInInitialMode(p, token) {
    p._setDocumentType(token);
    let mode;
    if (token.forceQuirks) {
        mode = html_js_1.DOCUMENT_MODE.QUIRKS;
    }
    else {
        mode = doctype.getDocumentMode(token);
    }
    const conforming = doctype.isConforming(token);
    if (!conforming) {
        p._err(token, error_codes_js_1.ERR.nonConformingDoctype);
    }
    p.treeAdapter.setDocumentMode(p.document, mode);
    p.insertionMode = InsertionMode.BEFORE_HTML;
}
|
|
|
|
// Any other token in the "initial" mode: report the missing DOCTYPE, put the document into
// quirks mode and reprocess the token in the "before html" mode.
function tokenInInitialMode(p, token) {
    const { missingDoctype } = error_codes_js_1.ERR;
    p._err(token, missingDoctype, true);
    const { QUIRKS } = html_js_1.DOCUMENT_MODE;
    p.treeAdapter.setDocumentMode(p.document, QUIRKS);
    // The mode must be switched before the token is fed back in.
    p.insertionMode = InsertionMode.BEFORE_HTML;
    p._processToken(token);
}
|
|
|
|
// The "before html" insertion mode
|
|
|
|
//------------------------------------------------------------------
|
|
|
|
// Start tag in the "before html" mode: an <html> tag is inserted and the parser moves to
// "before head"; every other tag goes through tokenBeforeHtml.
function startTagBeforeHtml(p, token) {
    if (token.tagID !== html_js_1.TAG_ID.HTML) {
        tokenBeforeHtml(p, token);
        return;
    }
    p._insertElement(token, html_js_1.NS.HTML);
    p.insertionMode = InsertionMode.BEFORE_HEAD;
}
|
|
|
|
// End tag in the "before html" mode: only </html>, </head>, </body> and </br> are forwarded
// to tokenBeforeHtml; all other end tags are dropped.
function endTagBeforeHtml(p, token) {
    switch (token.tagID) {
        case html_js_1.TAG_ID.HTML:
        case html_js_1.TAG_ID.HEAD:
        case html_js_1.TAG_ID.BODY:
        case html_js_1.TAG_ID.BR:
            tokenBeforeHtml(p, token);
            break;
        default:
        // Do nothing
    }
}
|
|
|
|
// Inserts a fake root element, switches to "before head" and reprocesses the token there.
function tokenBeforeHtml(p, token) {
    p._insertFakeRootElement();
    // Switch first so the reprocessed token is handled by the new mode.
    p.insertionMode = InsertionMode.BEFORE_HEAD;
    p._processToken(token);
}
|
|
|
|
// The "before head" insertion mode
|
|
|
|
//------------------------------------------------------------------
|
|
|
|
// Start tag in the "before head" mode: <html> is handled as in body, <head> is inserted and
// remembered as the head element, anything else goes through tokenBeforeHead.
function startTagBeforeHead(p, token) {
    const id = token.tagID;
    if (id === html_js_1.TAG_ID.HTML) {
        startTagInBody(p, token);
    }
    else if (id === html_js_1.TAG_ID.HEAD) {
        p._insertElement(token, html_js_1.NS.HTML);
        p.headElement = p.openElements.current;
        p.insertionMode = InsertionMode.IN_HEAD;
    }
    else {
        tokenBeforeHead(p, token);
    }
}
|
|
|
|
// End tag in the "before head" mode: </head>, </body>, </html> and </br> go through
// tokenBeforeHead; any other end tag is reported as having no matching open element.
function endTagBeforeHead(p, token) {
    switch (token.tagID) {
        case html_js_1.TAG_ID.HEAD:
        case html_js_1.TAG_ID.BODY:
        case html_js_1.TAG_ID.HTML:
        case html_js_1.TAG_ID.BR:
            tokenBeforeHead(p, token);
            break;
        default:
            p._err(token, error_codes_js_1.ERR.endTagWithoutMatchingOpenElement);
    }
}
|
|
|
|
// Inserts a fake <head>, remembers it as the head element, switches to "in head" and
// reprocesses the token there.
function tokenBeforeHead(p, token) {
    const { TAG_NAMES, TAG_ID } = html_js_1;
    p._insertFakeElement(TAG_NAMES.HEAD, TAG_ID.HEAD);
    p.headElement = p.openElements.current;
    // Switch first so the reprocessed token is handled by the new mode.
    p.insertionMode = InsertionMode.IN_HEAD;
    p._processToken(token);
}
|
|
|
|
// The "in head" insertion mode
|
|
|
|
//------------------------------------------------------------------
|
|
|
|
// Start tag in the "in head" mode, dispatched on the tag ID. Tags without a dedicated branch
// go through tokenInHead.
function startTagInHead(p, token) {
    const { TAG_ID, NS } = html_js_1;
    const { TokenizerMode } = index_js_1;
    switch (token.tagID) {
        case TAG_ID.HTML:
            startTagInBody(p, token);
            return;
        // Elements that are appended without being pushed; self-closing flag is acknowledged.
        case TAG_ID.BASE:
        case TAG_ID.BASEFONT:
        case TAG_ID.BGSOUND:
        case TAG_ID.LINK:
        case TAG_ID.META:
            p._appendElement(token, NS.HTML);
            token.ackSelfClosing = true;
            return;
        case TAG_ID.TITLE:
            p._switchToTextParsing(token, TokenizerMode.RCDATA);
            return;
        case TAG_ID.NOSCRIPT:
            // With scripting enabled <noscript> is raw text; otherwise it is a real element
            // with its own insertion mode.
            if (p.options.scriptingEnabled) {
                p._switchToTextParsing(token, TokenizerMode.RAWTEXT);
            }
            else {
                p._insertElement(token, NS.HTML);
                p.insertionMode = InsertionMode.IN_HEAD_NO_SCRIPT;
            }
            return;
        case TAG_ID.NOFRAMES:
        case TAG_ID.STYLE:
            p._switchToTextParsing(token, TokenizerMode.RAWTEXT);
            return;
        case TAG_ID.SCRIPT:
            p._switchToTextParsing(token, TokenizerMode.SCRIPT_DATA);
            return;
        case TAG_ID.TEMPLATE:
            p._insertTemplate(token);
            p.activeFormattingElements.insertMarker();
            p.framesetOk = false;
            p.insertionMode = InsertionMode.IN_TEMPLATE;
            p.tmplInsertionModeStack.unshift(InsertionMode.IN_TEMPLATE);
            return;
        case TAG_ID.HEAD:
            p._err(token, error_codes_js_1.ERR.misplacedStartTagForHeadElement);
            return;
        default:
            tokenInHead(p, token);
    }
}
|
|
|
|
// End tag in the "in head" mode.
// </head> pops the current node and moves to "after head"; </body>, </br> and </html> go
// through tokenInHead; </template> closes the innermost open template (if any); every other
// end tag is reported as having no matching open element.
function endTagInHead(p, token) {
    const { TAG_ID } = html_js_1;
    const { ERR } = error_codes_js_1;
    const id = token.tagID;
    if (id === TAG_ID.HEAD) {
        p.openElements.pop();
        p.insertionMode = InsertionMode.AFTER_HEAD;
        return;
    }
    if (id === TAG_ID.BODY || id === TAG_ID.BR || id === TAG_ID.HTML) {
        tokenInHead(p, token);
        return;
    }
    if (id !== TAG_ID.TEMPLATE || !(p.openElements.tmplCount > 0)) {
        // Unknown end tag, or a </template> with no template open.
        p._err(token, ERR.endTagWithoutMatchingOpenElement);
        return;
    }
    p.openElements.generateImpliedEndTagsThoroughly();
    if (p.openElements.currentTagId !== TAG_ID.TEMPLATE) {
        p._err(token, ERR.closingOfElementWithOpenChildElements);
    }
    p.openElements.popUntilTagNamePopped(TAG_ID.TEMPLATE);
    p.activeFormattingElements.clearToLastMarker();
    p.tmplInsertionModeStack.shift();
    p._resetInsertionMode();
}
|
|
|
|
// Pops the current node, switches to "after head" and reprocesses the token there.
function tokenInHead(p, token) {
    p.openElements.pop();
    // Switch first so the reprocessed token is handled by the new mode.
    p.insertionMode = InsertionMode.AFTER_HEAD;
    p._processToken(token);
}
|
|
|
|
// The "in head no script" insertion mode
|
|
|
|
//------------------------------------------------------------------
|
|
|
|
// Start tag in the "in head noscript" mode: <html> is handled as in body, a fixed set of
// head-level tags is handled as in head, a nested <noscript> is an error, and anything else
// goes through tokenInHeadNoScript.
function startTagInHeadNoScript(p, token) {
    const { TAG_ID } = html_js_1;
    switch (token.tagID) {
        case TAG_ID.HTML:
            startTagInBody(p, token);
            return;
        case TAG_ID.BASEFONT:
        case TAG_ID.BGSOUND:
        case TAG_ID.HEAD:
        case TAG_ID.LINK:
        case TAG_ID.META:
        case TAG_ID.NOFRAMES:
        case TAG_ID.STYLE:
            startTagInHead(p, token);
            return;
        case TAG_ID.NOSCRIPT:
            p._err(token, error_codes_js_1.ERR.nestedNoscriptInHead);
            return;
        default:
            tokenInHeadNoScript(p, token);
    }
}
|
|
|
|
// End tag in the "in head noscript" mode: </noscript> pops the current node and returns to
// "in head", </br> goes through tokenInHeadNoScript, any other end tag is an error.
function endTagInHeadNoScript(p, token) {
    const id = token.tagID;
    if (id === html_js_1.TAG_ID.NOSCRIPT) {
        p.openElements.pop();
        p.insertionMode = InsertionMode.IN_HEAD;
    }
    else if (id === html_js_1.TAG_ID.BR) {
        tokenInHeadNoScript(p, token);
    }
    else {
        p._err(token, error_codes_js_1.ERR.endTagWithoutMatchingOpenElement);
    }
}
|
|
|
|
// Reports an error (a different code for EOF than for other tokens), pops the current node,
// returns to "in head" and reprocesses the token there.
function tokenInHeadNoScript(p, token) {
    const { ERR } = error_codes_js_1;
    let errCode;
    if (token.type === token_js_1.TokenType.EOF) {
        errCode = ERR.openElementsLeftAfterEof;
    }
    else {
        errCode = ERR.disallowedContentInNoscriptInHead;
    }
    p._err(token, errCode);
    p.openElements.pop();
    p.insertionMode = InsertionMode.IN_HEAD;
    p._processToken(token);
}
|
|
|
|
// The "after head" insertion mode
|
|
|
|
//------------------------------------------------------------------
|
|
|
|
// Start tag in the "after head" mode, dispatched on the tag ID. Tags without a dedicated
// branch go through tokenAfterHead.
function startTagAfterHead(p, token) {
    const { TAG_ID, NS } = html_js_1;
    const { ERR } = error_codes_js_1;
    switch (token.tagID) {
        case TAG_ID.HTML:
            startTagInBody(p, token);
            return;
        case TAG_ID.BODY:
            p._insertElement(token, NS.HTML);
            p.framesetOk = false;
            p.insertionMode = InsertionMode.IN_BODY;
            return;
        case TAG_ID.FRAMESET:
            p._insertElement(token, NS.HTML);
            p.insertionMode = InsertionMode.IN_FRAMESET;
            return;
        case TAG_ID.BASE:
        case TAG_ID.BASEFONT:
        case TAG_ID.BGSOUND:
        case TAG_ID.LINK:
        case TAG_ID.META:
        case TAG_ID.NOFRAMES:
        case TAG_ID.SCRIPT:
        case TAG_ID.STYLE:
        case TAG_ID.TEMPLATE:
        case TAG_ID.TITLE:
            // Head-only content after </head>: temporarily put the head element back on the
            // stack, handle the tag as in head, then take the head element off again.
            p._err(token, ERR.abandonedHeadElementChild);
            p.openElements.push(p.headElement, TAG_ID.HEAD);
            startTagInHead(p, token);
            p.openElements.remove(p.headElement);
            return;
        case TAG_ID.HEAD:
            p._err(token, ERR.misplacedStartTagForHeadElement);
            return;
        default:
            tokenAfterHead(p, token);
    }
}
|
|
|
|
// End tag in the "after head" mode: </body>, </html> and </br> go through tokenAfterHead,
// </template> is handled as in head, any other end tag is an error.
function endTagAfterHead(p, token) {
    const { TAG_ID } = html_js_1;
    const id = token.tagID;
    if (id === TAG_ID.BODY || id === TAG_ID.HTML || id === TAG_ID.BR) {
        tokenAfterHead(p, token);
    }
    else if (id === TAG_ID.TEMPLATE) {
        endTagInHead(p, token);
    }
    else {
        p._err(token, error_codes_js_1.ERR.endTagWithoutMatchingOpenElement);
    }
}
|
|
|
|
// Inserts a fake <body>, switches to "in body" and hands the token to modeInBody.
function tokenAfterHead(p, token) {
    const { TAG_NAMES, TAG_ID } = html_js_1;
    p._insertFakeElement(TAG_NAMES.BODY, TAG_ID.BODY);
    p.insertionMode = InsertionMode.IN_BODY;
    modeInBody(p, token);
}
|
|
|
|
// The "in body" insertion mode
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
// Dispatches a token to the matching "in body" handler based on its type. Token types
// without a handler here are ignored.
function modeInBody(p, token) {
    const { TokenType } = token_js_1;
    const kind = token.type;
    if (kind === TokenType.CHARACTER) {
        characterInBody(p, token);
    }
    else if (kind === TokenType.WHITESPACE_CHARACTER) {
        whitespaceCharacterInBody(p, token);
    }
    else if (kind === TokenType.COMMENT) {
        appendComment(p, token);
    }
    else if (kind === TokenType.START_TAG) {
        startTagInBody(p, token);
    }
    else if (kind === TokenType.END_TAG) {
        endTagInBody(p, token);
    }
    else if (kind === TokenType.EOF) {
        eofInBody(p, token);
    }
    // Anything else: do nothing
}
|
2020-12-18 22:06:30 +00:00
|
|
|
// Whitespace in body: reconstruct the active formatting elements, then insert the characters.
// Unlike characterInBody, the frameset-ok flag is left untouched.
function whitespaceCharacterInBody(p, token) {
    p._reconstructActiveFormattingElements();
    p._insertCharacters(token);
}
|
|
|
|
// Non-whitespace characters in body: reconstruct the active formatting elements, insert the
// characters and clear the frameset-ok flag.
function characterInBody(p, token) {
    p._reconstructActiveFormattingElements();
    p._insertCharacters(token);
    // Real text content rules out a later <frameset>.
    p.framesetOk = false;
}
|
|
|
|
// <html> start tag in body: unless a template is open, merge the token's attributes into
// the bottom-most element of the open element stack.
function htmlStartTagInBody(p, token) {
    if (p.openElements.tmplCount !== 0) {
        return;
    }
    const rootElement = p.openElements.items[0];
    p.treeAdapter.adoptAttributes(rootElement, token.attrs);
}
|
|
|
|
// <body> start tag in body: when a properly nested body element exists and no template is
// open, clear the frameset-ok flag and merge the token's attributes into that body element.
function bodyStartTagInBody(p, token) {
    const existingBody = p.openElements.tryPeekProperlyNestedBodyElement();
    if (!existingBody || p.openElements.tmplCount !== 0) {
        return;
    }
    p.framesetOk = false;
    p.treeAdapter.adoptAttributes(existingBody, token.attrs);
}
|
|
|
|
// <frameset> start tag in body: only acted upon while the frameset-ok flag is set and a
// properly nested body element exists. The body is detached, the stack is popped back to the
// html element, the frameset is inserted and the parser moves to "in frameset".
function framesetStartTagInBody(p, token) {
    const existingBody = p.openElements.tryPeekProperlyNestedBodyElement();
    if (!p.framesetOk || !existingBody) {
        return;
    }
    p.treeAdapter.detachNode(existingBody);
    p.openElements.popAllUpToHtmlElement();
    p._insertElement(token, html_js_1.NS.HTML);
    p.insertionMode = InsertionMode.IN_FRAMESET;
}
|
|
|
|
// Closes an open <p> that is in button scope (if any), then inserts the element.
function addressStartTagInBody(p, token) {
    const paragraphInScope = p.openElements.hasInButtonScope(html_js_1.TAG_ID.P);
    if (paragraphInScope) {
        p._closePElement();
    }
    p._insertElement(token, html_js_1.NS.HTML);
}
|
|
|
|
// Heading start tag: closes an open <p> in button scope, pops the current node when it is
// itself a numbered header, then inserts the new element.
function numberedHeaderStartTagInBody(p, token) {
    const paragraphInScope = p.openElements.hasInButtonScope(html_js_1.TAG_ID.P);
    if (paragraphInScope) {
        p._closePElement();
    }
    const currentIsHeader = (0, html_js_1.isNumberedHeader)(p.openElements.currentTagId);
    if (currentIsHeader) {
        p.openElements.pop();
    }
    p._insertElement(token, html_js_1.NS.HTML);
}
|
|
|
|
// Closes an open <p> in button scope, inserts the element, asks for the next leading
// newline to be skipped and clears the frameset-ok flag.
function preStartTagInBody(p, token) {
    const paragraphInScope = p.openElements.hasInButtonScope(html_js_1.TAG_ID.P);
    if (paragraphInScope) {
        p._closePElement();
    }
    p._insertElement(token, html_js_1.NS.HTML);
    //NOTE: a U+000A LINE FEED (LF) character token that immediately follows is to be ignored
    //(newlines at the start of pre blocks are dropped as an authoring convenience).
    p.skipNextNewLine = true;
    p.framesetOk = false;
}
|
|
|
|
// <form> start tag: ignored when a form element is already tracked and no template is open.
// Otherwise an open <p> in button scope is closed, the form is inserted and, outside of
// templates, remembered as the parser's form element.
function formStartTagInBody(p, token) {
    const inTemplate = p.openElements.tmplCount > 0;
    if (p.formElement && !inTemplate) {
        return;
    }
    if (p.openElements.hasInButtonScope(html_js_1.TAG_ID.P)) {
        p._closePElement();
    }
    p._insertElement(token, html_js_1.NS.HTML);
    if (inTemplate) {
        return;
    }
    p.formElement = p.openElements.current;
}
|
|
|
|
// <li>/<dd>/<dt> start tag: clears the frameset-ok flag, then scans the open element stack
// from the top for an item of the same family (li for li; dd or dt for dd/dt) and closes it.
// The scan stops at the first special element other than address, div and p. Finally an
// open <p> in button scope is closed and the new element is inserted.
function listItemStartTagInBody(p, token) {
    const { TAG_ID } = html_js_1;
    p.framesetOk = false;
    const tn = token.tagID;
    const isListItem = tn === TAG_ID.LI;
    const isDefinitionItem = tn === TAG_ID.DD || tn === TAG_ID.DT;
    for (let i = p.openElements.stackTop; i >= 0; i--) {
        const elementId = p.openElements.tagIDs[i];
        const sameFamily = isListItem
            ? elementId === TAG_ID.LI
            : isDefinitionItem && (elementId === TAG_ID.DD || elementId === TAG_ID.DT);
        if (sameFamily) {
            p.openElements.generateImpliedEndTagsWithExclusion(elementId);
            p.openElements.popUntilTagNamePopped(elementId);
            break;
        }
        const transparentToScan = elementId === TAG_ID.ADDRESS || elementId === TAG_ID.DIV || elementId === TAG_ID.P;
        if (!transparentToScan && p._isSpecialElement(p.openElements.items[i], elementId)) {
            break;
        }
    }
    if (p.openElements.hasInButtonScope(TAG_ID.P)) {
        p._closePElement();
    }
    p._insertElement(token, html_js_1.NS.HTML);
}
|
|
|
|
// Closes an open <p> in button scope, inserts the element and switches the tokenizer to
// its PLAINTEXT state.
function plaintextStartTagInBody(p, token) {
    const paragraphInScope = p.openElements.hasInButtonScope(html_js_1.TAG_ID.P);
    if (paragraphInScope) {
        p._closePElement();
    }
    p._insertElement(token, html_js_1.NS.HTML);
    p.tokenizer.state = index_js_1.TokenizerMode.PLAINTEXT;
}
|
|
|
|
// <button> start tag: an already open button in scope is closed first (implied end tags,
// then pop up to and including it). Afterwards the active formatting elements are
// reconstructed, the new button is inserted and the frameset-ok flag is cleared.
function buttonStartTagInBody(p, token) {
    const { BUTTON } = html_js_1.TAG_ID;
    if (p.openElements.hasInScope(BUTTON)) {
        p.openElements.generateImpliedEndTags();
        p.openElements.popUntilTagNamePopped(BUTTON);
    }
    p._reconstructActiveFormattingElements();
    p._insertElement(token, html_js_1.NS.HTML);
    p.framesetOk = false;
}
|
|
|
|
// <a> start tag: if an <a> entry is still among the active formatting elements in scope, the
// adoption agency is run and that entry's element is removed from both the open element
// stack and the active formatting list. The new <a> is then inserted and registered as an
// active formatting element.
function aStartTagInBody(p, token) {
    const staleAnchorEntry = p.activeFormattingElements.getElementEntryInScopeWithTagName(html_js_1.TAG_NAMES.A);
    if (staleAnchorEntry) {
        callAdoptionAgency(p, token);
        p.openElements.remove(staleAnchorEntry.element);
        p.activeFormattingElements.removeEntry(staleAnchorEntry);
    }
    p._reconstructActiveFormattingElements();
    p._insertElement(token, html_js_1.NS.HTML);
    const inserted = p.openElements.current;
    p.activeFormattingElements.pushElement(inserted, token);
}
|
|
|
|
// Formatting start tag: reconstruct the active formatting elements, insert the element and
// register it as an active formatting element.
function bStartTagInBody(p, token) {
    p._reconstructActiveFormattingElements();
    p._insertElement(token, html_js_1.NS.HTML);
    const inserted = p.openElements.current;
    p.activeFormattingElements.pushElement(inserted, token);
}
|
|
|
|
// <nobr> start tag: reconstruct the active formatting elements; if a <nobr> is already in
// scope, run the adoption agency and reconstruct again. Then insert the element and register
// it as an active formatting element.
function nobrStartTagInBody(p, token) {
    p._reconstructActiveFormattingElements();
    const nobrInScope = p.openElements.hasInScope(html_js_1.TAG_ID.NOBR);
    if (nobrInScope) {
        callAdoptionAgency(p, token);
        p._reconstructActiveFormattingElements();
    }
    p._insertElement(token, html_js_1.NS.HTML);
    const inserted = p.openElements.current;
    p.activeFormattingElements.pushElement(inserted, token);
}
|
|
|
|
// Reconstructs the active formatting elements, inserts the element, places a marker on the
// active formatting list and clears the frameset-ok flag.
function appletStartTagInBody(p, token) {
    p._reconstructActiveFormattingElements();
    p._insertElement(token, html_js_1.NS.HTML);
    // The marker separates formatting elements inside the new element from those outside it.
    p.activeFormattingElements.insertMarker();
    p.framesetOk = false;
}
|
|
|
|
// <table> start tag: outside of quirks mode an open <p> in button scope is closed first.
// The table is then inserted, the frameset-ok flag cleared and the parser moves to "in table".
function tableStartTagInBody(p, token) {
    const inQuirksMode = p.treeAdapter.getDocumentMode(p.document) === html_js_1.DOCUMENT_MODE.QUIRKS;
    if (!inQuirksMode && p.openElements.hasInButtonScope(html_js_1.TAG_ID.P)) {
        p._closePElement();
    }
    p._insertElement(token, html_js_1.NS.HTML);
    p.framesetOk = false;
    p.insertionMode = InsertionMode.IN_TABLE;
}
|
|
|
|
// Reconstructs the active formatting elements, appends the element (without pushing it on
// the stack), clears the frameset-ok flag and acknowledges the self-closing flag.
function areaStartTagInBody(p, token) {
    p._reconstructActiveFormattingElements();
    p._appendElement(token, html_js_1.NS.HTML);
    p.framesetOk = false;
    token.ackSelfClosing = true;
}
|
2022-05-17 01:25:05 +00:00
|
|
|
// Returns true when the token has a `type` attribute whose lower-cased value equals
// HIDDEN_INPUT_TYPE; a missing attribute yields false.
function isHiddenInput(token) {
    const typeValue = (0, token_js_1.getTokenAttr)(token, html_js_1.ATTRS.TYPE);
    if (typeValue == null) {
        return false;
    }
    return typeValue.toLowerCase() === HIDDEN_INPUT_TYPE;
}
|
2020-12-18 22:06:30 +00:00
|
|
|
// <input> start tag: reconstruct the active formatting elements and append the element.
// Only non-hidden inputs clear the frameset-ok flag. The self-closing flag is acknowledged.
function inputStartTagInBody(p, token) {
    p._reconstructActiveFormattingElements();
    p._appendElement(token, html_js_1.NS.HTML);
    const hidden = isHiddenInput(token);
    if (!hidden) {
        p.framesetOk = false;
    }
    token.ackSelfClosing = true;
}
|
|
|
|
// Appends the element (without pushing it on the stack) and acknowledges the self-closing flag.
function paramStartTagInBody(p, token) {
    const { HTML: htmlNamespace } = html_js_1.NS;
    p._appendElement(token, htmlNamespace);
    token.ackSelfClosing = true;
}
|
|
|
|
// <hr> start tag: closes an open <p> in button scope, appends the element, clears the
// frameset-ok flag and acknowledges the self-closing flag.
function hrStartTagInBody(p, token) {
    const paragraphInScope = p.openElements.hasInButtonScope(html_js_1.TAG_ID.P);
    if (paragraphInScope) {
        p._closePElement();
    }
    p._appendElement(token, html_js_1.NS.HTML);
    p.framesetOk = false;
    token.ackSelfClosing = true;
}
|
|
|
|
// <image> start tag: the token is rewritten in place to an <img> token (name and ID) and then
// handled by areaStartTagInBody.
function imageStartTagInBody(p, token) {
    const { TAG_NAMES, TAG_ID } = html_js_1;
    token.tagName = TAG_NAMES.IMG;
    token.tagID = TAG_ID.IMG;
    areaStartTagInBody(p, token);
}
|
|
|
|
// <textarea> start tag: inserts the element, asks for the next leading newline to be
// skipped, switches the tokenizer to RCDATA, remembers the current insertion mode as the
// original one, clears the frameset-ok flag and moves the parser to the "text" mode.
function textareaStartTagInBody(p, token) {
    p._insertElement(token, html_js_1.NS.HTML);
    //NOTE: a U+000A LINE FEED (LF) character token that immediately follows is to be ignored
    //(newlines at the start of textarea elements are dropped as an authoring convenience).
    p.skipNextNewLine = true;
    p.tokenizer.state = index_js_1.TokenizerMode.RCDATA;
    // Save the mode to return to before overwriting it below.
    p.originalInsertionMode = p.insertionMode;
    p.framesetOk = false;
    p.insertionMode = InsertionMode.TEXT;
}
|
|
|
|
// <xmp> start tag: closes an open <p> in button scope, reconstructs the active formatting
// elements, clears the frameset-ok flag and switches to raw-text parsing.
function xmpStartTagInBody(p, token) {
    const paragraphInScope = p.openElements.hasInButtonScope(html_js_1.TAG_ID.P);
    if (paragraphInScope) {
        p._closePElement();
    }
    p._reconstructActiveFormattingElements();
    p.framesetOk = false;
    p._switchToTextParsing(token, index_js_1.TokenizerMode.RAWTEXT);
}
|
|
|
|
// <iframe> start tag: clears the frameset-ok flag and switches to raw-text parsing.
function iframeStartTagInBody(p, token) {
    p.framesetOk = false;
    const { RAWTEXT } = index_js_1.TokenizerMode;
    p._switchToTextParsing(token, RAWTEXT);
}
|
|
|
|
//NOTE: here we assume that we always act as a user agent with enabled plugins, so we parse
|
2022-05-17 01:25:05 +00:00
|
|
|
//<noembed> as rawtext.
|
2020-12-18 22:06:30 +00:00
|
|
|
// <noembed> start tag: its content is always parsed as raw text.
function noembedStartTagInBody(p, token) {
    const { RAWTEXT } = index_js_1.TokenizerMode;
    p._switchToTextParsing(token, RAWTEXT);
}
|
|
|
|
// <select> start tag: reconstructs the active formatting elements, inserts the element and
// clears the frameset-ok flag. The next insertion mode is "in select in table" when the
// parser is currently in one of the table-related modes, and "in select" otherwise.
function selectStartTagInBody(p, token) {
    p._reconstructActiveFormattingElements();
    p._insertElement(token, html_js_1.NS.HTML);
    p.framesetOk = false;
    switch (p.insertionMode) {
        case InsertionMode.IN_TABLE:
        case InsertionMode.IN_CAPTION:
        case InsertionMode.IN_TABLE_BODY:
        case InsertionMode.IN_ROW:
        case InsertionMode.IN_CELL:
            p.insertionMode = InsertionMode.IN_SELECT_IN_TABLE;
            break;
        default:
            p.insertionMode = InsertionMode.IN_SELECT;
    }
}
|
|
|
|
/**
 * Handles `<option>` and `<optgroup>` start tags dispatched from
 * `startTagInBody`.
 *
 * Pops the current node if it is an `<option>`, reconstructs the active
 * formatting elements, then inserts the new element in the HTML namespace.
 *
 * @param p Parser instance.
 * @param token The start tag token.
 */
function optgroupStartTagInBody(p, token) {
    if (p.openElements.currentTagId === html_js_1.TAG_ID.OPTION) {
        p.openElements.pop();
    }
    p._reconstructActiveFormattingElements();
    p._insertElement(token, html_js_1.NS.HTML);
}
|
|
|
|
/**
 * Handles `<rb>` and `<rtc>` start tags dispatched from `startTagInBody`.
 *
 * When a `<ruby>` element is in scope, implied end tags are generated first;
 * the new element is then inserted in the HTML namespace.
 *
 * @param p Parser instance.
 * @param token The start tag token.
 */
function rbStartTagInBody(p, token) {
    if (p.openElements.hasInScope(html_js_1.TAG_ID.RUBY)) {
        p.openElements.generateImpliedEndTags();
    }
    p._insertElement(token, html_js_1.NS.HTML);
}
|
|
|
|
/**
 * Handles `<rt>` and `<rp>` start tags dispatched from `startTagInBody`.
 *
 * When a `<ruby>` element is in scope, implied end tags are generated with
 * `<rtc>` excluded; the new element is then inserted in the HTML namespace.
 *
 * @param p Parser instance.
 * @param token The start tag token.
 */
function rtStartTagInBody(p, token) {
    if (p.openElements.hasInScope(html_js_1.TAG_ID.RUBY)) {
        p.openElements.generateImpliedEndTagsWithExclusion(html_js_1.TAG_ID.RTC);
    }
    p._insertElement(token, html_js_1.NS.HTML);
}
|
|
|
|
/**
 * Handles a `<math>` start tag dispatched from `startTagInBody`.
 *
 * Reconstructs the active formatting elements, adjusts the token's MathML and
 * XML attributes, then appends (self-closing) or inserts the element in the
 * MathML namespace. The self-closing flag is always acknowledged.
 *
 * @param p Parser instance.
 * @param token The start tag token; its attributes may be adjusted in place
 *     by the `foreignContent` helpers and `ackSelfClosing` is set.
 */
function mathStartTagInBody(p, token) {
    p._reconstructActiveFormattingElements();
    foreignContent.adjustTokenMathMLAttrs(token);
    foreignContent.adjustTokenXMLAttrs(token);
    if (token.selfClosing) {
        p._appendElement(token, html_js_1.NS.MATHML);
    } else {
        p._insertElement(token, html_js_1.NS.MATHML);
    }
    token.ackSelfClosing = true;
}
|
|
|
|
/**
 * Handles an `<svg>` start tag dispatched from `startTagInBody`.
 *
 * Reconstructs the active formatting elements, adjusts the token's SVG and
 * XML attributes, then appends (self-closing) or inserts the element in the
 * SVG namespace. The self-closing flag is always acknowledged.
 *
 * @param p Parser instance.
 * @param token The start tag token; its attributes may be adjusted in place
 *     by the `foreignContent` helpers and `ackSelfClosing` is set.
 */
function svgStartTagInBody(p, token) {
    p._reconstructActiveFormattingElements();
    foreignContent.adjustTokenSVGAttrs(token);
    foreignContent.adjustTokenXMLAttrs(token);
    if (token.selfClosing) {
        p._appendElement(token, html_js_1.NS.SVG);
    } else {
        p._insertElement(token, html_js_1.NS.SVG);
    }
    token.ackSelfClosing = true;
}
|
|
|
|
/**
 * Fallback start-tag handler used by `startTagInBody`: reconstructs the
 * active formatting elements and inserts the element in the HTML namespace.
 *
 * @param p Parser instance.
 * @param token The start tag token.
 */
function genericStartTagInBody(p, token) {
    p._reconstructActiveFormattingElements();
    p._insertElement(token, html_js_1.NS.HTML);
}
|
|
|
|
/**
 * Dispatches a start tag token to the matching handler, keyed on
 * `token.tagID`.
 *
 * Tags that share a handler are grouped under one `case` list. Table
 * structure tags plus `<head>` and `<frame>` are ignored, and anything not
 * listed falls through to `genericStartTagInBody`.
 *
 * @param p Parser instance.
 * @param token The start tag token.
 */
function startTagInBody(p, token) {
    switch (token.tagID) {
        case html_js_1.TAG_ID.I:
        case html_js_1.TAG_ID.S:
        case html_js_1.TAG_ID.B:
        case html_js_1.TAG_ID.U:
        case html_js_1.TAG_ID.EM:
        case html_js_1.TAG_ID.TT:
        case html_js_1.TAG_ID.BIG:
        case html_js_1.TAG_ID.CODE:
        case html_js_1.TAG_ID.FONT:
        case html_js_1.TAG_ID.SMALL:
        case html_js_1.TAG_ID.STRIKE:
        case html_js_1.TAG_ID.STRONG: {
            bStartTagInBody(p, token);
            break;
        }
        case html_js_1.TAG_ID.A: {
            aStartTagInBody(p, token);
            break;
        }
        case html_js_1.TAG_ID.H1:
        case html_js_1.TAG_ID.H2:
        case html_js_1.TAG_ID.H3:
        case html_js_1.TAG_ID.H4:
        case html_js_1.TAG_ID.H5:
        case html_js_1.TAG_ID.H6: {
            numberedHeaderStartTagInBody(p, token);
            break;
        }
        case html_js_1.TAG_ID.P:
        case html_js_1.TAG_ID.DL:
        case html_js_1.TAG_ID.OL:
        case html_js_1.TAG_ID.UL:
        case html_js_1.TAG_ID.DIV:
        case html_js_1.TAG_ID.DIR:
        case html_js_1.TAG_ID.NAV:
        case html_js_1.TAG_ID.MAIN:
        case html_js_1.TAG_ID.MENU:
        case html_js_1.TAG_ID.ASIDE:
        case html_js_1.TAG_ID.CENTER:
        case html_js_1.TAG_ID.FIGURE:
        case html_js_1.TAG_ID.FOOTER:
        case html_js_1.TAG_ID.HEADER:
        case html_js_1.TAG_ID.HGROUP:
        case html_js_1.TAG_ID.DIALOG:
        case html_js_1.TAG_ID.DETAILS:
        case html_js_1.TAG_ID.ADDRESS:
        case html_js_1.TAG_ID.ARTICLE:
        case html_js_1.TAG_ID.SECTION:
        case html_js_1.TAG_ID.SUMMARY:
        case html_js_1.TAG_ID.FIELDSET:
        case html_js_1.TAG_ID.BLOCKQUOTE:
        case html_js_1.TAG_ID.FIGCAPTION: {
            addressStartTagInBody(p, token);
            break;
        }
        case html_js_1.TAG_ID.LI:
        case html_js_1.TAG_ID.DD:
        case html_js_1.TAG_ID.DT: {
            listItemStartTagInBody(p, token);
            break;
        }
        case html_js_1.TAG_ID.BR:
        case html_js_1.TAG_ID.IMG:
        case html_js_1.TAG_ID.WBR:
        case html_js_1.TAG_ID.AREA:
        case html_js_1.TAG_ID.EMBED:
        case html_js_1.TAG_ID.KEYGEN: {
            areaStartTagInBody(p, token);
            break;
        }
        case html_js_1.TAG_ID.HR: {
            hrStartTagInBody(p, token);
            break;
        }
        case html_js_1.TAG_ID.RB:
        case html_js_1.TAG_ID.RTC: {
            rbStartTagInBody(p, token);
            break;
        }
        case html_js_1.TAG_ID.RT:
        case html_js_1.TAG_ID.RP: {
            rtStartTagInBody(p, token);
            break;
        }
        case html_js_1.TAG_ID.PRE:
        case html_js_1.TAG_ID.LISTING: {
            preStartTagInBody(p, token);
            break;
        }
        case html_js_1.TAG_ID.XMP: {
            xmpStartTagInBody(p, token);
            break;
        }
        case html_js_1.TAG_ID.SVG: {
            svgStartTagInBody(p, token);
            break;
        }
        case html_js_1.TAG_ID.HTML: {
            htmlStartTagInBody(p, token);
            break;
        }
        case html_js_1.TAG_ID.BASE:
        case html_js_1.TAG_ID.LINK:
        case html_js_1.TAG_ID.META:
        case html_js_1.TAG_ID.STYLE:
        case html_js_1.TAG_ID.TITLE:
        case html_js_1.TAG_ID.SCRIPT:
        case html_js_1.TAG_ID.BGSOUND:
        case html_js_1.TAG_ID.BASEFONT:
        case html_js_1.TAG_ID.TEMPLATE: {
            startTagInHead(p, token);
            break;
        }
        case html_js_1.TAG_ID.BODY: {
            bodyStartTagInBody(p, token);
            break;
        }
        case html_js_1.TAG_ID.FORM: {
            formStartTagInBody(p, token);
            break;
        }
        case html_js_1.TAG_ID.NOBR: {
            nobrStartTagInBody(p, token);
            break;
        }
        case html_js_1.TAG_ID.MATH: {
            mathStartTagInBody(p, token);
            break;
        }
        case html_js_1.TAG_ID.TABLE: {
            tableStartTagInBody(p, token);
            break;
        }
        case html_js_1.TAG_ID.INPUT: {
            inputStartTagInBody(p, token);
            break;
        }
        case html_js_1.TAG_ID.PARAM:
        case html_js_1.TAG_ID.TRACK:
        case html_js_1.TAG_ID.SOURCE: {
            paramStartTagInBody(p, token);
            break;
        }
        case html_js_1.TAG_ID.IMAGE: {
            imageStartTagInBody(p, token);
            break;
        }
        case html_js_1.TAG_ID.BUTTON: {
            buttonStartTagInBody(p, token);
            break;
        }
        case html_js_1.TAG_ID.APPLET:
        case html_js_1.TAG_ID.OBJECT:
        case html_js_1.TAG_ID.MARQUEE: {
            appletStartTagInBody(p, token);
            break;
        }
        case html_js_1.TAG_ID.IFRAME: {
            iframeStartTagInBody(p, token);
            break;
        }
        case html_js_1.TAG_ID.SELECT: {
            selectStartTagInBody(p, token);
            break;
        }
        case html_js_1.TAG_ID.OPTION:
        case html_js_1.TAG_ID.OPTGROUP: {
            optgroupStartTagInBody(p, token);
            break;
        }
        case html_js_1.TAG_ID.NOEMBED: {
            noembedStartTagInBody(p, token);
            break;
        }
        case html_js_1.TAG_ID.FRAMESET: {
            framesetStartTagInBody(p, token);
            break;
        }
        case html_js_1.TAG_ID.TEXTAREA: {
            textareaStartTagInBody(p, token);
            break;
        }
        case html_js_1.TAG_ID.NOSCRIPT: {
            // With scripting enabled <noscript> is parsed like <noembed> (raw text);
            // otherwise it is inserted as an ordinary element.
            if (p.options.scriptingEnabled) {
                noembedStartTagInBody(p, token);
            } else {
                genericStartTagInBody(p, token);
            }
            break;
        }
        case html_js_1.TAG_ID.PLAINTEXT: {
            plaintextStartTagInBody(p, token);
            break;
        }
        case html_js_1.TAG_ID.COL:
        case html_js_1.TAG_ID.TH:
        case html_js_1.TAG_ID.TD:
        case html_js_1.TAG_ID.TR:
        case html_js_1.TAG_ID.HEAD:
        case html_js_1.TAG_ID.FRAME:
        case html_js_1.TAG_ID.TBODY:
        case html_js_1.TAG_ID.TFOOT:
        case html_js_1.TAG_ID.THEAD:
        case html_js_1.TAG_ID.CAPTION:
        case html_js_1.TAG_ID.COLGROUP: {
            // Ignore token
            break;
        }
        default: {
            genericStartTagInBody(p, token);
        }
    }
}
|
2022-05-17 01:25:05 +00:00
|
|
|
/**
 * Handles a `</body>` end tag dispatched from `endTagInBody`.
 *
 * Does nothing unless a `<body>` element is in scope. Otherwise switches the
 * insertion mode to AFTER_BODY and, when source location tracking is on,
 * records the end location on the properly nested body element (if any).
 *
 * @param p Parser instance.
 * @param token The end tag token.
 */
function bodyEndTagInBody(p, token) {
    if (!p.openElements.hasInScope(html_js_1.TAG_ID.BODY)) {
        return;
    }
    p.insertionMode = InsertionMode.AFTER_BODY;
    //NOTE: <body> is never popped from the stack, so we need to update
    //the end location explicitly.
    if (p.options.sourceCodeLocationInfo) {
        const bodyElement = p.openElements.tryPeekProperlyNestedBodyElement();
        if (bodyElement) {
            p._setEndLocation(bodyElement, token);
        }
    }
}
|
|
|
|
/**
 * Handles a `</html>` end tag dispatched from `endTagInBody`.
 *
 * When a `<body>` element is in scope, switches to AFTER_BODY and forwards
 * the same token to `endTagAfterBody`; otherwise the token is dropped.
 *
 * @param p Parser instance.
 * @param token The end tag token.
 */
function htmlEndTagInBody(p, token) {
    if (!p.openElements.hasInScope(html_js_1.TAG_ID.BODY)) {
        return;
    }
    p.insertionMode = InsertionMode.AFTER_BODY;
    endTagAfterBody(p, token);
}
|
|
|
|
/**
 * Handles end tags of the block-level elements that `endTagInBody` groups
 * with `</address>`.
 *
 * If an element with the token's tag ID is in scope, implied end tags are
 * generated and the stack is popped until that element has been popped.
 *
 * @param p Parser instance.
 * @param token The end tag token.
 */
function addressEndTagInBody(p, token) {
    const tagId = token.tagID;
    if (p.openElements.hasInScope(tagId)) {
        p.openElements.generateImpliedEndTags();
        p.openElements.popUntilTagNamePopped(tagId);
    }
}
|
|
|
|
/**
 * Handles a `</form>` end tag dispatched from `endTagInBody`.
 *
 * Outside of a template (`tmplCount === 0`) the parser's form element pointer
 * is cleared. If there was a form pointer (or we are inside a template) and a
 * `<form>` is in scope, implied end tags are generated; inside a template the
 * stack is then popped up to and including `<form>`, otherwise only the
 * remembered form element is removed from the stack.
 *
 * @param p Parser instance.
 */
function formEndTagInBody(p) {
    const inTemplate = p.openElements.tmplCount > 0;
    // Capture the pointer before it is (possibly) reset below.
    const { formElement } = p;
    if (!inTemplate) {
        p.formElement = null;
    }
    if ((formElement || inTemplate) && p.openElements.hasInScope(html_js_1.TAG_ID.FORM)) {
        p.openElements.generateImpliedEndTags();
        if (inTemplate) {
            p.openElements.popUntilTagNamePopped(html_js_1.TAG_ID.FORM);
        } else if (formElement) {
            p.openElements.remove(formElement);
        }
    }
}
|
|
|
|
/**
 * Handles a `</p>` end tag dispatched from `endTagInBody`.
 *
 * If no `<p>` is in button scope a fake `<p>` element is inserted first, so
 * that the subsequent close always has something to close.
 *
 * @param p Parser instance.
 */
function pEndTagInBody(p) {
    if (!p.openElements.hasInButtonScope(html_js_1.TAG_ID.P)) {
        p._insertFakeElement(html_js_1.TAG_NAMES.P, html_js_1.TAG_ID.P);
    }
    p._closePElement();
}
|
|
|
|
/**
 * Handles an `</li>` end tag dispatched from `endTagInBody`.
 *
 * If an `<li>` is in list-item scope, implied end tags are generated (with
 * `<li>` excluded) and the stack is popped until an `<li>` has been popped.
 *
 * @param p Parser instance.
 */
function liEndTagInBody(p) {
    if (p.openElements.hasInListItemScope(html_js_1.TAG_ID.LI)) {
        p.openElements.generateImpliedEndTagsWithExclusion(html_js_1.TAG_ID.LI);
        p.openElements.popUntilTagNamePopped(html_js_1.TAG_ID.LI);
    }
}
|
|
|
|
/**
 * Handles `</dd>` and `</dt>` end tags dispatched from `endTagInBody`.
 *
 * If an element with the token's tag ID is in scope, implied end tags are
 * generated (excluding that tag) and the stack is popped until it is popped.
 *
 * @param p Parser instance.
 * @param token The end tag token.
 */
function ddEndTagInBody(p, token) {
    const tagId = token.tagID;
    if (p.openElements.hasInScope(tagId)) {
        p.openElements.generateImpliedEndTagsWithExclusion(tagId);
        p.openElements.popUntilTagNamePopped(tagId);
    }
}
|
|
|
|
/**
 * Handles `</h1>`…`</h6>` end tags dispatched from `endTagInBody`.
 *
 * If any numbered header is in scope, implied end tags are generated and the
 * stack is popped until a numbered header has been popped.
 *
 * @param p Parser instance.
 */
function numberedHeaderEndTagInBody(p) {
    if (p.openElements.hasNumberedHeaderInScope()) {
        p.openElements.generateImpliedEndTags();
        p.openElements.popUntilNumberedHeaderPopped();
    }
}
|
|
|
|
/**
 * Handles `</applet>`, `</object>` and `</marquee>` end tags dispatched from
 * `endTagInBody`.
 *
 * If an element with the token's tag ID is in scope, implied end tags are
 * generated, the stack is popped until that element is popped, and the list
 * of active formatting elements is cleared back to the last marker.
 *
 * @param p Parser instance.
 * @param token The end tag token.
 */
function appletEndTagInBody(p, token) {
    const tagId = token.tagID;
    if (p.openElements.hasInScope(tagId)) {
        p.openElements.generateImpliedEndTags();
        p.openElements.popUntilTagNamePopped(tagId);
        p.activeFormattingElements.clearToLastMarker();
    }
}
|
|
|
|
/**
 * Handles a `</br>` end tag dispatched from `endTagInBody`.
 *
 * Reconstructs the active formatting elements, inserts a fake `<br>` element
 * and immediately pops it again, and clears `framesetOk`.
 *
 * @param p Parser instance.
 */
function brEndTagInBody(p) {
    p._reconstructActiveFormattingElements();
    p._insertFakeElement(html_js_1.TAG_NAMES.BR, html_js_1.TAG_ID.BR);
    p.openElements.pop();
    p.framesetOk = false;
}
|
|
|
|
/**
 * Fallback end-tag handler used by `endTagInBody`.
 *
 * Walks the stack of open elements from the top down to index 1. On the first
 * element matching the token, implied end tags are generated (excluding the
 * token's tag) and the stack is shortened to that element's index. The walk
 * stops without changes as soon as a special element is encountered first.
 *
 * @param p Parser instance.
 * @param token The end tag token.
 */
function genericEndTagInBody(p, token) {
    const tn = token.tagName;
    const tid = token.tagID;
    for (let i = p.openElements.stackTop; i > 0; i--) {
        const element = p.openElements.items[i];
        const elementId = p.openElements.tagIDs[i];
        // Compare the tag name here, as the tag might not be a known tag with an ID.
        if (tid === elementId && (tid !== html_js_1.TAG_ID.UNKNOWN || p.treeAdapter.getTagName(element) === tn)) {
            p.openElements.generateImpliedEndTagsWithExclusion(tid);
            // Generating implied end tags may already have popped past index i.
            if (p.openElements.stackTop >= i) {
                p.openElements.shortenToLength(i);
            }
            break;
        }
        if (p._isSpecialElement(element, elementId)) {
            break;
        }
    }
}
|
|
|
|
/**
 * Dispatches an end tag token to the matching handler, keyed on
 * `token.tagID`.
 *
 * Formatting elements go through the adoption agency, `</template>` is
 * delegated to `endTagInHead`, and any tag not listed falls through to
 * `genericEndTagInBody`.
 *
 * @param p Parser instance.
 * @param token The end tag token.
 */
function endTagInBody(p, token) {
    switch (token.tagID) {
        case html_js_1.TAG_ID.A:
        case html_js_1.TAG_ID.B:
        case html_js_1.TAG_ID.I:
        case html_js_1.TAG_ID.S:
        case html_js_1.TAG_ID.U:
        case html_js_1.TAG_ID.EM:
        case html_js_1.TAG_ID.TT:
        case html_js_1.TAG_ID.BIG:
        case html_js_1.TAG_ID.CODE:
        case html_js_1.TAG_ID.FONT:
        case html_js_1.TAG_ID.NOBR:
        case html_js_1.TAG_ID.SMALL:
        case html_js_1.TAG_ID.STRIKE:
        case html_js_1.TAG_ID.STRONG: {
            callAdoptionAgency(p, token);
            break;
        }
        case html_js_1.TAG_ID.P: {
            pEndTagInBody(p);
            break;
        }
        case html_js_1.TAG_ID.DL:
        case html_js_1.TAG_ID.UL:
        case html_js_1.TAG_ID.OL:
        case html_js_1.TAG_ID.DIR:
        case html_js_1.TAG_ID.DIV:
        case html_js_1.TAG_ID.NAV:
        case html_js_1.TAG_ID.PRE:
        case html_js_1.TAG_ID.MAIN:
        case html_js_1.TAG_ID.MENU:
        case html_js_1.TAG_ID.ASIDE:
        case html_js_1.TAG_ID.CENTER:
        case html_js_1.TAG_ID.FIGURE:
        case html_js_1.TAG_ID.FOOTER:
        case html_js_1.TAG_ID.HEADER:
        case html_js_1.TAG_ID.HGROUP:
        case html_js_1.TAG_ID.DIALOG:
        case html_js_1.TAG_ID.ADDRESS:
        case html_js_1.TAG_ID.ARTICLE:
        case html_js_1.TAG_ID.DETAILS:
        case html_js_1.TAG_ID.SECTION:
        case html_js_1.TAG_ID.SUMMARY:
        case html_js_1.TAG_ID.LISTING:
        case html_js_1.TAG_ID.FIELDSET:
        case html_js_1.TAG_ID.BLOCKQUOTE:
        case html_js_1.TAG_ID.FIGCAPTION: {
            addressEndTagInBody(p, token);
            break;
        }
        case html_js_1.TAG_ID.LI: {
            liEndTagInBody(p);
            break;
        }
        case html_js_1.TAG_ID.DD:
        case html_js_1.TAG_ID.DT: {
            ddEndTagInBody(p, token);
            break;
        }
        case html_js_1.TAG_ID.H1:
        case html_js_1.TAG_ID.H2:
        case html_js_1.TAG_ID.H3:
        case html_js_1.TAG_ID.H4:
        case html_js_1.TAG_ID.H5:
        case html_js_1.TAG_ID.H6: {
            numberedHeaderEndTagInBody(p);
            break;
        }
        case html_js_1.TAG_ID.BR: {
            brEndTagInBody(p);
            break;
        }
        case html_js_1.TAG_ID.BODY: {
            bodyEndTagInBody(p, token);
            break;
        }
        case html_js_1.TAG_ID.HTML: {
            htmlEndTagInBody(p, token);
            break;
        }
        case html_js_1.TAG_ID.FORM: {
            formEndTagInBody(p);
            break;
        }
        case html_js_1.TAG_ID.APPLET:
        case html_js_1.TAG_ID.OBJECT:
        case html_js_1.TAG_ID.MARQUEE: {
            appletEndTagInBody(p, token);
            break;
        }
        case html_js_1.TAG_ID.TEMPLATE: {
            endTagInHead(p, token);
            break;
        }
        default: {
            genericEndTagInBody(p, token);
        }
    }
}
|
|
|
|
/**
 * Handles end-of-file for the body handlers: delegates to `eofInTemplate`
 * while the template insertion mode stack is non-empty, otherwise stops
 * parsing.
 *
 * @param p Parser instance.
 * @param token The EOF token.
 */
function eofInBody(p, token) {
    if (p.tmplInsertionModeStack.length > 0) {
        eofInTemplate(p, token);
    } else {
        stopParsing(p, token);
    }
}
|
|
|
|
// The "text" insertion mode
|
|
|
|
//------------------------------------------------------------------
|
|
|
|
/**
 * Handles an end tag in the "text" insertion mode.
 *
 * For `</script>` the optional `p.scriptHandler` is invoked (with `p` as
 * `this`) on the current element. The current element is then popped and the
 * insertion mode restored to the one saved in `originalInsertionMode`.
 *
 * @param p Parser instance.
 * @param token The end tag token.
 */
function endTagInText(p, token) {
    if (token.tagID === html_js_1.TAG_ID.SCRIPT) {
        // The handler is optional; skip the call when it is null or undefined.
        const handler = p.scriptHandler;
        if (handler !== null && handler !== undefined) {
            handler.call(p, p.openElements.current);
        }
    }
    p.openElements.pop();
    p.insertionMode = p.originalInsertionMode;
}
|
|
|
|
/**
 * Handles end-of-file in the "text" insertion mode.
 *
 * Reports `eofInElementThatCanContainOnlyText`, pops the current element,
 * restores the saved insertion mode and re-dispatches the EOF token through
 * `p.onEof`.
 *
 * @param p Parser instance.
 * @param token The EOF token.
 */
function eofInText(p, token) {
    p._err(token, error_codes_js_1.ERR.eofInElementThatCanContainOnlyText);
    p.openElements.pop();
    p.insertionMode = p.originalInsertionMode;
    p.onEof(token);
}
|
|
|
|
// The "in table" insertion mode
|
|
|
|
//------------------------------------------------------------------
|
|
|
|
/**
 * Handles a character token in the "in table" insertion mode.
 *
 * When the current node is one of `TABLE_STRUCTURE_TAGS`, the pending
 * character buffer is reset, the current mode is saved, the parser switches
 * to IN_TABLE_TEXT and the token is forwarded to the matching table-text
 * handler (other token types, i.e. null characters, are ignored). Otherwise
 * the token goes through `tokenInTable`.
 *
 * @param p Parser instance.
 * @param token The character token.
 */
function characterInTable(p, token) {
    if (!TABLE_STRUCTURE_TAGS.has(p.openElements.currentTagId)) {
        tokenInTable(p, token);
        return;
    }
    p.pendingCharacterTokens.length = 0;
    p.hasNonWhitespacePendingCharacterToken = false;
    p.originalInsertionMode = p.insertionMode;
    p.insertionMode = InsertionMode.IN_TABLE_TEXT;
    switch (token.type) {
        case token_js_1.TokenType.CHARACTER: {
            characterInTableText(p, token);
            break;
        }
        case token_js_1.TokenType.WHITESPACE_CHARACTER: {
            whitespaceCharacterInTableText(p, token);
            break;
        }
        // Ignore null
    }
}
|
|
|
|
/**
 * Handles a `<caption>` start tag in the "in table" insertion mode: clears
 * the stack back to a table context, pushes a marker onto the active
 * formatting elements, inserts the element and switches to IN_CAPTION.
 *
 * @param p Parser instance.
 * @param token The start tag token.
 */
function captionStartTagInTable(p, token) {
    p.openElements.clearBackToTableContext();
    p.activeFormattingElements.insertMarker();
    p._insertElement(token, html_js_1.NS.HTML);
    p.insertionMode = InsertionMode.IN_CAPTION;
}
|
|
|
|
/**
 * Handles a `<colgroup>` start tag in the "in table" insertion mode: clears
 * the stack back to a table context, inserts the element and switches to
 * IN_COLUMN_GROUP.
 *
 * @param p Parser instance.
 * @param token The start tag token.
 */
function colgroupStartTagInTable(p, token) {
    p.openElements.clearBackToTableContext();
    p._insertElement(token, html_js_1.NS.HTML);
    p.insertionMode = InsertionMode.IN_COLUMN_GROUP;
}
|
|
|
|
/**
 * Handles a `<col>` start tag in the "in table" insertion mode.
 *
 * Clears the stack back to a table context, inserts a fake `<colgroup>`,
 * switches to IN_COLUMN_GROUP and reprocesses the token with
 * `startTagInColumnGroup`.
 *
 * @param p Parser instance.
 * @param token The start tag token.
 */
function colStartTagInTable(p, token) {
    p.openElements.clearBackToTableContext();
    p._insertFakeElement(html_js_1.TAG_NAMES.COLGROUP, html_js_1.TAG_ID.COLGROUP);
    p.insertionMode = InsertionMode.IN_COLUMN_GROUP;
    startTagInColumnGroup(p, token);
}
|
|
|
|
/**
 * Handles `<tbody>`, `<tfoot>` and `<thead>` start tags in the "in table"
 * insertion mode: clears the stack back to a table context, inserts the
 * element and switches to IN_TABLE_BODY.
 *
 * @param p Parser instance.
 * @param token The start tag token.
 */
function tbodyStartTagInTable(p, token) {
    p.openElements.clearBackToTableContext();
    p._insertElement(token, html_js_1.NS.HTML);
    p.insertionMode = InsertionMode.IN_TABLE_BODY;
}
|
|
|
|
/**
 * Handles `<td>`, `<th>` and `<tr>` start tags in the "in table" insertion
 * mode.
 *
 * Clears the stack back to a table context, inserts a fake `<tbody>`,
 * switches to IN_TABLE_BODY and reprocesses the token with
 * `startTagInTableBody`.
 *
 * @param p Parser instance.
 * @param token The start tag token.
 */
function tdStartTagInTable(p, token) {
    p.openElements.clearBackToTableContext();
    p._insertFakeElement(html_js_1.TAG_NAMES.TBODY, html_js_1.TAG_ID.TBODY);
    p.insertionMode = InsertionMode.IN_TABLE_BODY;
    startTagInTableBody(p, token);
}
|
|
|
|
/**
 * Handles a nested `<table>` start tag in the "in table" insertion mode.
 *
 * If a `<table>` is in table scope, the stack is popped through that table,
 * the insertion mode is reset and the token is reprocessed; otherwise the
 * token is dropped.
 *
 * @param p Parser instance.
 * @param token The start tag token.
 */
function tableStartTagInTable(p, token) {
    if (!p.openElements.hasInTableScope(html_js_1.TAG_ID.TABLE)) {
        return;
    }
    p.openElements.popUntilTagNamePopped(html_js_1.TAG_ID.TABLE);
    p._resetInsertionMode();
    p._processStartTag(token);
}
|
|
|
|
/**
 * Handles an `<input>` start tag in the "in table" insertion mode.
 *
 * Inputs for which `isHiddenInput` returns true are appended directly; any
 * other input goes through `tokenInTable`. The self-closing flag is
 * acknowledged in both cases.
 *
 * @param p Parser instance.
 * @param token The start tag token; `ackSelfClosing` is set on it.
 */
function inputStartTagInTable(p, token) {
    if (isHiddenInput(token)) {
        p._appendElement(token, html_js_1.NS.HTML);
    } else {
        tokenInTable(p, token);
    }
    token.ackSelfClosing = true;
}
|
|
|
|
/**
 * Handles a `<form>` start tag in the "in table" insertion mode.
 *
 * Only acts when there is no form element pointer yet and the parser is not
 * inside a template: the form is inserted, remembered as `p.formElement`,
 * and immediately popped from the stack of open elements.
 *
 * @param p Parser instance.
 * @param token The start tag token.
 */
function formStartTagInTable(p, token) {
    if (p.formElement || p.openElements.tmplCount !== 0) {
        return;
    }
    p._insertElement(token, html_js_1.NS.HTML);
    p.formElement = p.openElements.current;
    p.openElements.pop();
}
|
|
|
|
/**
 * Dispatches a start tag token in the "in table" insertion mode, keyed on
 * `token.tagID`.
 *
 * `<style>`, `<script>` and `<template>` are delegated to `startTagInHead`;
 * tags without a dedicated table handler fall through to `tokenInTable`.
 *
 * @param p Parser instance.
 * @param token The start tag token.
 */
function startTagInTable(p, token) {
    switch (token.tagID) {
        case html_js_1.TAG_ID.TD:
        case html_js_1.TAG_ID.TH:
        case html_js_1.TAG_ID.TR: {
            tdStartTagInTable(p, token);
            break;
        }
        case html_js_1.TAG_ID.STYLE:
        case html_js_1.TAG_ID.SCRIPT:
        case html_js_1.TAG_ID.TEMPLATE: {
            startTagInHead(p, token);
            break;
        }
        case html_js_1.TAG_ID.COL: {
            colStartTagInTable(p, token);
            break;
        }
        case html_js_1.TAG_ID.FORM: {
            formStartTagInTable(p, token);
            break;
        }
        case html_js_1.TAG_ID.TABLE: {
            tableStartTagInTable(p, token);
            break;
        }
        case html_js_1.TAG_ID.TBODY:
        case html_js_1.TAG_ID.TFOOT:
        case html_js_1.TAG_ID.THEAD: {
            tbodyStartTagInTable(p, token);
            break;
        }
        case html_js_1.TAG_ID.INPUT: {
            inputStartTagInTable(p, token);
            break;
        }
        case html_js_1.TAG_ID.CAPTION: {
            captionStartTagInTable(p, token);
            break;
        }
        case html_js_1.TAG_ID.COLGROUP: {
            colgroupStartTagInTable(p, token);
            break;
        }
        default: {
            tokenInTable(p, token);
        }
    }
}
|
|
|
|
/**
 * Dispatches an end tag token in the "in table" insertion mode.
 *
 * `</table>` pops through the table and resets the insertion mode when a
 * table is in table scope; `</template>` is delegated to `endTagInHead`; end
 * tags of body/html and table-structure elements are ignored; everything
 * else goes through `tokenInTable`.
 *
 * @param p Parser instance.
 * @param token The end tag token.
 */
function endTagInTable(p, token) {
    switch (token.tagID) {
        case html_js_1.TAG_ID.TABLE: {
            if (p.openElements.hasInTableScope(html_js_1.TAG_ID.TABLE)) {
                p.openElements.popUntilTagNamePopped(html_js_1.TAG_ID.TABLE);
                p._resetInsertionMode();
            }
            break;
        }
        case html_js_1.TAG_ID.TEMPLATE: {
            endTagInHead(p, token);
            break;
        }
        case html_js_1.TAG_ID.BODY:
        case html_js_1.TAG_ID.CAPTION:
        case html_js_1.TAG_ID.COL:
        case html_js_1.TAG_ID.COLGROUP:
        case html_js_1.TAG_ID.HTML:
        case html_js_1.TAG_ID.TBODY:
        case html_js_1.TAG_ID.TD:
        case html_js_1.TAG_ID.TFOOT:
        case html_js_1.TAG_ID.TH:
        case html_js_1.TAG_ID.THEAD:
        case html_js_1.TAG_ID.TR: {
            // Ignore token
            break;
        }
        default: {
            tokenInTable(p, token);
        }
    }
}
|
|
|
|
/**
 * Processes a token with the body handler (`modeInBody`) while foster
 * parenting is temporarily enabled, then restores the previous
 * `fosterParentingEnabled` value.
 *
 * @param p Parser instance.
 * @param token The token to process.
 */
function tokenInTable(p, token) {
    const previousFosterParenting = p.fosterParentingEnabled;
    p.fosterParentingEnabled = true;
    // Process token in `In Body` mode
    modeInBody(p, token);
    p.fosterParentingEnabled = previousFosterParenting;
}
|
|
|
|
// The "in table text" insertion mode
|
|
|
|
//------------------------------------------------------------------
|
|
|
|
/**
 * Buffers a whitespace character token in the "in table text" insertion
 * mode by appending it to `p.pendingCharacterTokens`.
 *
 * @param p Parser instance.
 * @param token The whitespace character token.
 */
function whitespaceCharacterInTableText(p, token) {
    p.pendingCharacterTokens.push(token);
}
|
|
|
|
/**
 * Buffers a non-whitespace character token in the "in table text" insertion
 * mode and records that the pending buffer now contains non-whitespace.
 *
 * @param p Parser instance.
 * @param token The character token.
 */
function characterInTableText(p, token) {
    p.pendingCharacterTokens.push(token);
    p.hasNonWhitespacePendingCharacterToken = true;
}
|
|
|
|
/**
 * Handles any non-character token in the "in table text" insertion mode by
 * flushing the pending character tokens and reprocessing the token.
 *
 * If the buffer contains non-whitespace, every pending token is processed
 * via `tokenInTable`; otherwise the tokens are inserted directly as
 * characters. The saved insertion mode is then restored and the triggering
 * token is reprocessed.
 *
 * @param p Parser instance.
 * @param token The token that ended the table text run.
 */
function tokenInTableText(p, token) {
    if (p.hasNonWhitespacePendingCharacterToken) {
        for (const pending of p.pendingCharacterTokens) {
            tokenInTable(p, pending);
        }
    } else {
        for (const pending of p.pendingCharacterTokens) {
            p._insertCharacters(pending);
        }
    }
    p.insertionMode = p.originalInsertionMode;
    p._processToken(token);
}
|
|
|
|
// The "in caption" insertion mode
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
// Tag IDs of table-structure start tags that implicitly close an open <caption>
// (see startTagInCaption). Despite the name, these are not void elements.
const TABLE_VOID_ELEMENTS = new Set([
    html_js_1.TAG_ID.CAPTION,
    html_js_1.TAG_ID.COL,
    html_js_1.TAG_ID.COLGROUP,
    html_js_1.TAG_ID.TBODY,
    html_js_1.TAG_ID.TD,
    html_js_1.TAG_ID.TFOOT,
    html_js_1.TAG_ID.TH,
    html_js_1.TAG_ID.THEAD,
    html_js_1.TAG_ID.TR,
]);
|
2020-12-18 22:06:30 +00:00
|
|
|
/**
 * Handles a start tag in the "in caption" insertion mode.
 *
 * A tag in `TABLE_VOID_ELEMENTS` closes the caption when one is in table
 * scope (implied end tags, pop through `<caption>`, clear formatting elements
 * to the last marker, switch to IN_TABLE) and is then reprocessed by
 * `startTagInTable`; without a caption in scope it is dropped. Any other tag
 * is handled by `startTagInBody`.
 *
 * @param p Parser instance.
 * @param token The start tag token.
 */
function startTagInCaption(p, token) {
    const tagId = token.tagID;
    if (!TABLE_VOID_ELEMENTS.has(tagId)) {
        startTagInBody(p, token);
        return;
    }
    if (p.openElements.hasInTableScope(html_js_1.TAG_ID.CAPTION)) {
        p.openElements.generateImpliedEndTags();
        p.openElements.popUntilTagNamePopped(html_js_1.TAG_ID.CAPTION);
        p.activeFormattingElements.clearToLastMarker();
        p.insertionMode = InsertionMode.IN_TABLE;
        startTagInTable(p, token);
    }
}
|
|
|
|
/**
 * Handles an end tag in the "in caption" insertion mode.
 *
 * `</caption>` and `</table>` close the caption when one is in table scope
 * and switch to IN_TABLE; for `</table>` the token is additionally
 * reprocessed by `endTagInTable`. End tags of body/html and table-structure
 * elements are ignored; everything else is handled by `endTagInBody`.
 *
 * @param p Parser instance.
 * @param token The end tag token.
 */
function endTagInCaption(p, token) {
    const tn = token.tagID;
    switch (tn) {
        case html_js_1.TAG_ID.CAPTION:
        case html_js_1.TAG_ID.TABLE: {
            if (p.openElements.hasInTableScope(html_js_1.TAG_ID.CAPTION)) {
                p.openElements.generateImpliedEndTags();
                p.openElements.popUntilTagNamePopped(html_js_1.TAG_ID.CAPTION);
                p.activeFormattingElements.clearToLastMarker();
                p.insertionMode = InsertionMode.IN_TABLE;
                if (tn === html_js_1.TAG_ID.TABLE) {
                    endTagInTable(p, token);
                }
            }
            break;
        }
        case html_js_1.TAG_ID.BODY:
        case html_js_1.TAG_ID.COL:
        case html_js_1.TAG_ID.COLGROUP:
        case html_js_1.TAG_ID.HTML:
        case html_js_1.TAG_ID.TBODY:
        case html_js_1.TAG_ID.TD:
        case html_js_1.TAG_ID.TFOOT:
        case html_js_1.TAG_ID.TH:
        case html_js_1.TAG_ID.THEAD:
        case html_js_1.TAG_ID.TR: {
            // Ignore token
            break;
        }
        default: {
            endTagInBody(p, token);
        }
    }
}
|
|
|
|
// The "in column group" insertion mode
|
|
|
|
//------------------------------------------------------------------
|
|
|
|
/**
 * Handles a start tag in the "in column group" insertion mode.
 *
 * `<html>` is handled by `startTagInBody`, `<col>` is appended (with its
 * self-closing flag acknowledged), `<template>` is delegated to
 * `startTagInHead`, and everything else goes through `tokenInColumnGroup`.
 *
 * @param p Parser instance.
 * @param token The start tag token.
 */
function startTagInColumnGroup(p, token) {
    switch (token.tagID) {
        case html_js_1.TAG_ID.HTML: {
            startTagInBody(p, token);
            break;
        }
        case html_js_1.TAG_ID.COL: {
            p._appendElement(token, html_js_1.NS.HTML);
            token.ackSelfClosing = true;
            break;
        }
        case html_js_1.TAG_ID.TEMPLATE: {
            startTagInHead(p, token);
            break;
        }
        default: {
            tokenInColumnGroup(p, token);
        }
    }
}
|
|
|
|
/**
 * Handles an end tag in the "in column group" insertion mode.
 *
 * `</colgroup>` pops the current node and switches to IN_TABLE, but only
 * when the current node is a `<colgroup>`; `</template>` is delegated to
 * `endTagInHead`; `</col>` is ignored; everything else goes through
 * `tokenInColumnGroup`.
 *
 * @param p Parser instance.
 * @param token The end tag token.
 */
function endTagInColumnGroup(p, token) {
    switch (token.tagID) {
        case html_js_1.TAG_ID.COLGROUP: {
            if (p.openElements.currentTagId === html_js_1.TAG_ID.COLGROUP) {
                p.openElements.pop();
                p.insertionMode = InsertionMode.IN_TABLE;
            }
            break;
        }
        case html_js_1.TAG_ID.TEMPLATE: {
            endTagInHead(p, token);
            break;
        }
        case html_js_1.TAG_ID.COL: {
            // Ignore token
            break;
        }
        default: {
            tokenInColumnGroup(p, token);
        }
    }
}
|
|
|
|
/**
 * Fallback for the "in column group" insertion mode.
 *
 * When the current node is a `<colgroup>`, it is popped, the parser switches
 * to IN_TABLE and the token is reprocessed; otherwise the token is dropped.
 *
 * @param p Parser instance.
 * @param token The token to reprocess.
 */
function tokenInColumnGroup(p, token) {
    if (p.openElements.currentTagId !== html_js_1.TAG_ID.COLGROUP) {
        return;
    }
    p.openElements.pop();
    p.insertionMode = InsertionMode.IN_TABLE;
    p._processToken(token);
}
|
|
|
|
// The "in table body" insertion mode
|
|
|
|
//------------------------------------------------------------------
|
|
|
|
/**
 * Handles a start tag in the "in table body" insertion mode.
 *
 * - `<tr>`: clear back to a table body context, insert it, switch to IN_ROW.
 * - `<th>`/`<td>`: same, but with a fake `<tr>`, then reprocess the token
 *   with `startTagInRow`.
 * - caption/col/colgroup/tbody/tfoot/thead: if a table body context is in
 *   table scope, close the current section, switch to IN_TABLE and reprocess
 *   with `startTagInTable`; otherwise the token is dropped.
 * - anything else: `startTagInTable`.
 *
 * @param p Parser instance.
 * @param token The start tag token.
 */
function startTagInTableBody(p, token) {
    switch (token.tagID) {
        case html_js_1.TAG_ID.TR: {
            p.openElements.clearBackToTableBodyContext();
            p._insertElement(token, html_js_1.NS.HTML);
            p.insertionMode = InsertionMode.IN_ROW;
            break;
        }
        case html_js_1.TAG_ID.TH:
        case html_js_1.TAG_ID.TD: {
            p.openElements.clearBackToTableBodyContext();
            p._insertFakeElement(html_js_1.TAG_NAMES.TR, html_js_1.TAG_ID.TR);
            p.insertionMode = InsertionMode.IN_ROW;
            startTagInRow(p, token);
            break;
        }
        case html_js_1.TAG_ID.CAPTION:
        case html_js_1.TAG_ID.COL:
        case html_js_1.TAG_ID.COLGROUP:
        case html_js_1.TAG_ID.TBODY:
        case html_js_1.TAG_ID.TFOOT:
        case html_js_1.TAG_ID.THEAD: {
            if (p.openElements.hasTableBodyContextInTableScope()) {
                p.openElements.clearBackToTableBodyContext();
                p.openElements.pop();
                p.insertionMode = InsertionMode.IN_TABLE;
                startTagInTable(p, token);
            }
            break;
        }
        default: {
            startTagInTable(p, token);
        }
    }
}
|
|
|
|
/**
 * Handles an end tag in the "in table body" insertion mode.
 *
 * - `</tbody>`/`</tfoot>`/`</thead>`: if that element is in table scope,
 *   clear back to a table body context, pop it and switch to IN_TABLE.
 * - `</table>`: if a table body context is in table scope, close the section
 *   the same way and reprocess the token with `endTagInTable`.
 * - body/caption/col/colgroup/html/td/th/tr end tags are ignored.
 * - anything else: `endTagInTable`.
 *
 * @param p Parser instance.
 * @param token The end tag token.
 */
function endTagInTableBody(p, token) {
    const tn = token.tagID;
    switch (tn) {
        case html_js_1.TAG_ID.TBODY:
        case html_js_1.TAG_ID.TFOOT:
        case html_js_1.TAG_ID.THEAD: {
            if (p.openElements.hasInTableScope(tn)) {
                p.openElements.clearBackToTableBodyContext();
                p.openElements.pop();
                p.insertionMode = InsertionMode.IN_TABLE;
            }
            break;
        }
        case html_js_1.TAG_ID.TABLE: {
            if (p.openElements.hasTableBodyContextInTableScope()) {
                p.openElements.clearBackToTableBodyContext();
                p.openElements.pop();
                p.insertionMode = InsertionMode.IN_TABLE;
                endTagInTable(p, token);
            }
            break;
        }
        case html_js_1.TAG_ID.BODY:
        case html_js_1.TAG_ID.CAPTION:
        case html_js_1.TAG_ID.COL:
        case html_js_1.TAG_ID.COLGROUP:
        case html_js_1.TAG_ID.HTML:
        case html_js_1.TAG_ID.TD:
        case html_js_1.TAG_ID.TH:
        case html_js_1.TAG_ID.TR: {
            // Ignore token
            break;
        }
        default: {
            endTagInTable(p, token);
        }
    }
}
|
|
|
|
// The "in row" insertion mode
|
|
|
|
//------------------------------------------------------------------
|
|
|
|
// Start-tag handler for the "in row" insertion mode.
//   p     - parser instance
//   token - start tag token; dispatch is on token.tagID
function startTagInRow(p, token) {
    const T = html_js_1.TAG_ID;
    const id = token.tagID;
    const isCell = id === T.TH || id === T.TD;
    if (isCell) {
        p.openElements.clearBackToTableRowContext();
        p._insertElement(token, html_js_1.NS.HTML);
        p.insertionMode = InsertionMode.IN_CELL;
        p.activeFormattingElements.insertMarker();
        return;
    }
    const endsRow = id === T.CAPTION ||
        id === T.COL ||
        id === T.COLGROUP ||
        id === T.TBODY ||
        id === T.TFOOT ||
        id === T.THEAD ||
        id === T.TR;
    if (!endsRow) {
        startTagInTable(p, token);
        return;
    }
    // Leave the row (when one is in table scope) and reprocess in "in table body".
    if (p.openElements.hasInTableScope(T.TR)) {
        p.openElements.clearBackToTableRowContext();
        p.openElements.pop();
        p.insertionMode = InsertionMode.IN_TABLE_BODY;
        startTagInTableBody(p, token);
    }
}
|
|
|
|
// End-tag handler for the "in row" insertion mode.
//   p     - parser instance
//   token - end tag token; dispatch is on token.tagID
function endTagInRow(p, token) {
    const T = html_js_1.TAG_ID;
    const id = token.tagID;
    const rowInScope = () => p.openElements.hasInTableScope(T.TR);
    // Clears back to the table row context, pops the current node and
    // switches to the "in table body" mode.
    const leaveRow = () => {
        p.openElements.clearBackToTableRowContext();
        p.openElements.pop();
        p.insertionMode = InsertionMode.IN_TABLE_BODY;
    };
    if (id === T.TR) {
        if (rowInScope()) {
            leaveRow();
        }
        return;
    }
    if (id === T.TABLE) {
        if (rowInScope()) {
            leaveRow();
            endTagInTableBody(p, token);
        }
        return;
    }
    if (id === T.TBODY || id === T.TFOOT || id === T.THEAD) {
        if (p.openElements.hasInTableScope(id) || rowInScope()) {
            leaveRow();
            endTagInTableBody(p, token);
        }
        return;
    }
    const ignored = id === T.BODY ||
        id === T.CAPTION ||
        id === T.COL ||
        id === T.COLGROUP ||
        id === T.HTML ||
        id === T.TD ||
        id === T.TH;
    if (!ignored) {
        endTagInTable(p, token);
    }
}
|
|
|
|
// The "in cell" insertion mode
|
|
|
|
//------------------------------------------------------------------
|
|
|
|
// Start-tag handler for the "in cell" insertion mode. Tags listed in
// TABLE_VOID_ELEMENTS close the open cell (if a <td>/<th> is in table scope) and
// are reprocessed by the "in row" handler; everything else goes to "in body".
function startTagInCell(p, token) {
    if (!TABLE_VOID_ELEMENTS.has(token.tagID)) {
        startTagInBody(p, token);
        return;
    }
    const T = html_js_1.TAG_ID;
    const cellInScope = p.openElements.hasInTableScope(T.TD) || p.openElements.hasInTableScope(T.TH);
    if (cellInScope) {
        p._closeTableCell();
        startTagInRow(p, token);
    }
}
|
|
|
|
// End-tag handler for the "in cell" insertion mode.
//   p     - parser instance
//   token - end tag token; dispatch is on token.tagID
function endTagInCell(p, token) {
    const T = html_js_1.TAG_ID;
    const id = token.tagID;
    if (id === T.TD || id === T.TH) {
        // Close the cell itself and go back to "in row".
        if (p.openElements.hasInTableScope(id)) {
            p.openElements.generateImpliedEndTags();
            p.openElements.popUntilTagNamePopped(id);
            p.activeFormattingElements.clearToLastMarker();
            p.insertionMode = InsertionMode.IN_ROW;
        }
        return;
    }
    const isTableStructure = id === T.TABLE ||
        id === T.TBODY ||
        id === T.TFOOT ||
        id === T.THEAD ||
        id === T.TR;
    if (isTableStructure) {
        // Close the cell, then let the "in row" handler process the end tag.
        if (p.openElements.hasInTableScope(id)) {
            p._closeTableCell();
            endTagInRow(p, token);
        }
        return;
    }
    const ignored = id === T.BODY ||
        id === T.CAPTION ||
        id === T.COL ||
        id === T.COLGROUP ||
        id === T.HTML;
    if (!ignored) {
        endTagInBody(p, token);
    }
}
|
|
|
|
// The "in select" insertion mode
|
|
|
|
//------------------------------------------------------------------
|
|
|
|
// Start-tag handler for the "in select" insertion mode. Tags without a rule
// here are ignored.
//   p     - parser instance
//   token - start tag token; dispatch is on token.tagID
function startTagInSelect(p, token) {
    const T = html_js_1.TAG_ID;
    const id = token.tagID;
    if (id === T.HTML) {
        startTagInBody(p, token);
        return;
    }
    if (id === T.OPTION) {
        if (p.openElements.currentTagId === T.OPTION) {
            p.openElements.pop();
        }
        p._insertElement(token, html_js_1.NS.HTML);
        return;
    }
    if (id === T.OPTGROUP) {
        // An open <option> and then an open <optgroup> are closed before inserting.
        if (p.openElements.currentTagId === T.OPTION) {
            p.openElements.pop();
        }
        if (p.openElements.currentTagId === T.OPTGROUP) {
            p.openElements.pop();
        }
        p._insertElement(token, html_js_1.NS.HTML);
        return;
    }
    if (id === T.INPUT || id === T.KEYGEN || id === T.TEXTAREA || id === T.SELECT) {
        if (!p.openElements.hasInSelectScope(T.SELECT)) {
            return;
        }
        p.openElements.popUntilTagNamePopped(T.SELECT);
        p._resetInsertionMode();
        // A nested <select> start tag only closes the select; the other tags are reprocessed.
        if (id !== T.SELECT) {
            p._processStartTag(token);
        }
        return;
    }
    if (id === T.SCRIPT || id === T.TEMPLATE) {
        startTagInHead(p, token);
    }
}
|
|
|
|
// End-tag handler for the "in select" insertion mode. Tags without a rule
// here are ignored.
//   p     - parser instance
//   token - end tag token; dispatch is on token.tagID
function endTagInSelect(p, token) {
    const T = html_js_1.TAG_ID;
    const id = token.tagID;
    if (id === T.OPTGROUP) {
        // An <option> sitting directly on top of an <optgroup> is closed first.
        const optionOnOptgroup = p.openElements.stackTop > 0 &&
            p.openElements.currentTagId === T.OPTION &&
            p.openElements.tagIDs[p.openElements.stackTop - 1] === T.OPTGROUP;
        if (optionOnOptgroup) {
            p.openElements.pop();
        }
        if (p.openElements.currentTagId === T.OPTGROUP) {
            p.openElements.pop();
        }
        return;
    }
    if (id === T.OPTION) {
        if (p.openElements.currentTagId === T.OPTION) {
            p.openElements.pop();
        }
        return;
    }
    if (id === T.SELECT) {
        if (p.openElements.hasInSelectScope(T.SELECT)) {
            p.openElements.popUntilTagNamePopped(T.SELECT);
            p._resetInsertionMode();
        }
        return;
    }
    if (id === T.TEMPLATE) {
        endTagInHead(p, token);
    }
}
|
2022-05-17 01:25:05 +00:00
|
|
|
// The "in select in table" insertion mode
|
2020-12-18 22:06:30 +00:00
|
|
|
//------------------------------------------------------------------
|
|
|
|
// Start-tag handler for the "in select in table" insertion mode. Table
// structure tags pop the stack through <select>, reset the insertion mode and
// are reprocessed; all other tags use the plain "in select" handler.
function startTagInSelectInTable(p, token) {
    const T = html_js_1.TAG_ID;
    switch (token.tagID) {
        case T.CAPTION:
        case T.TABLE:
        case T.TBODY:
        case T.TFOOT:
        case T.THEAD:
        case T.TR:
        case T.TD:
        case T.TH:
            p.openElements.popUntilTagNamePopped(T.SELECT);
            p._resetInsertionMode();
            p._processStartTag(token);
            break;
        default:
            startTagInSelect(p, token);
    }
}
|
|
|
|
// End-tag handler for the "in select in table" insertion mode. A table
// structure end tag whose element is in table scope pops the stack through
// <select>, resets the insertion mode and is re-dispatched via p.onEndTag;
// when the element is not in table scope the tag is ignored. All other end
// tags use the plain "in select" handler.
function endTagInSelectInTable(p, token) {
    const T = html_js_1.TAG_ID;
    const id = token.tagID;
    switch (id) {
        case T.CAPTION:
        case T.TABLE:
        case T.TBODY:
        case T.TFOOT:
        case T.THEAD:
        case T.TR:
        case T.TD:
        case T.TH:
            if (p.openElements.hasInTableScope(id)) {
                p.openElements.popUntilTagNamePopped(T.SELECT);
                p._resetInsertionMode();
                p.onEndTag(token);
            }
            break;
        default:
            endTagInSelect(p, token);
    }
}
|
|
|
|
// The "in template" insertion mode
|
|
|
|
//------------------------------------------------------------------
|
|
|
|
// Start-tag handler for the "in template" insertion mode.
// Head-level tags are forwarded to the "in head" handler without a mode change.
// Every other tag selects an insertion mode, stores it both in slot 0 of
// p.tmplInsertionModeStack and in p.insertionMode, and is then processed by the
// handler belonging to that mode.
function startTagInTemplate(p, token) {
    const T = html_js_1.TAG_ID;
    let mode;
    let handler;
    switch (token.tagID) {
        // Tags that can start without a mode change
        case T.BASE:
        case T.BASEFONT:
        case T.BGSOUND:
        case T.LINK:
        case T.META:
        case T.NOFRAMES:
        case T.SCRIPT:
        case T.STYLE:
        case T.TEMPLATE:
        case T.TITLE:
            startTagInHead(p, token);
            return;
        // Tags that are re-processed in a specific mode
        case T.CAPTION:
        case T.COLGROUP:
        case T.TBODY:
        case T.TFOOT:
        case T.THEAD:
            mode = InsertionMode.IN_TABLE;
            handler = startTagInTable;
            break;
        case T.COL:
            mode = InsertionMode.IN_COLUMN_GROUP;
            handler = startTagInColumnGroup;
            break;
        case T.TR:
            mode = InsertionMode.IN_TABLE_BODY;
            handler = startTagInTableBody;
            break;
        case T.TD:
        case T.TH:
            mode = InsertionMode.IN_ROW;
            handler = startTagInRow;
            break;
        default:
            mode = InsertionMode.IN_BODY;
            handler = startTagInBody;
    }
    p.tmplInsertionModeStack[0] = mode;
    p.insertionMode = mode;
    handler(p, token);
}
|
|
|
|
// End-tag handler for the "in template" insertion mode: only </template> is
// acted on (via the "in head" handler); every other end tag is ignored.
function endTagInTemplate(p, token) {
    if (token.tagID !== html_js_1.TAG_ID.TEMPLATE) {
        return;
    }
    endTagInHead(p, token);
}
|
|
|
|
// EOF handler for the "in template" insertion mode. With no template on the
// open element stack parsing stops. Otherwise the stack is popped through the
// template, the formatting list is cleared to its last marker, the first
// template insertion mode is dropped, the insertion mode is reset and the EOF
// token is dispatched again through p.onEof.
function eofInTemplate(p, token) {
    if (!(p.openElements.tmplCount > 0)) {
        stopParsing(p, token);
        return;
    }
    p.openElements.popUntilTagNamePopped(html_js_1.TAG_ID.TEMPLATE);
    p.activeFormattingElements.clearToLastMarker();
    p.tmplInsertionModeStack.shift();
    p._resetInsertionMode();
    p.onEof(token);
}
|
|
|
|
// The "after body" insertion mode
|
|
|
|
//------------------------------------------------------------------
|
|
|
|
// Start-tag handler for the "after body" insertion mode: <html> is processed by
// the "in body" handler, anything else goes through tokenAfterBody.
function startTagAfterBody(p, token) {
    const handle = token.tagID === html_js_1.TAG_ID.HTML ? startTagInBody : tokenAfterBody;
    handle(p, token);
}
|
|
|
|
// End-tag handler for the "after body" insertion mode.
// </html> switches to "after after body" (unless parsing a fragment) and, when
// source code location info is enabled, records end locations; any other end
// tag goes through tokenAfterBody.
function endTagAfterBody(p, token) {
    const HTML = html_js_1.TAG_ID.HTML;
    if (token.tagID !== HTML) {
        tokenAfterBody(p, token);
        return;
    }
    if (!p.fragmentContext) {
        p.insertionMode = InsertionMode.AFTER_AFTER_BODY;
    }
    //NOTE: <html> is never popped from the stack, so we need to update
    //the end location explicitly.
    if (!p.options.sourceCodeLocationInfo || p.openElements.tagIDs[0] !== HTML) {
        return;
    }
    p._setEndLocation(p.openElements.items[0], token);
    // Update the body element, if it doesn't have an end tag
    const bodyElement = p.openElements.items[1];
    if (!bodyElement) {
        return;
    }
    const location = p.treeAdapter.getNodeSourceCodeLocation(bodyElement);
    const endTag = location === null || location === undefined ? undefined : location.endTag;
    if (!endTag) {
        p._setEndLocation(bodyElement, token);
    }
}
|
|
|
|
// Fallback for the "after body" insertion mode: switch back to "in body" and
// let modeInBody process the token.
function tokenAfterBody(p, token) {
    const nextMode = InsertionMode.IN_BODY;
    p.insertionMode = nextMode;
    modeInBody(p, token);
}
|
|
|
|
// The "in frameset" insertion mode
|
|
|
|
//------------------------------------------------------------------
|
|
|
|
// Start-tag handler for the "in frameset" insertion mode. Tags without a rule
// here are ignored.
function startTagInFrameset(p, token) {
    const T = html_js_1.TAG_ID;
    const id = token.tagID;
    if (id === T.HTML) {
        startTagInBody(p, token);
    }
    else if (id === T.FRAMESET) {
        p._insertElement(token, html_js_1.NS.HTML);
    }
    else if (id === T.FRAME) {
        // <frame> is appended (not pushed) and its self-closing flag acknowledged.
        p._appendElement(token, html_js_1.NS.HTML);
        token.ackSelfClosing = true;
    }
    else if (id === T.NOFRAMES) {
        startTagInHead(p, token);
    }
}
|
|
|
|
// End-tag handler for the "in frameset" insertion mode. Only </frameset> is
// handled, and only while the root <html> element is not the current node.
function endTagInFrameset(p, token) {
    const FRAMESET = html_js_1.TAG_ID.FRAMESET;
    if (token.tagID !== FRAMESET || p.openElements.isRootHtmlElementCurrent()) {
        return;
    }
    p.openElements.pop();
    // Leave the frameset modes once the new current node is no longer a <frameset>
    // (never when parsing a fragment).
    if (!p.fragmentContext && p.openElements.currentTagId !== FRAMESET) {
        p.insertionMode = InsertionMode.AFTER_FRAMESET;
    }
}
|
|
|
|
// The "after frameset" insertion mode
|
|
|
|
//------------------------------------------------------------------
|
|
|
|
// Start-tag handler for the "after frameset" insertion mode: <html> goes to the
// "in body" handler, <noframes> to the "in head" handler, the rest is ignored.
function startTagAfterFrameset(p, token) {
    const id = token.tagID;
    if (id === html_js_1.TAG_ID.HTML) {
        startTagInBody(p, token);
    }
    else if (id === html_js_1.TAG_ID.NOFRAMES) {
        startTagInHead(p, token);
    }
}
|
|
|
|
// End-tag handler for the "after frameset" insertion mode: </html> moves the
// parser to "after after frameset"; every other end tag is ignored.
function endTagAfterFrameset(p, token) {
    if (token.tagID !== html_js_1.TAG_ID.HTML) {
        return;
    }
    p.insertionMode = InsertionMode.AFTER_AFTER_FRAMESET;
}
|
|
|
|
// The "after after body" insertion mode
|
|
|
|
//------------------------------------------------------------------
|
|
|
|
// Start-tag handler for the "after after body" insertion mode: <html> is
// processed by the "in body" handler, anything else by tokenAfterAfterBody.
function startTagAfterAfterBody(p, token) {
    const handle = token.tagID === html_js_1.TAG_ID.HTML ? startTagInBody : tokenAfterAfterBody;
    handle(p, token);
}
|
|
|
|
// Fallback for the "after after body" insertion mode: switch back to "in body"
// and let modeInBody process the token.
function tokenAfterAfterBody(p, token) {
    const nextMode = InsertionMode.IN_BODY;
    p.insertionMode = nextMode;
    modeInBody(p, token);
}
|
|
|
|
// The "after after frameset" insertion mode
|
|
|
|
//------------------------------------------------------------------
|
|
|
|
// Start-tag handler for the "after after frameset" insertion mode: <html> goes
// to the "in body" handler, <noframes> to the "in head" handler, the rest is
// ignored.
function startTagAfterAfterFrameset(p, token) {
    const id = token.tagID;
    if (id === html_js_1.TAG_ID.HTML) {
        startTagInBody(p, token);
    }
    else if (id === html_js_1.TAG_ID.NOFRAMES) {
        startTagInHead(p, token);
    }
}
|
|
|
|
// The rules for parsing tokens in foreign content
|
|
|
|
//------------------------------------------------------------------
|
|
|
|
// Null-character handler for foreign content: the token's characters are
// overwritten (in place) with the Unicode replacement character before the
// token is inserted.
function nullCharacterInForeignContent(p, token) {
    const replacement = unicode.REPLACEMENT_CHARACTER;
    token.chars = replacement;
    p._insertCharacters(token);
}
|
|
|
|
// Character handler for foreign content: inserts the character token and then
// clears the parser's framesetOk flag.
//   p     - parser instance; must provide _insertCharacters(token)
//   token - character token to insert
function characterInForeignContent(p, token) {
    p._insertCharacters(token);
    // Cleared only after the insertion call has returned.
    p.framesetOk = false;
}
|
2022-05-17 01:25:05 +00:00
|
|
|
// Pops open elements until the current node is either in the HTML namespace or
// is reported as an integration point by p._isIntegrationPoint.
function popUntilHtmlOrIntegrationPoint(p) {
    for (;;) {
        if (p.treeAdapter.getNamespaceURI(p.openElements.current) === html_js_1.NS.HTML) {
            return;
        }
        if (p._isIntegrationPoint(p.openElements.currentTagId, p.openElements.current)) {
            return;
        }
        p.openElements.pop();
    }
}
|
2020-12-18 22:06:30 +00:00
|
|
|
// Start-tag handler used while parsing foreign content.
// Tokens for which foreignContent.causesExit is true leave foreign content and
// are processed by the regular HTML rules. Every other token is adjusted for
// the namespace of the adjusted current element and inserted into it.
function startTagInForeignContent(p, token) {
    if (foreignContent.causesExit(token)) {
        popUntilHtmlOrIntegrationPoint(p);
        p._startTagOutsideForeignContent(token);
        return;
    }
    const adjustedCurrent = p._getAdjustedCurrentElement();
    const namespace = p.treeAdapter.getNamespaceURI(adjustedCurrent);
    switch (namespace) {
        case html_js_1.NS.MATHML:
            foreignContent.adjustTokenMathMLAttrs(token);
            break;
        case html_js_1.NS.SVG:
            foreignContent.adjustTokenSVGTagName(token);
            foreignContent.adjustTokenSVGAttrs(token);
            break;
        default:
            // No namespace-specific adjustments.
    }
    foreignContent.adjustTokenXMLAttrs(token);
    // Self-closing tags are appended without being pushed onto the stack.
    if (token.selfClosing) {
        p._appendElement(token, namespace);
    }
    else {
        p._insertElement(token, namespace);
    }
    token.ackSelfClosing = true;
}
|
|
|
|
// End-tag handler used while parsing foreign content.
// </p> and </br> leave foreign content and are processed by the regular rules.
// Otherwise the stack is walked from the top down to (but excluding) index 0:
// the first HTML-namespace element hands the token to the regular rules, and
// the first element whose lower-cased tag name equals token.tagName has the
// stack shortened to its index.
function endTagInForeignContent(p, token) {
    const T = html_js_1.TAG_ID;
    if (token.tagID === T.P || token.tagID === T.BR) {
        popUntilHtmlOrIntegrationPoint(p);
        p._endTagOutsideForeignContent(token);
        return;
    }
    let i = p.openElements.stackTop;
    while (i > 0) {
        const node = p.openElements.items[i];
        if (p.treeAdapter.getNamespaceURI(node) === html_js_1.NS.HTML) {
            p._endTagOutsideForeignContent(token);
            return;
        }
        const nodeTagName = p.treeAdapter.getTagName(node);
        if (nodeTagName.toLowerCase() === token.tagName) {
            //NOTE: update the token tag name for `_setEndLocation`.
            token.tagName = nodeTagName;
            p.openElements.shortenToLength(i);
            return;
        }
        i--;
    }
}
|
|
|
|
|
2022-05-17 01:25:05 +00:00
|
|
|
},{"../common/doctype.js":1,"../common/error-codes.js":2,"../common/foreign-content.js":3,"../common/html.js":4,"../common/token.js":5,"../common/unicode.js":6,"../tokenizer/index.js":12,"../tree-adapters/default.js":14,"./formatting-element-list.js":8,"./open-element-stack.js":10}],10:[function(require,module,exports){
|
|
|
|
"use strict";
|
|
|
|
Object.defineProperty(exports, "__esModule", { value: true });
|
|
|
|
exports.OpenElementStack = void 0;
|
|
|
|
const html_js_1 = require("../common/html.js");
|
2020-12-18 22:06:30 +00:00
|
|
|
//Element utils
|
2022-05-17 01:25:05 +00:00
|
|
|
//Tag IDs in the basic implicit-end-tag set.
//NOTE(review): the consumers of the two IMPLICIT_END_TAG sets are not visible in this part of the file.
const IMPLICIT_END_TAG_REQUIRED = new Set([
    html_js_1.TAG_ID.DD,
    html_js_1.TAG_ID.DT,
    html_js_1.TAG_ID.LI,
    html_js_1.TAG_ID.OPTGROUP,
    html_js_1.TAG_ID.OPTION,
    html_js_1.TAG_ID.P,
    html_js_1.TAG_ID.RB,
    html_js_1.TAG_ID.RP,
    html_js_1.TAG_ID.RT,
    html_js_1.TAG_ID.RTC,
]);
//The basic set extended with the table structure tags.
const IMPLICIT_END_TAG_REQUIRED_THOROUGHLY = new Set(IMPLICIT_END_TAG_REQUIRED);
for (const tableTagId of [
    html_js_1.TAG_ID.CAPTION,
    html_js_1.TAG_ID.COLGROUP,
    html_js_1.TAG_ID.TBODY,
    html_js_1.TAG_ID.TD,
    html_js_1.TAG_ID.TFOOT,
    html_js_1.TAG_ID.TH,
    html_js_1.TAG_ID.THEAD,
    html_js_1.TAG_ID.TR,
]) {
    IMPLICIT_END_TAG_REQUIRED_THOROUGHLY.add(tableTagId);
}
//Maps a tag ID to the namespace in which an element with that tag ends a scope search.
const SCOPING_ELEMENT_NS = new Map()
    //HTML namespace
    .set(html_js_1.TAG_ID.APPLET, html_js_1.NS.HTML)
    .set(html_js_1.TAG_ID.CAPTION, html_js_1.NS.HTML)
    .set(html_js_1.TAG_ID.HTML, html_js_1.NS.HTML)
    .set(html_js_1.TAG_ID.MARQUEE, html_js_1.NS.HTML)
    .set(html_js_1.TAG_ID.OBJECT, html_js_1.NS.HTML)
    .set(html_js_1.TAG_ID.TABLE, html_js_1.NS.HTML)
    .set(html_js_1.TAG_ID.TD, html_js_1.NS.HTML)
    .set(html_js_1.TAG_ID.TEMPLATE, html_js_1.NS.HTML)
    .set(html_js_1.TAG_ID.TH, html_js_1.NS.HTML)
    //MathML namespace
    .set(html_js_1.TAG_ID.ANNOTATION_XML, html_js_1.NS.MATHML)
    .set(html_js_1.TAG_ID.MI, html_js_1.NS.MATHML)
    .set(html_js_1.TAG_ID.MN, html_js_1.NS.MATHML)
    .set(html_js_1.TAG_ID.MO, html_js_1.NS.MATHML)
    .set(html_js_1.TAG_ID.MS, html_js_1.NS.MATHML)
    .set(html_js_1.TAG_ID.MTEXT, html_js_1.NS.MATHML)
    //SVG namespace
    .set(html_js_1.TAG_ID.DESC, html_js_1.NS.SVG)
    .set(html_js_1.TAG_ID.FOREIGN_OBJECT, html_js_1.NS.SVG)
    .set(html_js_1.TAG_ID.TITLE, html_js_1.NS.SVG);
//Tag ID lists handed to popUntilPopped / clearBackTo by the stack methods below.
const NAMED_HEADERS = [
    html_js_1.TAG_ID.H1,
    html_js_1.TAG_ID.H2,
    html_js_1.TAG_ID.H3,
    html_js_1.TAG_ID.H4,
    html_js_1.TAG_ID.H5,
    html_js_1.TAG_ID.H6,
];
const TABLE_ROW_CONTEXT = [
    html_js_1.TAG_ID.TR,
    html_js_1.TAG_ID.TEMPLATE,
    html_js_1.TAG_ID.HTML,
];
const TABLE_BODY_CONTEXT = [
    html_js_1.TAG_ID.TBODY,
    html_js_1.TAG_ID.TFOOT,
    html_js_1.TAG_ID.THEAD,
    html_js_1.TAG_ID.TEMPLATE,
    html_js_1.TAG_ID.HTML,
];
const TABLE_CONTEXT = [
    html_js_1.TAG_ID.TABLE,
    html_js_1.TAG_ID.TEMPLATE,
    html_js_1.TAG_ID.HTML,
];
const TABLE_CELLS = [
    html_js_1.TAG_ID.TD,
    html_js_1.TAG_ID.TH,
];
|
2020-12-18 22:06:30 +00:00
|
|
|
//Stack of open elements
|
|
|
|
class OpenElementStack {
|
2022-05-17 01:25:05 +00:00
|
|
|
constructor(document, treeAdapter, handler) {
|
|
|
|
this.treeAdapter = treeAdapter;
|
|
|
|
this.handler = handler;
|
2020-12-18 22:06:30 +00:00
|
|
|
this.items = [];
|
2022-05-17 01:25:05 +00:00
|
|
|
this.tagIDs = [];
|
|
|
|
this.stackTop = -1;
|
2020-12-18 22:06:30 +00:00
|
|
|
this.tmplCount = 0;
|
2022-05-17 01:25:05 +00:00
|
|
|
this.currentTagId = html_js_1.TAG_ID.UNKNOWN;
|
|
|
|
this.current = document;
|
|
|
|
}
|
|
|
|
get currentTmplContentOrNode() {
|
|
|
|
return this._isInTemplate() ? this.treeAdapter.getTemplateContent(this.current) : this.current;
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
//Index of element
|
|
|
|
_indexOf(element) {
|
2022-05-17 01:25:05 +00:00
|
|
|
return this.items.lastIndexOf(element, this.stackTop);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
//Current element state
|
|
|
|
_isInTemplate() {
|
2022-05-17 01:25:05 +00:00
|
|
|
return this.currentTagId === html_js_1.TAG_ID.TEMPLATE && this.treeAdapter.getNamespaceURI(this.current) === html_js_1.NS.HTML;
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
_updateCurrentElement() {
|
|
|
|
this.current = this.items[this.stackTop];
|
2022-05-17 01:25:05 +00:00
|
|
|
this.currentTagId = this.tagIDs[this.stackTop];
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
//Mutations
|
2022-05-17 01:25:05 +00:00
|
|
|
push(element, tagID) {
|
|
|
|
this.stackTop++;
|
|
|
|
this.items[this.stackTop] = element;
|
|
|
|
this.current = element;
|
|
|
|
this.tagIDs[this.stackTop] = tagID;
|
|
|
|
this.currentTagId = tagID;
|
2020-12-18 22:06:30 +00:00
|
|
|
if (this._isInTemplate()) {
|
|
|
|
this.tmplCount++;
|
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
this.handler.onItemPush(element, tagID, true);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
pop() {
|
2022-05-17 01:25:05 +00:00
|
|
|
const popped = this.current;
|
2020-12-18 22:06:30 +00:00
|
|
|
if (this.tmplCount > 0 && this._isInTemplate()) {
|
|
|
|
this.tmplCount--;
|
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
this.stackTop--;
|
2020-12-18 22:06:30 +00:00
|
|
|
this._updateCurrentElement();
|
2022-05-17 01:25:05 +00:00
|
|
|
this.handler.onItemPop(popped, true);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
replace(oldElement, newElement) {
|
|
|
|
const idx = this._indexOf(oldElement);
|
|
|
|
this.items[idx] = newElement;
|
|
|
|
if (idx === this.stackTop) {
|
2022-05-17 01:25:05 +00:00
|
|
|
this.current = newElement;
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
insertAfter(referenceElement, newElement, newElementID) {
|
2020-12-18 22:06:30 +00:00
|
|
|
const insertionIdx = this._indexOf(referenceElement) + 1;
|
|
|
|
this.items.splice(insertionIdx, 0, newElement);
|
2022-05-17 01:25:05 +00:00
|
|
|
this.tagIDs.splice(insertionIdx, 0, newElementID);
|
|
|
|
this.stackTop++;
|
|
|
|
if (insertionIdx === this.stackTop) {
|
2020-12-18 22:06:30 +00:00
|
|
|
this._updateCurrentElement();
|
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
this.handler.onItemPush(this.current, this.currentTagId, insertionIdx === this.stackTop);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
popUntilTagNamePopped(tagName) {
|
2022-05-17 01:25:05 +00:00
|
|
|
let targetIdx = this.stackTop + 1;
|
|
|
|
do {
|
|
|
|
targetIdx = this.tagIDs.lastIndexOf(tagName, targetIdx - 1);
|
|
|
|
} while (targetIdx > 0 && this.treeAdapter.getNamespaceURI(this.items[targetIdx]) !== html_js_1.NS.HTML);
|
|
|
|
this.shortenToLength(targetIdx < 0 ? 0 : targetIdx);
|
|
|
|
}
|
|
|
|
shortenToLength(idx) {
|
|
|
|
while (this.stackTop >= idx) {
|
|
|
|
const popped = this.current;
|
|
|
|
if (this.tmplCount > 0 && this._isInTemplate()) {
|
|
|
|
this.tmplCount -= 1;
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
this.stackTop--;
|
|
|
|
this._updateCurrentElement();
|
|
|
|
this.handler.onItemPop(popped, this.stackTop < idx);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
popUntilElementPopped(element) {
|
2022-05-17 01:25:05 +00:00
|
|
|
const idx = this._indexOf(element);
|
|
|
|
this.shortenToLength(idx < 0 ? 0 : idx);
|
|
|
|
}
|
|
|
|
popUntilPopped(tagNames, targetNS) {
|
|
|
|
const idx = this._indexOfTagNames(tagNames, targetNS);
|
|
|
|
this.shortenToLength(idx < 0 ? 0 : idx);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
popUntilNumberedHeaderPopped() {
|
2022-05-17 01:25:05 +00:00
|
|
|
this.popUntilPopped(NAMED_HEADERS, html_js_1.NS.HTML);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
popUntilTableCellPopped() {
|
2022-05-17 01:25:05 +00:00
|
|
|
this.popUntilPopped(TABLE_CELLS, html_js_1.NS.HTML);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
popAllUpToHtmlElement() {
|
2022-05-17 01:25:05 +00:00
|
|
|
//NOTE: here we assume that the root <html> element is always first in the open element stack, so
|
2020-12-18 22:06:30 +00:00
|
|
|
//we perform this fast stack clean up.
|
2022-05-17 01:25:05 +00:00
|
|
|
this.tmplCount = 0;
|
|
|
|
this.shortenToLength(1);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
_indexOfTagNames(tagNames, namespace) {
|
|
|
|
for (let i = this.stackTop; i >= 0; i--) {
|
|
|
|
if (tagNames.includes(this.tagIDs[i]) && this.treeAdapter.getNamespaceURI(this.items[i]) === namespace) {
|
|
|
|
return i;
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
clearBackTo(tagNames, targetNS) {
|
|
|
|
const idx = this._indexOfTagNames(tagNames, targetNS);
|
|
|
|
this.shortenToLength(idx + 1);
|
|
|
|
}
|
|
|
|
clearBackToTableContext() {
|
|
|
|
this.clearBackTo(TABLE_CONTEXT, html_js_1.NS.HTML);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
clearBackToTableBodyContext() {
|
2022-05-17 01:25:05 +00:00
|
|
|
this.clearBackTo(TABLE_BODY_CONTEXT, html_js_1.NS.HTML);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
clearBackToTableRowContext() {
|
2022-05-17 01:25:05 +00:00
|
|
|
this.clearBackTo(TABLE_ROW_CONTEXT, html_js_1.NS.HTML);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
remove(element) {
|
2022-05-17 01:25:05 +00:00
|
|
|
const idx = this._indexOf(element);
|
|
|
|
if (idx >= 0) {
|
|
|
|
if (idx === this.stackTop) {
|
|
|
|
this.pop();
|
|
|
|
}
|
|
|
|
else {
|
|
|
|
this.items.splice(idx, 1);
|
|
|
|
this.tagIDs.splice(idx, 1);
|
2020-12-18 22:06:30 +00:00
|
|
|
this.stackTop--;
|
|
|
|
this._updateCurrentElement();
|
2022-05-17 01:25:05 +00:00
|
|
|
this.handler.onItemPop(element, false);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
//Search
|
|
|
|
tryPeekProperlyNestedBodyElement() {
|
|
|
|
//Properly nested <body> element (should be second element in stack).
|
2022-05-17 01:25:05 +00:00
|
|
|
return this.stackTop >= 1 && this.tagIDs[1] === html_js_1.TAG_ID.BODY ? this.items[1] : null;
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
contains(element) {
|
|
|
|
return this._indexOf(element) > -1;
|
|
|
|
}
|
|
|
|
getCommonAncestor(element) {
|
2022-05-17 01:25:05 +00:00
|
|
|
const elementIdx = this._indexOf(element) - 1;
|
|
|
|
return elementIdx >= 0 ? this.items[elementIdx] : null;
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
isRootHtmlElementCurrent() {
|
2022-05-17 01:25:05 +00:00
|
|
|
return this.stackTop === 0 && this.tagIDs[0] === html_js_1.TAG_ID.HTML;
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
//Element in scope
|
|
|
|
hasInScope(tagName) {
|
|
|
|
for (let i = this.stackTop; i >= 0; i--) {
|
2022-05-17 01:25:05 +00:00
|
|
|
const tn = this.tagIDs[i];
|
2020-12-18 22:06:30 +00:00
|
|
|
const ns = this.treeAdapter.getNamespaceURI(this.items[i]);
|
2022-05-17 01:25:05 +00:00
|
|
|
if (tn === tagName && ns === html_js_1.NS.HTML) {
|
2020-12-18 22:06:30 +00:00
|
|
|
return true;
|
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
if (SCOPING_ELEMENT_NS.get(tn) === ns) {
|
2020-12-18 22:06:30 +00:00
|
|
|
return false;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
hasNumberedHeaderInScope() {
|
|
|
|
for (let i = this.stackTop; i >= 0; i--) {
|
2022-05-17 01:25:05 +00:00
|
|
|
const tn = this.tagIDs[i];
|
2020-12-18 22:06:30 +00:00
|
|
|
const ns = this.treeAdapter.getNamespaceURI(this.items[i]);
|
2022-05-17 01:25:05 +00:00
|
|
|
if ((0, html_js_1.isNumberedHeader)(tn) && ns === html_js_1.NS.HTML) {
|
2020-12-18 22:06:30 +00:00
|
|
|
return true;
|
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
if (SCOPING_ELEMENT_NS.get(tn) === ns) {
|
2020-12-18 22:06:30 +00:00
|
|
|
return false;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
hasInListItemScope(tagName) {
|
|
|
|
for (let i = this.stackTop; i >= 0; i--) {
|
2022-05-17 01:25:05 +00:00
|
|
|
const tn = this.tagIDs[i];
|
2020-12-18 22:06:30 +00:00
|
|
|
const ns = this.treeAdapter.getNamespaceURI(this.items[i]);
|
2022-05-17 01:25:05 +00:00
|
|
|
if (tn === tagName && ns === html_js_1.NS.HTML) {
|
2020-12-18 22:06:30 +00:00
|
|
|
return true;
|
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
if (((tn === html_js_1.TAG_ID.UL || tn === html_js_1.TAG_ID.OL) && ns === html_js_1.NS.HTML) || SCOPING_ELEMENT_NS.get(tn) === ns) {
|
2020-12-18 22:06:30 +00:00
|
|
|
return false;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
hasInButtonScope(tagName) {
|
|
|
|
for (let i = this.stackTop; i >= 0; i--) {
|
2022-05-17 01:25:05 +00:00
|
|
|
const tn = this.tagIDs[i];
|
2020-12-18 22:06:30 +00:00
|
|
|
const ns = this.treeAdapter.getNamespaceURI(this.items[i]);
|
2022-05-17 01:25:05 +00:00
|
|
|
if (tn === tagName && ns === html_js_1.NS.HTML) {
|
2020-12-18 22:06:30 +00:00
|
|
|
return true;
|
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
if ((tn === html_js_1.TAG_ID.BUTTON && ns === html_js_1.NS.HTML) || SCOPING_ELEMENT_NS.get(tn) === ns) {
|
2020-12-18 22:06:30 +00:00
|
|
|
return false;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
hasInTableScope(tagName) {
|
|
|
|
for (let i = this.stackTop; i >= 0; i--) {
|
2022-05-17 01:25:05 +00:00
|
|
|
const tn = this.tagIDs[i];
|
2020-12-18 22:06:30 +00:00
|
|
|
const ns = this.treeAdapter.getNamespaceURI(this.items[i]);
|
2022-05-17 01:25:05 +00:00
|
|
|
if (ns !== html_js_1.NS.HTML) {
|
2020-12-18 22:06:30 +00:00
|
|
|
continue;
|
|
|
|
}
|
|
|
|
if (tn === tagName) {
|
|
|
|
return true;
|
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
if (tn === html_js_1.TAG_ID.TABLE || tn === html_js_1.TAG_ID.TEMPLATE || tn === html_js_1.TAG_ID.HTML) {
|
2020-12-18 22:06:30 +00:00
|
|
|
return false;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
hasTableBodyContextInTableScope() {
|
|
|
|
for (let i = this.stackTop; i >= 0; i--) {
|
2022-05-17 01:25:05 +00:00
|
|
|
const tn = this.tagIDs[i];
|
2020-12-18 22:06:30 +00:00
|
|
|
const ns = this.treeAdapter.getNamespaceURI(this.items[i]);
|
2022-05-17 01:25:05 +00:00
|
|
|
if (ns !== html_js_1.NS.HTML) {
|
2020-12-18 22:06:30 +00:00
|
|
|
continue;
|
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
if (tn === html_js_1.TAG_ID.TBODY || tn === html_js_1.TAG_ID.THEAD || tn === html_js_1.TAG_ID.TFOOT) {
|
2020-12-18 22:06:30 +00:00
|
|
|
return true;
|
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
if (tn === html_js_1.TAG_ID.TABLE || tn === html_js_1.TAG_ID.HTML) {
|
2020-12-18 22:06:30 +00:00
|
|
|
return false;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
hasInSelectScope(tagName) {
|
|
|
|
for (let i = this.stackTop; i >= 0; i--) {
|
2022-05-17 01:25:05 +00:00
|
|
|
const tn = this.tagIDs[i];
|
2020-12-18 22:06:30 +00:00
|
|
|
const ns = this.treeAdapter.getNamespaceURI(this.items[i]);
|
2022-05-17 01:25:05 +00:00
|
|
|
if (ns !== html_js_1.NS.HTML) {
|
2020-12-18 22:06:30 +00:00
|
|
|
continue;
|
|
|
|
}
|
|
|
|
if (tn === tagName) {
|
|
|
|
return true;
|
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
if (tn !== html_js_1.TAG_ID.OPTION && tn !== html_js_1.TAG_ID.OPTGROUP) {
|
2020-12-18 22:06:30 +00:00
|
|
|
return false;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
//Implied end tags
|
|
|
|
generateImpliedEndTags() {
|
2022-05-17 01:25:05 +00:00
|
|
|
while (IMPLICIT_END_TAG_REQUIRED.has(this.currentTagId)) {
|
2020-12-18 22:06:30 +00:00
|
|
|
this.pop();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
generateImpliedEndTagsThoroughly() {
|
2022-05-17 01:25:05 +00:00
|
|
|
while (IMPLICIT_END_TAG_REQUIRED_THOROUGHLY.has(this.currentTagId)) {
|
2020-12-18 22:06:30 +00:00
|
|
|
this.pop();
|
|
|
|
}
|
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
generateImpliedEndTagsWithExclusion(exclusionId) {
|
|
|
|
while (this.currentTagId !== exclusionId && IMPLICIT_END_TAG_REQUIRED_THOROUGHLY.has(this.currentTagId)) {
|
2020-12-18 22:06:30 +00:00
|
|
|
this.pop();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
exports.OpenElementStack = OpenElementStack;
|
|
|
|
|
|
|
|
},{"../common/html.js":4}],11:[function(require,module,exports){
|
|
|
|
"use strict";
|
|
|
|
Object.defineProperty(exports, "__esModule", { value: true });
|
|
|
|
exports.serializeOuter = exports.serialize = void 0;
|
|
|
|
const html_js_1 = require("../common/html.js");
|
|
|
|
const escape_js_1 = require("entities/lib/escape.js");
|
|
|
|
const default_js_1 = require("../tree-adapters/default.js");
|
|
|
|
// Sets
|
|
|
|
// Tag names that `isVoidElement` treats as void; such elements are serialized
// without children or a closing tag.
const VOID_ELEMENTS = new Set([
    html_js_1.TAG_NAMES.AREA,
    html_js_1.TAG_NAMES.BASE,
    html_js_1.TAG_NAMES.BASEFONT,
    html_js_1.TAG_NAMES.BGSOUND,
    html_js_1.TAG_NAMES.BR,
    html_js_1.TAG_NAMES.COL,
    html_js_1.TAG_NAMES.EMBED,
    html_js_1.TAG_NAMES.FRAME,
    html_js_1.TAG_NAMES.HR,
    html_js_1.TAG_NAMES.IMG,
    html_js_1.TAG_NAMES.INPUT,
    html_js_1.TAG_NAMES.KEYGEN,
    html_js_1.TAG_NAMES.LINK,
    html_js_1.TAG_NAMES.META,
    html_js_1.TAG_NAMES.PARAM,
    html_js_1.TAG_NAMES.SOURCE,
    html_js_1.TAG_NAMES.TRACK,
    html_js_1.TAG_NAMES.WBR,
]);
|
|
|
|
/**
 * Reports whether `node` is an element in the HTML namespace whose tag name is
 * listed in `VOID_ELEMENTS`.
 *
 * @param node Node to inspect.
 * @param options Serializer options; only `options.treeAdapter` is used.
 */
function isVoidElement(node, options) {
    const { treeAdapter } = options;
    return (treeAdapter.isElementNode(node) &&
        treeAdapter.getNamespaceURI(node) === html_js_1.NS.HTML &&
        VOID_ELEMENTS.has(treeAdapter.getTagName(node)));
}
|
|
|
|
// Defaults merged underneath caller-supplied options by `serialize` and `serializeOuter`.
const defaultOpts = { treeAdapter: default_js_1.defaultTreeAdapter, scriptingEnabled: true };
|
|
|
|
/**
 * Serializes an AST node to an HTML string.
 *
 * Only the node's children are serialized; a void element therefore yields an
 * empty string.
 *
 * @example
 *
 * ```js
 * const parse5 = require('parse5');
 *
 * const document = parse5.parse('<!DOCTYPE html><html><head></head><body>Hi there!</body></html>');
 *
 * // Serializes a document.
 * const html = parse5.serialize(document);
 *
 * // Serializes the <html> element content.
 * const str = parse5.serialize(document.childNodes[1]);
 *
 * console.log(str); //> '<head></head><body>Hi there!</body>'
 * ```
 *
 * @param node Node to serialize.
 * @param options Serialization options; merged over `defaultOpts`.
 */
function serialize(node, options) {
    const opts = Object.assign(Object.assign({}, defaultOpts), options);
    if (isVoidElement(node, opts)) {
        return '';
    }
    return serializeChildNodes(node, opts);
}
|
|
|
|
exports.serialize = serialize;
|
|
|
|
/**
 * Serializes an AST element node to an HTML string, including the element node.
 *
 * @example
 *
 * ```js
 * const parse5 = require('parse5');
 *
 * const document = parse5.parseFragment('<div>Hello, <b>world</b>!</div>');
 *
 * // Serializes the <div> element.
 * const html = parse5.serializeOuter(document.childNodes[0]);
 *
 * console.log(html); //> '<div>Hello, <b>world</b>!</div>'
 * ```
 *
 * @param node Node to serialize.
 * @param options Serialization options; merged over `defaultOpts`.
 */
function serializeOuter(node, options) {
    const opts = Object.assign(Object.assign({}, defaultOpts), options);
    return serializeNode(node, opts);
}
|
|
|
|
exports.serializeOuter = serializeOuter;
|
|
|
|
/**
 * Concatenates the serialization of every child of `parentNode`.
 *
 * For an HTML-namespace `<template>` element the children are read from its
 * template content instead of from the element itself. A falsy child list
 * yields an empty string.
 *
 * @param parentNode Node whose children are serialized.
 * @param options Resolved serializer options.
 */
function serializeChildNodes(parentNode, options) {
    const { treeAdapter } = options;
    let html = '';
    // Get container of the child nodes
    const isHtmlTemplate = treeAdapter.isElementNode(parentNode) &&
        treeAdapter.getTagName(parentNode) === html_js_1.TAG_NAMES.TEMPLATE &&
        treeAdapter.getNamespaceURI(parentNode) === html_js_1.NS.HTML;
    const container = isHtmlTemplate ? treeAdapter.getTemplateContent(parentNode) : parentNode;
    const childNodes = treeAdapter.getChildNodes(container);
    if (childNodes) {
        for (const currentNode of childNodes) {
            html += serializeNode(currentNode, options);
        }
    }
    return html;
}
|
|
|
|
/**
 * Dispatches `node` to the serializer matching its kind, checking in order:
 * element, text, comment, document type.
 *
 * @param node Node to serialize.
 * @param options Resolved serializer options.
 * @returns The serialized markup, or an empty string for unknown node kinds.
 */
function serializeNode(node, options) {
    const { treeAdapter } = options;
    if (treeAdapter.isElementNode(node)) {
        return serializeElement(node, options);
    }
    if (treeAdapter.isTextNode(node)) {
        return serializeTextNode(node, options);
    }
    if (treeAdapter.isCommentNode(node)) {
        return serializeCommentNode(node, options);
    }
    if (treeAdapter.isDocumentTypeNode(node)) {
        return serializeDocumentTypeNode(node, options);
    }
    // Return an empty string for unknown nodes
    return '';
}
|
|
|
|
/**
 * Serializes an element: start tag with attributes, then (unless the element
 * is void) its children followed by the end tag.
 *
 * @param node Element node to serialize.
 * @param options Resolved serializer options.
 */
function serializeElement(node, options) {
    const tn = options.treeAdapter.getTagName(node);
    const startTag = `<${tn}${serializeAttributes(node, options)}>`;
    if (isVoidElement(node, options)) {
        return startTag;
    }
    return `${startTag}${serializeChildNodes(node, options)}</${tn}>`;
}
|
|
|
|
/**
 * Serializes the attribute list of `node`. Each attribute is emitted as a
 * leading space, a qualified name, and the value escaped with `escapeAttribute`
 * inside double quotes.
 *
 * Name qualification:
 * - no namespace: the bare name;
 * - XML namespace: `xml:` prefix;
 * - XMLNS namespace: `xmlns:` prefix, except for the attribute named `xmlns`;
 * - XLINK namespace: `xlink:` prefix;
 * - any other namespace: the attribute's own `prefix`.
 *
 * @param node Element whose attributes are serialized.
 * @param options Serializer options; only `treeAdapter` is used.
 */
function serializeAttributes(node, { treeAdapter }) {
    let html = '';
    for (const attr of treeAdapter.getAttrList(node)) {
        html += ' ';
        if (!attr.namespace) {
            html += attr.name;
        }
        else {
            switch (attr.namespace) {
                case html_js_1.NS.XML: {
                    html += `xml:${attr.name}`;
                    break;
                }
                case html_js_1.NS.XMLNS: {
                    if (attr.name !== 'xmlns') {
                        html += 'xmlns:';
                    }
                    html += attr.name;
                    break;
                }
                case html_js_1.NS.XLINK: {
                    html += `xlink:${attr.name}`;
                    break;
                }
                default: {
                    html += `${attr.prefix}:${attr.name}`;
                }
            }
        }
        html += `="${(0, escape_js_1.escapeAttribute)(attr.value)}"`;
    }
    return html;
}
|
|
|
|
/**
 * Serializes a text node. The content is emitted verbatim when the parent is
 * an HTML-namespace element for which `hasUnescapedText` (given the
 * `scriptingEnabled` option) is true; otherwise it goes through `escapeText`.
 *
 * @param node Text node to serialize.
 * @param options Resolved serializer options.
 */
function serializeTextNode(node, options) {
    const { treeAdapter } = options;
    const content = treeAdapter.getTextNodeContent(node);
    const parent = treeAdapter.getParentNode(node);
    // Falsy when there is no parent or the parent is not an element.
    const parentTn = parent && treeAdapter.isElementNode(parent) && treeAdapter.getTagName(parent);
    const isRawText = parentTn &&
        treeAdapter.getNamespaceURI(parent) === html_js_1.NS.HTML &&
        (0, html_js_1.hasUnescapedText)(parentTn, options.scriptingEnabled);
    return isRawText ? content : (0, escape_js_1.escapeText)(content);
}
|
|
|
|
/**
 * Wraps the comment node's content, unescaped, in `<!--` and `-->`.
 *
 * @param node Comment node to serialize.
 * @param options Serializer options; only `treeAdapter` is used.
 */
function serializeCommentNode(node, { treeAdapter }) {
    return `<!--${treeAdapter.getCommentNodeContent(node)}-->`;
}
|
|
|
|
/**
 * Emits `<!DOCTYPE name>` using only the document type's name; public and
 * system identifiers are not written.
 *
 * @param node Document type node to serialize.
 * @param options Serializer options; only `treeAdapter` is used.
 */
function serializeDocumentTypeNode(node, { treeAdapter }) {
    return `<!DOCTYPE ${treeAdapter.getDocumentTypeNodeName(node)}>`;
}
|
|
|
|
|
|
|
|
},{"../common/html.js":4,"../tree-adapters/default.js":14,"entities/lib/escape.js":17}],12:[function(require,module,exports){
|
|
|
|
"use strict";
|
|
|
|
Object.defineProperty(exports, "__esModule", { value: true });
|
|
|
|
exports.Tokenizer = exports.TokenizerMode = void 0;
|
|
|
|
const preprocessor_js_1 = require("./preprocessor.js");
|
|
|
|
const unicode_js_1 = require("../common/unicode.js");
|
|
|
|
const token_js_1 = require("../common/token.js");
|
|
|
|
const decode_js_1 = require("entities/lib/decode.js");
|
|
|
|
const error_codes_js_1 = require("../common/error-codes.js");
|
|
|
|
const html_js_1 = require("../common/html.js");
|
2020-12-18 22:06:30 +00:00
|
|
|
//C1 Unicode control character reference replacements
|
2022-05-17 01:25:05 +00:00
|
|
|
// Maps code points in the 0x80-0x9F range to their replacement code points.
// 0x81, 0x8D, 0x8F, 0x90 and 0x9D deliberately have no entry.
const C1_CONTROLS_REFERENCE_REPLACEMENTS = new Map([
    [0x80, 8364],
    [0x82, 8218],
    [0x83, 402],
    [0x84, 8222],
    [0x85, 8230],
    [0x86, 8224],
    [0x87, 8225],
    [0x88, 710],
    [0x89, 8240],
    [0x8a, 352],
    [0x8b, 8249],
    [0x8c, 338],
    [0x8e, 381],
    [0x91, 8216],
    [0x92, 8217],
    [0x93, 8220],
    [0x94, 8221],
    [0x95, 8226],
    [0x96, 8211],
    [0x97, 8212],
    [0x98, 732],
    [0x99, 8482],
    [0x9a, 353],
    [0x9b, 8250],
    [0x9c, 339],
    [0x9e, 382],
    [0x9f, 376],
]);
|
2020-12-18 22:06:30 +00:00
|
|
|
//States
|
2022-05-17 01:25:05 +00:00
|
|
|
// Tokenizer state enum with a two-way mapping: `State.NAME` gives the number
// and `State[number]` gives the name. The "HEXADEMICAL" spelling is kept
// because the identifiers are referenced elsewhere in this module.
var State;
(function (State) {
    State[State["DATA"] = 0] = "DATA";
    State[State["RCDATA"] = 1] = "RCDATA";
    State[State["RAWTEXT"] = 2] = "RAWTEXT";
    State[State["SCRIPT_DATA"] = 3] = "SCRIPT_DATA";
    State[State["PLAINTEXT"] = 4] = "PLAINTEXT";
    State[State["TAG_OPEN"] = 5] = "TAG_OPEN";
    State[State["END_TAG_OPEN"] = 6] = "END_TAG_OPEN";
    State[State["TAG_NAME"] = 7] = "TAG_NAME";
    State[State["RCDATA_LESS_THAN_SIGN"] = 8] = "RCDATA_LESS_THAN_SIGN";
    State[State["RCDATA_END_TAG_OPEN"] = 9] = "RCDATA_END_TAG_OPEN";
    State[State["RCDATA_END_TAG_NAME"] = 10] = "RCDATA_END_TAG_NAME";
    State[State["RAWTEXT_LESS_THAN_SIGN"] = 11] = "RAWTEXT_LESS_THAN_SIGN";
    State[State["RAWTEXT_END_TAG_OPEN"] = 12] = "RAWTEXT_END_TAG_OPEN";
    State[State["RAWTEXT_END_TAG_NAME"] = 13] = "RAWTEXT_END_TAG_NAME";
    State[State["SCRIPT_DATA_LESS_THAN_SIGN"] = 14] = "SCRIPT_DATA_LESS_THAN_SIGN";
    State[State["SCRIPT_DATA_END_TAG_OPEN"] = 15] = "SCRIPT_DATA_END_TAG_OPEN";
    State[State["SCRIPT_DATA_END_TAG_NAME"] = 16] = "SCRIPT_DATA_END_TAG_NAME";
    State[State["SCRIPT_DATA_ESCAPE_START"] = 17] = "SCRIPT_DATA_ESCAPE_START";
    State[State["SCRIPT_DATA_ESCAPE_START_DASH"] = 18] = "SCRIPT_DATA_ESCAPE_START_DASH";
    State[State["SCRIPT_DATA_ESCAPED"] = 19] = "SCRIPT_DATA_ESCAPED";
    State[State["SCRIPT_DATA_ESCAPED_DASH"] = 20] = "SCRIPT_DATA_ESCAPED_DASH";
    State[State["SCRIPT_DATA_ESCAPED_DASH_DASH"] = 21] = "SCRIPT_DATA_ESCAPED_DASH_DASH";
    State[State["SCRIPT_DATA_ESCAPED_LESS_THAN_SIGN"] = 22] = "SCRIPT_DATA_ESCAPED_LESS_THAN_SIGN";
    State[State["SCRIPT_DATA_ESCAPED_END_TAG_OPEN"] = 23] = "SCRIPT_DATA_ESCAPED_END_TAG_OPEN";
    State[State["SCRIPT_DATA_ESCAPED_END_TAG_NAME"] = 24] = "SCRIPT_DATA_ESCAPED_END_TAG_NAME";
    State[State["SCRIPT_DATA_DOUBLE_ESCAPE_START"] = 25] = "SCRIPT_DATA_DOUBLE_ESCAPE_START";
    State[State["SCRIPT_DATA_DOUBLE_ESCAPED"] = 26] = "SCRIPT_DATA_DOUBLE_ESCAPED";
    State[State["SCRIPT_DATA_DOUBLE_ESCAPED_DASH"] = 27] = "SCRIPT_DATA_DOUBLE_ESCAPED_DASH";
    State[State["SCRIPT_DATA_DOUBLE_ESCAPED_DASH_DASH"] = 28] = "SCRIPT_DATA_DOUBLE_ESCAPED_DASH_DASH";
    State[State["SCRIPT_DATA_DOUBLE_ESCAPED_LESS_THAN_SIGN"] = 29] = "SCRIPT_DATA_DOUBLE_ESCAPED_LESS_THAN_SIGN";
    State[State["SCRIPT_DATA_DOUBLE_ESCAPE_END"] = 30] = "SCRIPT_DATA_DOUBLE_ESCAPE_END";
    State[State["BEFORE_ATTRIBUTE_NAME"] = 31] = "BEFORE_ATTRIBUTE_NAME";
    State[State["ATTRIBUTE_NAME"] = 32] = "ATTRIBUTE_NAME";
    State[State["AFTER_ATTRIBUTE_NAME"] = 33] = "AFTER_ATTRIBUTE_NAME";
    State[State["BEFORE_ATTRIBUTE_VALUE"] = 34] = "BEFORE_ATTRIBUTE_VALUE";
    State[State["ATTRIBUTE_VALUE_DOUBLE_QUOTED"] = 35] = "ATTRIBUTE_VALUE_DOUBLE_QUOTED";
    State[State["ATTRIBUTE_VALUE_SINGLE_QUOTED"] = 36] = "ATTRIBUTE_VALUE_SINGLE_QUOTED";
    State[State["ATTRIBUTE_VALUE_UNQUOTED"] = 37] = "ATTRIBUTE_VALUE_UNQUOTED";
    State[State["AFTER_ATTRIBUTE_VALUE_QUOTED"] = 38] = "AFTER_ATTRIBUTE_VALUE_QUOTED";
    State[State["SELF_CLOSING_START_TAG"] = 39] = "SELF_CLOSING_START_TAG";
    State[State["BOGUS_COMMENT"] = 40] = "BOGUS_COMMENT";
    State[State["MARKUP_DECLARATION_OPEN"] = 41] = "MARKUP_DECLARATION_OPEN";
    State[State["COMMENT_START"] = 42] = "COMMENT_START";
    State[State["COMMENT_START_DASH"] = 43] = "COMMENT_START_DASH";
    State[State["COMMENT"] = 44] = "COMMENT";
    State[State["COMMENT_LESS_THAN_SIGN"] = 45] = "COMMENT_LESS_THAN_SIGN";
    State[State["COMMENT_LESS_THAN_SIGN_BANG"] = 46] = "COMMENT_LESS_THAN_SIGN_BANG";
    State[State["COMMENT_LESS_THAN_SIGN_BANG_DASH"] = 47] = "COMMENT_LESS_THAN_SIGN_BANG_DASH";
    State[State["COMMENT_LESS_THAN_SIGN_BANG_DASH_DASH"] = 48] = "COMMENT_LESS_THAN_SIGN_BANG_DASH_DASH";
    State[State["COMMENT_END_DASH"] = 49] = "COMMENT_END_DASH";
    State[State["COMMENT_END"] = 50] = "COMMENT_END";
    State[State["COMMENT_END_BANG"] = 51] = "COMMENT_END_BANG";
    State[State["DOCTYPE"] = 52] = "DOCTYPE";
    State[State["BEFORE_DOCTYPE_NAME"] = 53] = "BEFORE_DOCTYPE_NAME";
    State[State["DOCTYPE_NAME"] = 54] = "DOCTYPE_NAME";
    State[State["AFTER_DOCTYPE_NAME"] = 55] = "AFTER_DOCTYPE_NAME";
    State[State["AFTER_DOCTYPE_PUBLIC_KEYWORD"] = 56] = "AFTER_DOCTYPE_PUBLIC_KEYWORD";
    State[State["BEFORE_DOCTYPE_PUBLIC_IDENTIFIER"] = 57] = "BEFORE_DOCTYPE_PUBLIC_IDENTIFIER";
    State[State["DOCTYPE_PUBLIC_IDENTIFIER_DOUBLE_QUOTED"] = 58] = "DOCTYPE_PUBLIC_IDENTIFIER_DOUBLE_QUOTED";
    State[State["DOCTYPE_PUBLIC_IDENTIFIER_SINGLE_QUOTED"] = 59] = "DOCTYPE_PUBLIC_IDENTIFIER_SINGLE_QUOTED";
    State[State["AFTER_DOCTYPE_PUBLIC_IDENTIFIER"] = 60] = "AFTER_DOCTYPE_PUBLIC_IDENTIFIER";
    State[State["BETWEEN_DOCTYPE_PUBLIC_AND_SYSTEM_IDENTIFIERS"] = 61] = "BETWEEN_DOCTYPE_PUBLIC_AND_SYSTEM_IDENTIFIERS";
    State[State["AFTER_DOCTYPE_SYSTEM_KEYWORD"] = 62] = "AFTER_DOCTYPE_SYSTEM_KEYWORD";
    State[State["BEFORE_DOCTYPE_SYSTEM_IDENTIFIER"] = 63] = "BEFORE_DOCTYPE_SYSTEM_IDENTIFIER";
    State[State["DOCTYPE_SYSTEM_IDENTIFIER_DOUBLE_QUOTED"] = 64] = "DOCTYPE_SYSTEM_IDENTIFIER_DOUBLE_QUOTED";
    State[State["DOCTYPE_SYSTEM_IDENTIFIER_SINGLE_QUOTED"] = 65] = "DOCTYPE_SYSTEM_IDENTIFIER_SINGLE_QUOTED";
    State[State["AFTER_DOCTYPE_SYSTEM_IDENTIFIER"] = 66] = "AFTER_DOCTYPE_SYSTEM_IDENTIFIER";
    State[State["BOGUS_DOCTYPE"] = 67] = "BOGUS_DOCTYPE";
    State[State["CDATA_SECTION"] = 68] = "CDATA_SECTION";
    State[State["CDATA_SECTION_BRACKET"] = 69] = "CDATA_SECTION_BRACKET";
    State[State["CDATA_SECTION_END"] = 70] = "CDATA_SECTION_END";
    State[State["CHARACTER_REFERENCE"] = 71] = "CHARACTER_REFERENCE";
    State[State["NAMED_CHARACTER_REFERENCE"] = 72] = "NAMED_CHARACTER_REFERENCE";
    State[State["AMBIGUOUS_AMPERSAND"] = 73] = "AMBIGUOUS_AMPERSAND";
    State[State["NUMERIC_CHARACTER_REFERENCE"] = 74] = "NUMERIC_CHARACTER_REFERENCE";
    State[State["HEXADEMICAL_CHARACTER_REFERENCE_START"] = 75] = "HEXADEMICAL_CHARACTER_REFERENCE_START";
    State[State["DECIMAL_CHARACTER_REFERENCE_START"] = 76] = "DECIMAL_CHARACTER_REFERENCE_START";
    State[State["HEXADEMICAL_CHARACTER_REFERENCE"] = 77] = "HEXADEMICAL_CHARACTER_REFERENCE";
    State[State["DECIMAL_CHARACTER_REFERENCE"] = 78] = "DECIMAL_CHARACTER_REFERENCE";
    State[State["NUMERIC_CHARACTER_REFERENCE_END"] = 79] = "NUMERIC_CHARACTER_REFERENCE_END";
})(State || (State = {}));
|
|
|
|
//Tokenizer initial states for different modes
|
|
|
|
exports.TokenizerMode = {
|
|
|
|
DATA: State.DATA,
|
|
|
|
RCDATA: State.RCDATA,
|
|
|
|
RAWTEXT: State.RAWTEXT,
|
|
|
|
SCRIPT_DATA: State.SCRIPT_DATA,
|
|
|
|
PLAINTEXT: State.PLAINTEXT,
|
|
|
|
CDATA_SECTION: State.CDATA_SECTION,
|
|
|
|
};
|
2020-12-18 22:06:30 +00:00
|
|
|
//Utils
|
|
|
|
//OPTIMIZATION: these utility functions should not be moved out of this module. V8 Crankshaft will not inline
//these functions if they are located in another module, due to the context switch.
//Always perform an inlining check before modifying these functions ('node --trace-inlining').
|
|
|
|
/** True when code point `cp` lies in the inclusive range `DIGIT_0`..`DIGIT_9`. */
function isAsciiDigit(cp) {
    return cp >= unicode_js_1.CODE_POINTS.DIGIT_0 && cp <= unicode_js_1.CODE_POINTS.DIGIT_9;
}
|
|
|
|
/** True when code point `cp` lies in the inclusive range `LATIN_CAPITAL_A`..`LATIN_CAPITAL_Z`. */
function isAsciiUpper(cp) {
    return cp >= unicode_js_1.CODE_POINTS.LATIN_CAPITAL_A && cp <= unicode_js_1.CODE_POINTS.LATIN_CAPITAL_Z;
}
|
|
|
|
/** True when code point `cp` lies in the inclusive range `LATIN_SMALL_A`..`LATIN_SMALL_Z`. */
function isAsciiLower(cp) {
    return cp >= unicode_js_1.CODE_POINTS.LATIN_SMALL_A && cp <= unicode_js_1.CODE_POINTS.LATIN_SMALL_Z;
}
|
|
|
|
/** True when `cp` satisfies `isAsciiLower` or `isAsciiUpper`. */
function isAsciiLetter(cp) {
    return isAsciiLower(cp) || isAsciiUpper(cp);
}
|
|
|
|
/** True when `cp` satisfies `isAsciiLetter` or `isAsciiDigit`. */
function isAsciiAlphaNumeric(cp) {
    return isAsciiLetter(cp) || isAsciiDigit(cp);
}
|
|
|
|
/** True when code point `cp` lies in the inclusive range `LATIN_CAPITAL_A`..`LATIN_CAPITAL_F`. */
function isAsciiUpperHexDigit(cp) {
    return cp >= unicode_js_1.CODE_POINTS.LATIN_CAPITAL_A && cp <= unicode_js_1.CODE_POINTS.LATIN_CAPITAL_F;
}
|
|
|
|
/** True when code point `cp` lies in the inclusive range `LATIN_SMALL_A`..`LATIN_SMALL_F`. */
function isAsciiLowerHexDigit(cp) {
    return cp >= unicode_js_1.CODE_POINTS.LATIN_SMALL_A && cp <= unicode_js_1.CODE_POINTS.LATIN_SMALL_F;
}
|
|
|
|
/** True when `cp` is an ASCII digit or an upper- or lower-case hex letter. */
function isAsciiHexDigit(cp) {
    return isAsciiDigit(cp) || isAsciiUpperHexDigit(cp) || isAsciiLowerHexDigit(cp);
}
|
2022-05-17 01:25:05 +00:00
|
|
|
/**
 * Adds 32 to `cp`, which maps an ASCII upper-case letter to its lower-case
 * counterpart. No range check is performed; callers must pass an upper-case
 * letter.
 */
function toAsciiLower(cp) {
    return cp + 32;
}
|
2022-05-17 01:25:05 +00:00
|
|
|
/** True when `cp` is `SPACE`, `LINE_FEED`, `TABULATION` or `FORM_FEED`. */
function isWhitespace(cp) {
    return (cp === unicode_js_1.CODE_POINTS.SPACE ||
        cp === unicode_js_1.CODE_POINTS.LINE_FEED ||
        cp === unicode_js_1.CODE_POINTS.TABULATION ||
        cp === unicode_js_1.CODE_POINTS.FORM_FEED);
}
|
2022-05-17 01:25:05 +00:00
|
|
|
/** True when `nextCp` is `EQUALS_SIGN` or an ASCII alphanumeric code point. */
function isEntityInAttributeInvalidEnd(nextCp) {
    return nextCp === unicode_js_1.CODE_POINTS.EQUALS_SIGN || isAsciiAlphaNumeric(nextCp);
}
|
2022-05-17 01:25:05 +00:00
|
|
|
/** True when `cp` is whitespace, `SOLIDUS` or `GREATER_THAN_SIGN`. */
function isScriptDataDoubleEscapeSequenceEnd(cp) {
    return (isWhitespace(cp) ||
        cp === unicode_js_1.CODE_POINTS.SOLIDUS ||
        cp === unicode_js_1.CODE_POINTS.GREATER_THAN_SIGN);
}
|
|
|
|
//Tokenizer
|
|
|
|
class Tokenizer {
|
2022-05-17 01:25:05 +00:00
|
|
|
constructor(options, handler) {
|
|
|
|
this.options = options;
|
|
|
|
this.handler = handler;
|
|
|
|
this.paused = false;
|
|
|
|
/** Ensures that the parsing loop isn't run multiple times at once. */
|
|
|
|
this.inLoop = false;
|
|
|
|
/**
|
|
|
|
* Indicates that the current adjusted node exists, is not an element in the HTML namespace,
|
|
|
|
* and that it is not an integration point for either MathML or HTML.
|
|
|
|
*
|
|
|
|
* @see {@link https://html.spec.whatwg.org/multipage/parsing.html#tree-construction}
|
|
|
|
*/
|
|
|
|
this.inForeignNode = false;
|
2020-12-18 22:06:30 +00:00
|
|
|
this.lastStartTagName = '';
|
|
|
|
this.active = false;
|
2022-05-17 01:25:05 +00:00
|
|
|
this.state = State.DATA;
|
|
|
|
this.returnState = State.DATA;
|
|
|
|
this.charRefCode = -1;
|
|
|
|
this.consumedAfterSnapshot = -1;
|
2020-12-18 22:06:30 +00:00
|
|
|
this.currentCharacterToken = null;
|
|
|
|
this.currentToken = null;
|
2022-05-17 01:25:05 +00:00
|
|
|
this.currentAttr = { name: '', value: '' };
|
|
|
|
this.preprocessor = new preprocessor_js_1.Preprocessor(handler);
|
|
|
|
this.currentLocation = this.getCurrentLocation(-1);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
//Errors
|
2022-05-17 01:25:05 +00:00
|
|
|
_err(code) {
|
|
|
|
var _a, _b;
|
|
|
|
(_b = (_a = this.handler).onParseError) === null || _b === void 0 ? void 0 : _b.call(_a, this.preprocessor.getError(code));
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
// NOTE: `offset` may never run across line boundaries.
|
|
|
|
getCurrentLocation(offset) {
|
|
|
|
if (!this.options.sourceCodeLocationInfo) {
|
|
|
|
return null;
|
|
|
|
}
|
|
|
|
return {
|
|
|
|
startLine: this.preprocessor.line,
|
|
|
|
startCol: this.preprocessor.col - offset,
|
|
|
|
startOffset: this.preprocessor.offset - offset,
|
|
|
|
endLine: -1,
|
|
|
|
endCol: -1,
|
|
|
|
endOffset: -1,
|
|
|
|
};
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
_runParsingLoop() {
|
|
|
|
if (this.inLoop)
|
|
|
|
return;
|
|
|
|
this.inLoop = true;
|
|
|
|
while (this.active && !this.paused) {
|
2020-12-18 22:06:30 +00:00
|
|
|
this.consumedAfterSnapshot = 0;
|
|
|
|
const cp = this._consume();
|
|
|
|
if (!this._ensureHibernation()) {
|
2022-05-17 01:25:05 +00:00
|
|
|
this._callState(cp);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
this.inLoop = false;
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
//API
|
|
|
|
pause() {
|
|
|
|
this.paused = true;
|
|
|
|
}
|
|
|
|
resume(writeCallback) {
|
|
|
|
if (!this.paused) {
|
|
|
|
throw new Error('Parser was already resumed');
|
|
|
|
}
|
|
|
|
this.paused = false;
|
|
|
|
// Necessary for synchronous resume.
|
|
|
|
if (this.inLoop)
|
|
|
|
return;
|
|
|
|
this._runParsingLoop();
|
|
|
|
if (!this.paused) {
|
|
|
|
writeCallback === null || writeCallback === void 0 ? void 0 : writeCallback();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
write(chunk, isLastChunk, writeCallback) {
|
2020-12-18 22:06:30 +00:00
|
|
|
this.active = true;
|
|
|
|
this.preprocessor.write(chunk, isLastChunk);
|
2022-05-17 01:25:05 +00:00
|
|
|
this._runParsingLoop();
|
|
|
|
if (!this.paused) {
|
|
|
|
writeCallback === null || writeCallback === void 0 ? void 0 : writeCallback();
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
insertHtmlAtCurrentPos(chunk) {
|
|
|
|
this.active = true;
|
|
|
|
this.preprocessor.insertHtmlAtCurrentPos(chunk);
|
2022-05-17 01:25:05 +00:00
|
|
|
this._runParsingLoop();
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
//Hibernation
|
|
|
|
_ensureHibernation() {
|
|
|
|
if (this.preprocessor.endOfChunkHit) {
|
2022-05-17 01:25:05 +00:00
|
|
|
this._unconsume(this.consumedAfterSnapshot);
|
2020-12-18 22:06:30 +00:00
|
|
|
this.active = false;
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
//Consumption
|
|
|
|
_consume() {
|
|
|
|
this.consumedAfterSnapshot++;
|
|
|
|
return this.preprocessor.advance();
|
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
_unconsume(count) {
|
|
|
|
this.consumedAfterSnapshot -= count;
|
|
|
|
this.preprocessor.retreat(count);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
_reconsumeInState(state) {
|
|
|
|
this.state = state;
|
2022-05-17 01:25:05 +00:00
|
|
|
this._unconsume(1);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
_advanceBy(count) {
|
|
|
|
this.consumedAfterSnapshot += count;
|
|
|
|
for (let i = 0; i < count; i++) {
|
|
|
|
this.preprocessor.advance();
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
_consumeSequenceIfMatch(pattern, caseSensitive) {
|
|
|
|
if (this.preprocessor.startsWith(pattern, caseSensitive)) {
|
|
|
|
// We will already have consumed one character before calling this method.
|
|
|
|
this._advanceBy(pattern.length - 1);
|
|
|
|
return true;
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
return false;
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
//Token creation
|
|
|
|
_createStartTagToken() {
|
|
|
|
this.currentToken = {
|
2022-05-17 01:25:05 +00:00
|
|
|
type: token_js_1.TokenType.START_TAG,
|
2020-12-18 22:06:30 +00:00
|
|
|
tagName: '',
|
2022-05-17 01:25:05 +00:00
|
|
|
tagID: html_js_1.TAG_ID.UNKNOWN,
|
2020-12-18 22:06:30 +00:00
|
|
|
selfClosing: false,
|
|
|
|
ackSelfClosing: false,
|
2022-05-17 01:25:05 +00:00
|
|
|
attrs: [],
|
|
|
|
location: this.getCurrentLocation(1),
|
2020-12-18 22:06:30 +00:00
|
|
|
};
|
|
|
|
}
|
|
|
|
_createEndTagToken() {
|
|
|
|
this.currentToken = {
|
2022-05-17 01:25:05 +00:00
|
|
|
type: token_js_1.TokenType.END_TAG,
|
2020-12-18 22:06:30 +00:00
|
|
|
tagName: '',
|
2022-05-17 01:25:05 +00:00
|
|
|
tagID: html_js_1.TAG_ID.UNKNOWN,
|
2020-12-18 22:06:30 +00:00
|
|
|
selfClosing: false,
|
2022-05-17 01:25:05 +00:00
|
|
|
ackSelfClosing: false,
|
|
|
|
attrs: [],
|
|
|
|
location: this.getCurrentLocation(2),
|
2020-12-18 22:06:30 +00:00
|
|
|
};
|
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
_createCommentToken(offset) {
|
2020-12-18 22:06:30 +00:00
|
|
|
this.currentToken = {
|
2022-05-17 01:25:05 +00:00
|
|
|
type: token_js_1.TokenType.COMMENT,
|
|
|
|
data: '',
|
|
|
|
location: this.getCurrentLocation(offset),
|
2020-12-18 22:06:30 +00:00
|
|
|
};
|
|
|
|
}
|
|
|
|
_createDoctypeToken(initialName) {
|
|
|
|
this.currentToken = {
|
2022-05-17 01:25:05 +00:00
|
|
|
type: token_js_1.TokenType.DOCTYPE,
|
2020-12-18 22:06:30 +00:00
|
|
|
name: initialName,
|
|
|
|
forceQuirks: false,
|
|
|
|
publicId: null,
|
2022-05-17 01:25:05 +00:00
|
|
|
systemId: null,
|
|
|
|
location: this.currentLocation,
|
2020-12-18 22:06:30 +00:00
|
|
|
};
|
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
_createCharacterToken(type, chars) {
|
2020-12-18 22:06:30 +00:00
|
|
|
this.currentCharacterToken = {
|
2022-05-17 01:25:05 +00:00
|
|
|
type,
|
|
|
|
chars,
|
|
|
|
location: this.currentLocation,
|
2020-12-18 22:06:30 +00:00
|
|
|
};
|
|
|
|
}
|
|
|
|
//Tag attributes
|
|
|
|
_createAttr(attrNameFirstCh) {
|
|
|
|
this.currentAttr = {
|
|
|
|
name: attrNameFirstCh,
|
2022-05-17 01:25:05 +00:00
|
|
|
value: '',
|
2020-12-18 22:06:30 +00:00
|
|
|
};
|
2022-05-17 01:25:05 +00:00
|
|
|
this.currentLocation = this.getCurrentLocation(0);
|
|
|
|
}
|
|
|
|
_leaveAttrName() {
|
|
|
|
var _a;
|
|
|
|
var _b;
|
|
|
|
const token = this.currentToken;
|
|
|
|
if ((0, token_js_1.getTokenAttr)(token, this.currentAttr.name) === null) {
|
|
|
|
token.attrs.push(this.currentAttr);
|
|
|
|
if (token.location && this.currentLocation) {
|
|
|
|
const attrLocations = ((_a = (_b = token.location).attrs) !== null && _a !== void 0 ? _a : (_b.attrs = Object.create(null)));
|
|
|
|
attrLocations[this.currentAttr.name] = this.currentLocation;
|
|
|
|
// Set end location
|
|
|
|
this._leaveAttrValue();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
else {
|
|
|
|
this._err(error_codes_js_1.ERR.duplicateAttribute);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
_leaveAttrValue() {
|
|
|
|
if (this.currentLocation) {
|
|
|
|
this.currentLocation.endLine = this.preprocessor.line;
|
|
|
|
this.currentLocation.endCol = this.preprocessor.col;
|
|
|
|
this.currentLocation.endOffset = this.preprocessor.offset;
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
//Token emission
|
2022-05-17 01:25:05 +00:00
|
|
|
prepareToken(ct) {
|
|
|
|
this._emitCurrentCharacterToken(ct.location);
|
2020-12-18 22:06:30 +00:00
|
|
|
this.currentToken = null;
|
2022-05-17 01:25:05 +00:00
|
|
|
if (ct.location) {
|
|
|
|
ct.location.endLine = this.preprocessor.line;
|
|
|
|
ct.location.endCol = this.preprocessor.col + 1;
|
|
|
|
ct.location.endOffset = this.preprocessor.offset + 1;
|
|
|
|
}
|
|
|
|
this.currentLocation = this.getCurrentLocation(-1);
|
|
|
|
}
|
|
|
|
emitCurrentTagToken() {
|
|
|
|
const ct = this.currentToken;
|
|
|
|
this.prepareToken(ct);
|
|
|
|
ct.tagID = (0, html_js_1.getTagID)(ct.tagName);
|
|
|
|
if (ct.type === token_js_1.TokenType.START_TAG) {
|
2020-12-18 22:06:30 +00:00
|
|
|
this.lastStartTagName = ct.tagName;
|
2022-05-17 01:25:05 +00:00
|
|
|
this.handler.onStartTag(ct);
|
|
|
|
}
|
|
|
|
else {
|
2020-12-18 22:06:30 +00:00
|
|
|
if (ct.attrs.length > 0) {
|
2022-05-17 01:25:05 +00:00
|
|
|
this._err(error_codes_js_1.ERR.endTagWithAttributes);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
if (ct.selfClosing) {
|
2022-05-17 01:25:05 +00:00
|
|
|
this._err(error_codes_js_1.ERR.endTagWithTrailingSolidus);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
this.handler.onEndTag(ct);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
this.preprocessor.dropParsedChunk();
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
emitCurrentComment(ct) {
|
|
|
|
this.prepareToken(ct);
|
|
|
|
this.handler.onComment(ct);
|
|
|
|
this.preprocessor.dropParsedChunk();
|
|
|
|
}
|
|
|
|
emitCurrentDoctype(ct) {
|
|
|
|
this.prepareToken(ct);
|
|
|
|
this.handler.onDoctype(ct);
|
|
|
|
this.preprocessor.dropParsedChunk();
|
|
|
|
}
|
|
|
|
_emitCurrentCharacterToken(nextLocation) {
|
2020-12-18 22:06:30 +00:00
|
|
|
if (this.currentCharacterToken) {
|
2022-05-17 01:25:05 +00:00
|
|
|
//NOTE: if we have a pending character token, make it's end location equal to the
|
|
|
|
//current token's start location.
|
|
|
|
if (nextLocation && this.currentCharacterToken.location) {
|
|
|
|
this.currentCharacterToken.location.endLine = nextLocation.startLine;
|
|
|
|
this.currentCharacterToken.location.endCol = nextLocation.startCol;
|
|
|
|
this.currentCharacterToken.location.endOffset = nextLocation.startOffset;
|
|
|
|
}
|
|
|
|
switch (this.currentCharacterToken.type) {
|
|
|
|
case token_js_1.TokenType.CHARACTER: {
|
|
|
|
this.handler.onCharacter(this.currentCharacterToken);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case token_js_1.TokenType.NULL_CHARACTER: {
|
|
|
|
this.handler.onNullCharacter(this.currentCharacterToken);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case token_js_1.TokenType.WHITESPACE_CHARACTER: {
|
|
|
|
this.handler.onWhitespaceCharacter(this.currentCharacterToken);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
this.currentCharacterToken = null;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
_emitEOFToken() {
|
2022-05-17 01:25:05 +00:00
|
|
|
const location = this.getCurrentLocation(0);
|
|
|
|
if (location) {
|
|
|
|
location.endLine = location.startLine;
|
|
|
|
location.endCol = location.startCol;
|
|
|
|
location.endOffset = location.startOffset;
|
|
|
|
}
|
|
|
|
this._emitCurrentCharacterToken(location);
|
|
|
|
this.handler.onEof({ type: token_js_1.TokenType.EOF, location });
|
|
|
|
this.active = false;
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
//Characters emission
|
|
|
|
//OPTIMIZATION: specification uses only one type of character tokens (one token per character).
|
|
|
|
//This causes a huge memory overhead and a lot of unnecessary parser loops. parse5 uses 3 groups of characters.
|
2022-05-17 01:25:05 +00:00
|
|
|
//If we have a sequence of characters that belong to the same group, the parser can process it
|
2020-12-18 22:06:30 +00:00
|
|
|
//as a single solid character token.
|
|
|
|
//So, there are 3 types of character tokens in parse5:
|
2022-05-17 01:25:05 +00:00
|
|
|
//1)TokenType.NULL_CHARACTER - \u0000-character sequences (e.g. '\u0000\u0000\u0000')
|
|
|
|
//2)TokenType.WHITESPACE_CHARACTER - any whitespace/new-line character sequences (e.g. '\n \r\t \f')
|
|
|
|
//3)TokenType.CHARACTER - any character sequence which doesn't belong to groups 1 and 2 (e.g. 'abcdef1234@@#$%^')
|
2020-12-18 22:06:30 +00:00
|
|
|
_appendCharToCurrentCharacterToken(type, ch) {
|
|
|
|
if (this.currentCharacterToken) {
|
2022-05-17 01:25:05 +00:00
|
|
|
if (this.currentCharacterToken.type !== type) {
|
|
|
|
this.currentLocation = this.getCurrentLocation(0);
|
|
|
|
this._emitCurrentCharacterToken(this.currentLocation);
|
|
|
|
this.preprocessor.dropParsedChunk();
|
|
|
|
}
|
|
|
|
else {
|
|
|
|
this.currentCharacterToken.chars += ch;
|
|
|
|
return;
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
this._createCharacterToken(type, ch);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
_emitCodePoint(cp) {
|
2022-05-17 01:25:05 +00:00
|
|
|
let type = token_js_1.TokenType.CHARACTER;
|
2020-12-18 22:06:30 +00:00
|
|
|
if (isWhitespace(cp)) {
|
2022-05-17 01:25:05 +00:00
|
|
|
type = token_js_1.TokenType.WHITESPACE_CHARACTER;
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
else if (cp === unicode_js_1.CODE_POINTS.NULL) {
|
|
|
|
type = token_js_1.TokenType.NULL_CHARACTER;
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
this._appendCharToCurrentCharacterToken(type, String.fromCodePoint(cp));
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
//NOTE: used when we emit characters explicitly.
|
|
|
|
//This is always for non-whitespace and non-null characters, which allows us to avoid additional checks.
|
2020-12-18 22:06:30 +00:00
|
|
|
_emitChars(ch) {
|
2022-05-17 01:25:05 +00:00
|
|
|
this._appendCharToCurrentCharacterToken(token_js_1.TokenType.CHARACTER, ch);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
// Character reference helpers
|
2022-05-17 01:25:05 +00:00
|
|
|
_matchNamedCharacterReference(cp) {
|
2020-12-18 22:06:30 +00:00
|
|
|
let result = null;
|
2022-05-17 01:25:05 +00:00
|
|
|
let excess = 0;
|
|
|
|
let withoutSemicolon = false;
|
|
|
|
for (let i = 0, current = decode_js_1.htmlDecodeTree[0]; i >= 0; cp = this._consume()) {
|
|
|
|
i = (0, decode_js_1.determineBranch)(decode_js_1.htmlDecodeTree, current, i + 1, cp);
|
|
|
|
if (i < 0)
|
|
|
|
break;
|
|
|
|
excess += 1;
|
|
|
|
current = decode_js_1.htmlDecodeTree[i];
|
|
|
|
const masked = current & decode_js_1.BinTrieFlags.VALUE_LENGTH;
|
|
|
|
// If the branch is a value, store it and continue
|
|
|
|
if (masked) {
|
|
|
|
// The mask is the number of bytes of the value, including the current byte.
|
|
|
|
const valueLength = (masked >> 14) - 1;
|
|
|
|
// Attribute values that aren't terminated properly aren't parsed, and shouldn't lead to a parser error.
|
|
|
|
// See the example in https://html.spec.whatwg.org/multipage/parsing.html#named-character-reference-state
|
|
|
|
if (cp !== unicode_js_1.CODE_POINTS.SEMICOLON &&
|
|
|
|
this._isCharacterReferenceInAttribute() &&
|
|
|
|
isEntityInAttributeInvalidEnd(this.preprocessor.peek(1))) {
|
|
|
|
//NOTE: we don't flush all consumed code points here, and instead switch back to the original state after
|
|
|
|
//emitting an ampersand. This is fine, as alphanumeric characters won't be parsed differently in attributes.
|
|
|
|
result = [unicode_js_1.CODE_POINTS.AMPERSAND];
|
|
|
|
// Skip over the value.
|
|
|
|
i += valueLength;
|
|
|
|
}
|
|
|
|
else {
|
|
|
|
// If this is a surrogate pair, consume the next two bytes.
|
|
|
|
result =
|
|
|
|
valueLength === 0
|
|
|
|
? [decode_js_1.htmlDecodeTree[i] & ~decode_js_1.BinTrieFlags.VALUE_LENGTH]
|
|
|
|
: valueLength === 1
|
|
|
|
? [decode_js_1.htmlDecodeTree[++i]]
|
|
|
|
: [decode_js_1.htmlDecodeTree[++i], decode_js_1.htmlDecodeTree[++i]];
|
|
|
|
excess = 0;
|
|
|
|
withoutSemicolon = cp !== unicode_js_1.CODE_POINTS.SEMICOLON;
|
|
|
|
}
|
|
|
|
if (valueLength === 0) {
|
|
|
|
// If the value is zero-length, we're done.
|
|
|
|
this._consume();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
this._unconsume(excess);
|
|
|
|
if (withoutSemicolon && !this.preprocessor.endOfChunkHit) {
|
|
|
|
this._err(error_codes_js_1.ERR.missingSemicolonAfterCharacterReference);
|
|
|
|
}
|
|
|
|
// We want to emit the error above on the code point after the entity.
|
|
|
|
// We always consume one code point too many in the loop, and we wait to
|
|
|
|
// unconsume it until after the error is emitted.
|
|
|
|
this._unconsume(1);
|
|
|
|
return result;
|
|
|
|
}
|
|
|
|
_isCharacterReferenceInAttribute() {
|
|
|
|
return (this.returnState === State.ATTRIBUTE_VALUE_DOUBLE_QUOTED ||
|
|
|
|
this.returnState === State.ATTRIBUTE_VALUE_SINGLE_QUOTED ||
|
|
|
|
this.returnState === State.ATTRIBUTE_VALUE_UNQUOTED);
|
|
|
|
}
|
|
|
|
_flushCodePointConsumedAsCharacterReference(cp) {
|
|
|
|
if (this._isCharacterReferenceInAttribute()) {
|
|
|
|
this.currentAttr.value += String.fromCodePoint(cp);
|
|
|
|
}
|
|
|
|
else {
|
|
|
|
this._emitCodePoint(cp);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
// Calling states this way turns out to be much faster than any other approach.
|
|
|
|
_callState(cp) {
|
|
|
|
switch (this.state) {
|
|
|
|
case State.DATA: {
|
|
|
|
this._stateData(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.RCDATA: {
|
|
|
|
this._stateRcdata(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.RAWTEXT: {
|
|
|
|
this._stateRawtext(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.SCRIPT_DATA: {
|
|
|
|
this._stateScriptData(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.PLAINTEXT: {
|
|
|
|
this._statePlaintext(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.TAG_OPEN: {
|
|
|
|
this._stateTagOpen(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.END_TAG_OPEN: {
|
|
|
|
this._stateEndTagOpen(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.TAG_NAME: {
|
|
|
|
this._stateTagName(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.RCDATA_LESS_THAN_SIGN: {
|
|
|
|
this._stateRcdataLessThanSign(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.RCDATA_END_TAG_OPEN: {
|
|
|
|
this._stateRcdataEndTagOpen(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.RCDATA_END_TAG_NAME: {
|
|
|
|
this._stateRcdataEndTagName(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.RAWTEXT_LESS_THAN_SIGN: {
|
|
|
|
this._stateRawtextLessThanSign(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.RAWTEXT_END_TAG_OPEN: {
|
|
|
|
this._stateRawtextEndTagOpen(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.RAWTEXT_END_TAG_NAME: {
|
|
|
|
this._stateRawtextEndTagName(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.SCRIPT_DATA_LESS_THAN_SIGN: {
|
|
|
|
this._stateScriptDataLessThanSign(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.SCRIPT_DATA_END_TAG_OPEN: {
|
|
|
|
this._stateScriptDataEndTagOpen(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.SCRIPT_DATA_END_TAG_NAME: {
|
|
|
|
this._stateScriptDataEndTagName(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.SCRIPT_DATA_ESCAPE_START: {
|
|
|
|
this._stateScriptDataEscapeStart(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.SCRIPT_DATA_ESCAPE_START_DASH: {
|
|
|
|
this._stateScriptDataEscapeStartDash(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.SCRIPT_DATA_ESCAPED: {
|
|
|
|
this._stateScriptDataEscaped(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.SCRIPT_DATA_ESCAPED_DASH: {
|
|
|
|
this._stateScriptDataEscapedDash(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.SCRIPT_DATA_ESCAPED_DASH_DASH: {
|
|
|
|
this._stateScriptDataEscapedDashDash(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.SCRIPT_DATA_ESCAPED_LESS_THAN_SIGN: {
|
|
|
|
this._stateScriptDataEscapedLessThanSign(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.SCRIPT_DATA_ESCAPED_END_TAG_OPEN: {
|
|
|
|
this._stateScriptDataEscapedEndTagOpen(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.SCRIPT_DATA_ESCAPED_END_TAG_NAME: {
|
|
|
|
this._stateScriptDataEscapedEndTagName(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.SCRIPT_DATA_DOUBLE_ESCAPE_START: {
|
|
|
|
this._stateScriptDataDoubleEscapeStart(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.SCRIPT_DATA_DOUBLE_ESCAPED: {
|
|
|
|
this._stateScriptDataDoubleEscaped(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.SCRIPT_DATA_DOUBLE_ESCAPED_DASH: {
|
|
|
|
this._stateScriptDataDoubleEscapedDash(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.SCRIPT_DATA_DOUBLE_ESCAPED_DASH_DASH: {
|
|
|
|
this._stateScriptDataDoubleEscapedDashDash(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.SCRIPT_DATA_DOUBLE_ESCAPED_LESS_THAN_SIGN: {
|
|
|
|
this._stateScriptDataDoubleEscapedLessThanSign(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.SCRIPT_DATA_DOUBLE_ESCAPE_END: {
|
|
|
|
this._stateScriptDataDoubleEscapeEnd(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.BEFORE_ATTRIBUTE_NAME: {
|
|
|
|
this._stateBeforeAttributeName(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.ATTRIBUTE_NAME: {
|
|
|
|
this._stateAttributeName(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.AFTER_ATTRIBUTE_NAME: {
|
|
|
|
this._stateAfterAttributeName(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.BEFORE_ATTRIBUTE_VALUE: {
|
|
|
|
this._stateBeforeAttributeValue(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.ATTRIBUTE_VALUE_DOUBLE_QUOTED: {
|
|
|
|
this._stateAttributeValueDoubleQuoted(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.ATTRIBUTE_VALUE_SINGLE_QUOTED: {
|
|
|
|
this._stateAttributeValueSingleQuoted(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.ATTRIBUTE_VALUE_UNQUOTED: {
|
|
|
|
this._stateAttributeValueUnquoted(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.AFTER_ATTRIBUTE_VALUE_QUOTED: {
|
|
|
|
this._stateAfterAttributeValueQuoted(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.SELF_CLOSING_START_TAG: {
|
|
|
|
this._stateSelfClosingStartTag(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.BOGUS_COMMENT: {
|
|
|
|
this._stateBogusComment(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.MARKUP_DECLARATION_OPEN: {
|
|
|
|
this._stateMarkupDeclarationOpen(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.COMMENT_START: {
|
|
|
|
this._stateCommentStart(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.COMMENT_START_DASH: {
|
|
|
|
this._stateCommentStartDash(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.COMMENT: {
|
|
|
|
this._stateComment(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.COMMENT_LESS_THAN_SIGN: {
|
|
|
|
this._stateCommentLessThanSign(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.COMMENT_LESS_THAN_SIGN_BANG: {
|
|
|
|
this._stateCommentLessThanSignBang(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.COMMENT_LESS_THAN_SIGN_BANG_DASH: {
|
|
|
|
this._stateCommentLessThanSignBangDash(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.COMMENT_LESS_THAN_SIGN_BANG_DASH_DASH: {
|
|
|
|
this._stateCommentLessThanSignBangDashDash(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.COMMENT_END_DASH: {
|
|
|
|
this._stateCommentEndDash(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.COMMENT_END: {
|
|
|
|
this._stateCommentEnd(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.COMMENT_END_BANG: {
|
|
|
|
this._stateCommentEndBang(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.DOCTYPE: {
|
|
|
|
this._stateDoctype(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.BEFORE_DOCTYPE_NAME: {
|
|
|
|
this._stateBeforeDoctypeName(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.DOCTYPE_NAME: {
|
|
|
|
this._stateDoctypeName(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.AFTER_DOCTYPE_NAME: {
|
|
|
|
this._stateAfterDoctypeName(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.AFTER_DOCTYPE_PUBLIC_KEYWORD: {
|
|
|
|
this._stateAfterDoctypePublicKeyword(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.BEFORE_DOCTYPE_PUBLIC_IDENTIFIER: {
|
|
|
|
this._stateBeforeDoctypePublicIdentifier(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.DOCTYPE_PUBLIC_IDENTIFIER_DOUBLE_QUOTED: {
|
|
|
|
this._stateDoctypePublicIdentifierDoubleQuoted(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.DOCTYPE_PUBLIC_IDENTIFIER_SINGLE_QUOTED: {
|
|
|
|
this._stateDoctypePublicIdentifierSingleQuoted(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.AFTER_DOCTYPE_PUBLIC_IDENTIFIER: {
|
|
|
|
this._stateAfterDoctypePublicIdentifier(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.BETWEEN_DOCTYPE_PUBLIC_AND_SYSTEM_IDENTIFIERS: {
|
|
|
|
this._stateBetweenDoctypePublicAndSystemIdentifiers(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.AFTER_DOCTYPE_SYSTEM_KEYWORD: {
|
|
|
|
this._stateAfterDoctypeSystemKeyword(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.BEFORE_DOCTYPE_SYSTEM_IDENTIFIER: {
|
|
|
|
this._stateBeforeDoctypeSystemIdentifier(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.DOCTYPE_SYSTEM_IDENTIFIER_DOUBLE_QUOTED: {
|
|
|
|
this._stateDoctypeSystemIdentifierDoubleQuoted(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.DOCTYPE_SYSTEM_IDENTIFIER_SINGLE_QUOTED: {
|
|
|
|
this._stateDoctypeSystemIdentifierSingleQuoted(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.AFTER_DOCTYPE_SYSTEM_IDENTIFIER: {
|
|
|
|
this._stateAfterDoctypeSystemIdentifier(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.BOGUS_DOCTYPE: {
|
|
|
|
this._stateBogusDoctype(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.CDATA_SECTION: {
|
|
|
|
this._stateCdataSection(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.CDATA_SECTION_BRACKET: {
|
|
|
|
this._stateCdataSectionBracket(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.CDATA_SECTION_END: {
|
|
|
|
this._stateCdataSectionEnd(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.CHARACTER_REFERENCE: {
|
|
|
|
this._stateCharacterReference(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.NAMED_CHARACTER_REFERENCE: {
|
|
|
|
this._stateNamedCharacterReference(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.AMBIGUOUS_AMPERSAND: {
|
|
|
|
this._stateAmbiguousAmpersand(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.NUMERIC_CHARACTER_REFERENCE: {
|
|
|
|
this._stateNumericCharacterReference(cp);
|
|
|
|
break;
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
case State.HEXADEMICAL_CHARACTER_REFERENCE_START: {
|
|
|
|
this._stateHexademicalCharacterReferenceStart(cp);
|
2020-12-18 22:06:30 +00:00
|
|
|
break;
|
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
case State.DECIMAL_CHARACTER_REFERENCE_START: {
|
|
|
|
this._stateDecimalCharacterReferenceStart(cp);
|
|
|
|
break;
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
case State.HEXADEMICAL_CHARACTER_REFERENCE: {
|
|
|
|
this._stateHexademicalCharacterReference(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.DECIMAL_CHARACTER_REFERENCE: {
|
|
|
|
this._stateDecimalCharacterReference(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case State.NUMERIC_CHARACTER_REFERENCE_END: {
|
|
|
|
this._stateNumericCharacterReferenceEnd();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
throw new Error('Unknown state');
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
// State machine
|
|
|
|
// Data state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateData(cp) {
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.LESS_THAN_SIGN: {
|
|
|
|
this.state = State.TAG_OPEN;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.AMPERSAND: {
|
|
|
|
this.returnState = State.DATA;
|
|
|
|
this.state = State.CHARACTER_REFERENCE;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.NULL: {
|
|
|
|
this._err(error_codes_js_1.ERR.unexpectedNullCharacter);
|
|
|
|
this._emitCodePoint(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
this._emitCodePoint(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// RCDATA state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateRcdata(cp) {
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.AMPERSAND: {
|
|
|
|
this.returnState = State.RCDATA;
|
|
|
|
this.state = State.CHARACTER_REFERENCE;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.LESS_THAN_SIGN: {
|
|
|
|
this.state = State.RCDATA_LESS_THAN_SIGN;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.NULL: {
|
|
|
|
this._err(error_codes_js_1.ERR.unexpectedNullCharacter);
|
|
|
|
this._emitChars(unicode_js_1.REPLACEMENT_CHARACTER);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
this._emitCodePoint(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// RAWTEXT state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateRawtext(cp) {
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.LESS_THAN_SIGN: {
|
|
|
|
this.state = State.RAWTEXT_LESS_THAN_SIGN;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.NULL: {
|
|
|
|
this._err(error_codes_js_1.ERR.unexpectedNullCharacter);
|
|
|
|
this._emitChars(unicode_js_1.REPLACEMENT_CHARACTER);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
this._emitCodePoint(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Script data state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateScriptData(cp) {
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.LESS_THAN_SIGN: {
|
|
|
|
this.state = State.SCRIPT_DATA_LESS_THAN_SIGN;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.NULL: {
|
|
|
|
this._err(error_codes_js_1.ERR.unexpectedNullCharacter);
|
|
|
|
this._emitChars(unicode_js_1.REPLACEMENT_CHARACTER);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
this._emitCodePoint(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// PLAINTEXT state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_statePlaintext(cp) {
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.NULL: {
|
|
|
|
this._err(error_codes_js_1.ERR.unexpectedNullCharacter);
|
|
|
|
this._emitChars(unicode_js_1.REPLACEMENT_CHARACTER);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
this._emitCodePoint(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Tag open state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateTagOpen(cp) {
|
|
|
|
if (isAsciiLetter(cp)) {
|
2020-12-18 22:06:30 +00:00
|
|
|
this._createStartTagToken();
|
2022-05-17 01:25:05 +00:00
|
|
|
this.state = State.TAG_NAME;
|
|
|
|
this._stateTagName(cp);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
else
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.EXCLAMATION_MARK: {
|
|
|
|
this.state = State.MARKUP_DECLARATION_OPEN;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.SOLIDUS: {
|
|
|
|
this.state = State.END_TAG_OPEN;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.QUESTION_MARK: {
|
|
|
|
this._err(error_codes_js_1.ERR.unexpectedQuestionMarkInsteadOfTagName);
|
|
|
|
this._createCommentToken(1);
|
|
|
|
this.state = State.BOGUS_COMMENT;
|
|
|
|
this._stateBogusComment(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._err(error_codes_js_1.ERR.eofBeforeTagName);
|
|
|
|
this._emitChars('<');
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
this._err(error_codes_js_1.ERR.invalidFirstCharacterOfTagName);
|
|
|
|
this._emitChars('<');
|
|
|
|
this.state = State.DATA;
|
|
|
|
this._stateData(cp);
|
|
|
|
}
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
// End tag open state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateEndTagOpen(cp) {
|
2020-12-18 22:06:30 +00:00
|
|
|
if (isAsciiLetter(cp)) {
|
|
|
|
this._createEndTagToken();
|
2022-05-17 01:25:05 +00:00
|
|
|
this.state = State.TAG_NAME;
|
|
|
|
this._stateTagName(cp);
|
|
|
|
}
|
|
|
|
else
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.GREATER_THAN_SIGN: {
|
|
|
|
this._err(error_codes_js_1.ERR.missingEndTagName);
|
|
|
|
this.state = State.DATA;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._err(error_codes_js_1.ERR.eofBeforeTagName);
|
|
|
|
this._emitChars('</');
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
this._err(error_codes_js_1.ERR.invalidFirstCharacterOfTagName);
|
|
|
|
this._createCommentToken(2);
|
|
|
|
this.state = State.BOGUS_COMMENT;
|
|
|
|
this._stateBogusComment(cp);
|
|
|
|
}
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
// Tag name state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateTagName(cp) {
|
|
|
|
const token = this.currentToken;
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.SPACE:
|
|
|
|
case unicode_js_1.CODE_POINTS.LINE_FEED:
|
|
|
|
case unicode_js_1.CODE_POINTS.TABULATION:
|
|
|
|
case unicode_js_1.CODE_POINTS.FORM_FEED: {
|
|
|
|
this.state = State.BEFORE_ATTRIBUTE_NAME;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.SOLIDUS: {
|
|
|
|
this.state = State.SELF_CLOSING_START_TAG;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.GREATER_THAN_SIGN: {
|
|
|
|
this.state = State.DATA;
|
|
|
|
this.emitCurrentTagToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.NULL: {
|
|
|
|
this._err(error_codes_js_1.ERR.unexpectedNullCharacter);
|
|
|
|
token.tagName += unicode_js_1.REPLACEMENT_CHARACTER;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._err(error_codes_js_1.ERR.eofInTag);
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
token.tagName += String.fromCodePoint(isAsciiUpper(cp) ? toAsciiLower(cp) : cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// RCDATA less-than sign state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateRcdataLessThanSign(cp) {
|
|
|
|
if (cp === unicode_js_1.CODE_POINTS.SOLIDUS) {
|
|
|
|
this.state = State.RCDATA_END_TAG_OPEN;
|
|
|
|
}
|
|
|
|
else {
|
2020-12-18 22:06:30 +00:00
|
|
|
this._emitChars('<');
|
2022-05-17 01:25:05 +00:00
|
|
|
this.state = State.RCDATA;
|
|
|
|
this._stateRcdata(cp);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// RCDATA end tag open state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateRcdataEndTagOpen(cp) {
|
2020-12-18 22:06:30 +00:00
|
|
|
if (isAsciiLetter(cp)) {
|
2022-05-17 01:25:05 +00:00
|
|
|
this.state = State.RCDATA_END_TAG_NAME;
|
|
|
|
this._stateRcdataEndTagName(cp);
|
|
|
|
}
|
|
|
|
else {
|
2020-12-18 22:06:30 +00:00
|
|
|
this._emitChars('</');
|
2022-05-17 01:25:05 +00:00
|
|
|
this.state = State.RCDATA;
|
|
|
|
this._stateRcdata(cp);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
handleSpecialEndTag(_cp) {
|
|
|
|
if (!this.preprocessor.startsWith(this.lastStartTagName, false)) {
|
|
|
|
return !this._ensureHibernation();
|
|
|
|
}
|
|
|
|
this._createEndTagToken();
|
|
|
|
const token = this.currentToken;
|
|
|
|
token.tagName = this.lastStartTagName;
|
|
|
|
const cp = this.preprocessor.peek(this.lastStartTagName.length);
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.SPACE:
|
|
|
|
case unicode_js_1.CODE_POINTS.LINE_FEED:
|
|
|
|
case unicode_js_1.CODE_POINTS.TABULATION:
|
|
|
|
case unicode_js_1.CODE_POINTS.FORM_FEED: {
|
|
|
|
this._advanceBy(this.lastStartTagName.length);
|
|
|
|
this.state = State.BEFORE_ATTRIBUTE_NAME;
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.SOLIDUS: {
|
|
|
|
this._advanceBy(this.lastStartTagName.length);
|
|
|
|
this.state = State.SELF_CLOSING_START_TAG;
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.GREATER_THAN_SIGN: {
|
|
|
|
this._advanceBy(this.lastStartTagName.length);
|
|
|
|
this.emitCurrentTagToken();
|
|
|
|
this.state = State.DATA;
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
return !this._ensureHibernation();
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// RCDATA end tag name state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateRcdataEndTagName(cp) {
|
|
|
|
if (this.handleSpecialEndTag(cp)) {
|
2020-12-18 22:06:30 +00:00
|
|
|
this._emitChars('</');
|
2022-05-17 01:25:05 +00:00
|
|
|
this.state = State.RCDATA;
|
|
|
|
this._stateRcdata(cp);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// RAWTEXT less-than sign state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateRawtextLessThanSign(cp) {
|
|
|
|
if (cp === unicode_js_1.CODE_POINTS.SOLIDUS) {
|
|
|
|
this.state = State.RAWTEXT_END_TAG_OPEN;
|
|
|
|
}
|
|
|
|
else {
|
2020-12-18 22:06:30 +00:00
|
|
|
this._emitChars('<');
|
2022-05-17 01:25:05 +00:00
|
|
|
this.state = State.RAWTEXT;
|
|
|
|
this._stateRawtext(cp);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// RAWTEXT end tag open state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateRawtextEndTagOpen(cp) {
|
2020-12-18 22:06:30 +00:00
|
|
|
if (isAsciiLetter(cp)) {
|
2022-05-17 01:25:05 +00:00
|
|
|
this.state = State.RAWTEXT_END_TAG_NAME;
|
|
|
|
this._stateRawtextEndTagName(cp);
|
|
|
|
}
|
|
|
|
else {
|
2020-12-18 22:06:30 +00:00
|
|
|
this._emitChars('</');
|
2022-05-17 01:25:05 +00:00
|
|
|
this.state = State.RAWTEXT;
|
|
|
|
this._stateRawtext(cp);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// RAWTEXT end tag name state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateRawtextEndTagName(cp) {
|
|
|
|
if (this.handleSpecialEndTag(cp)) {
|
2020-12-18 22:06:30 +00:00
|
|
|
this._emitChars('</');
|
2022-05-17 01:25:05 +00:00
|
|
|
this.state = State.RAWTEXT;
|
|
|
|
this._stateRawtext(cp);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Script data less-than sign state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateScriptDataLessThanSign(cp) {
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.SOLIDUS: {
|
|
|
|
this.state = State.SCRIPT_DATA_END_TAG_OPEN;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EXCLAMATION_MARK: {
|
|
|
|
this.state = State.SCRIPT_DATA_ESCAPE_START;
|
|
|
|
this._emitChars('<!');
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
this._emitChars('<');
|
|
|
|
this.state = State.SCRIPT_DATA;
|
|
|
|
this._stateScriptData(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Script data end tag open state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateScriptDataEndTagOpen(cp) {
|
2020-12-18 22:06:30 +00:00
|
|
|
if (isAsciiLetter(cp)) {
|
2022-05-17 01:25:05 +00:00
|
|
|
this.state = State.SCRIPT_DATA_END_TAG_NAME;
|
|
|
|
this._stateScriptDataEndTagName(cp);
|
|
|
|
}
|
|
|
|
else {
|
2020-12-18 22:06:30 +00:00
|
|
|
this._emitChars('</');
|
2022-05-17 01:25:05 +00:00
|
|
|
this.state = State.SCRIPT_DATA;
|
|
|
|
this._stateScriptData(cp);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Script data end tag name state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateScriptDataEndTagName(cp) {
|
|
|
|
if (this.handleSpecialEndTag(cp)) {
|
2020-12-18 22:06:30 +00:00
|
|
|
this._emitChars('</');
|
2022-05-17 01:25:05 +00:00
|
|
|
this.state = State.SCRIPT_DATA;
|
|
|
|
this._stateScriptData(cp);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Script data escape start state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateScriptDataEscapeStart(cp) {
|
|
|
|
if (cp === unicode_js_1.CODE_POINTS.HYPHEN_MINUS) {
|
|
|
|
this.state = State.SCRIPT_DATA_ESCAPE_START_DASH;
|
2020-12-18 22:06:30 +00:00
|
|
|
this._emitChars('-');
|
2022-05-17 01:25:05 +00:00
|
|
|
}
|
|
|
|
else {
|
|
|
|
this.state = State.SCRIPT_DATA;
|
|
|
|
this._stateScriptData(cp);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Script data escape start dash state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateScriptDataEscapeStartDash(cp) {
|
|
|
|
if (cp === unicode_js_1.CODE_POINTS.HYPHEN_MINUS) {
|
|
|
|
this.state = State.SCRIPT_DATA_ESCAPED_DASH_DASH;
|
2020-12-18 22:06:30 +00:00
|
|
|
this._emitChars('-');
|
2022-05-17 01:25:05 +00:00
|
|
|
}
|
|
|
|
else {
|
|
|
|
this.state = State.SCRIPT_DATA;
|
|
|
|
this._stateScriptData(cp);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Script data escaped state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateScriptDataEscaped(cp) {
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.HYPHEN_MINUS: {
|
|
|
|
this.state = State.SCRIPT_DATA_ESCAPED_DASH;
|
|
|
|
this._emitChars('-');
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.LESS_THAN_SIGN: {
|
|
|
|
this.state = State.SCRIPT_DATA_ESCAPED_LESS_THAN_SIGN;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.NULL: {
|
|
|
|
this._err(error_codes_js_1.ERR.unexpectedNullCharacter);
|
|
|
|
this._emitChars(unicode_js_1.REPLACEMENT_CHARACTER);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._err(error_codes_js_1.ERR.eofInScriptHtmlCommentLikeText);
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
this._emitCodePoint(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Script data escaped dash state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateScriptDataEscapedDash(cp) {
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.HYPHEN_MINUS: {
|
|
|
|
this.state = State.SCRIPT_DATA_ESCAPED_DASH_DASH;
|
|
|
|
this._emitChars('-');
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.LESS_THAN_SIGN: {
|
|
|
|
this.state = State.SCRIPT_DATA_ESCAPED_LESS_THAN_SIGN;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.NULL: {
|
|
|
|
this._err(error_codes_js_1.ERR.unexpectedNullCharacter);
|
|
|
|
this.state = State.SCRIPT_DATA_ESCAPED;
|
|
|
|
this._emitChars(unicode_js_1.REPLACEMENT_CHARACTER);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._err(error_codes_js_1.ERR.eofInScriptHtmlCommentLikeText);
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
this.state = State.SCRIPT_DATA_ESCAPED;
|
|
|
|
this._emitCodePoint(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Script data escaped dash dash state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateScriptDataEscapedDashDash(cp) {
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.HYPHEN_MINUS: {
|
|
|
|
this._emitChars('-');
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.LESS_THAN_SIGN: {
|
|
|
|
this.state = State.SCRIPT_DATA_ESCAPED_LESS_THAN_SIGN;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.GREATER_THAN_SIGN: {
|
|
|
|
this.state = State.SCRIPT_DATA;
|
|
|
|
this._emitChars('>');
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.NULL: {
|
|
|
|
this._err(error_codes_js_1.ERR.unexpectedNullCharacter);
|
|
|
|
this.state = State.SCRIPT_DATA_ESCAPED;
|
|
|
|
this._emitChars(unicode_js_1.REPLACEMENT_CHARACTER);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._err(error_codes_js_1.ERR.eofInScriptHtmlCommentLikeText);
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
this.state = State.SCRIPT_DATA_ESCAPED;
|
|
|
|
this._emitCodePoint(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Script data escaped less-than sign state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateScriptDataEscapedLessThanSign(cp) {
|
|
|
|
if (cp === unicode_js_1.CODE_POINTS.SOLIDUS) {
|
|
|
|
this.state = State.SCRIPT_DATA_ESCAPED_END_TAG_OPEN;
|
|
|
|
}
|
|
|
|
else if (isAsciiLetter(cp)) {
|
2020-12-18 22:06:30 +00:00
|
|
|
this._emitChars('<');
|
2022-05-17 01:25:05 +00:00
|
|
|
this.state = State.SCRIPT_DATA_DOUBLE_ESCAPE_START;
|
|
|
|
this._stateScriptDataDoubleEscapeStart(cp);
|
|
|
|
}
|
|
|
|
else {
|
2020-12-18 22:06:30 +00:00
|
|
|
this._emitChars('<');
|
2022-05-17 01:25:05 +00:00
|
|
|
this.state = State.SCRIPT_DATA_ESCAPED;
|
|
|
|
this._stateScriptDataEscaped(cp);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Script data escaped end tag open state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateScriptDataEscapedEndTagOpen(cp) {
|
2020-12-18 22:06:30 +00:00
|
|
|
if (isAsciiLetter(cp)) {
|
2022-05-17 01:25:05 +00:00
|
|
|
this.state = State.SCRIPT_DATA_ESCAPED_END_TAG_NAME;
|
|
|
|
this._stateScriptDataEscapedEndTagName(cp);
|
|
|
|
}
|
|
|
|
else {
|
2020-12-18 22:06:30 +00:00
|
|
|
this._emitChars('</');
|
2022-05-17 01:25:05 +00:00
|
|
|
this.state = State.SCRIPT_DATA_ESCAPED;
|
|
|
|
this._stateScriptDataEscaped(cp);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Script data escaped end tag name state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateScriptDataEscapedEndTagName(cp) {
|
|
|
|
if (this.handleSpecialEndTag(cp)) {
|
2020-12-18 22:06:30 +00:00
|
|
|
this._emitChars('</');
|
2022-05-17 01:25:05 +00:00
|
|
|
this.state = State.SCRIPT_DATA_ESCAPED;
|
|
|
|
this._stateScriptDataEscaped(cp);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Script data double escape start state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateScriptDataDoubleEscapeStart(cp) {
|
|
|
|
if (this.preprocessor.startsWith(unicode_js_1.SEQUENCES.SCRIPT, false) &&
|
|
|
|
isScriptDataDoubleEscapeSequenceEnd(this.preprocessor.peek(unicode_js_1.SEQUENCES.SCRIPT.length))) {
|
2020-12-18 22:06:30 +00:00
|
|
|
this._emitCodePoint(cp);
|
2022-05-17 01:25:05 +00:00
|
|
|
for (let i = 0; i < unicode_js_1.SEQUENCES.SCRIPT.length; i++) {
|
|
|
|
this._emitCodePoint(this._consume());
|
|
|
|
}
|
|
|
|
this.state = State.SCRIPT_DATA_DOUBLE_ESCAPED;
|
|
|
|
}
|
|
|
|
else if (!this._ensureHibernation()) {
|
|
|
|
this.state = State.SCRIPT_DATA_ESCAPED;
|
|
|
|
this._stateScriptDataEscaped(cp);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Script data double escaped state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateScriptDataDoubleEscaped(cp) {
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.HYPHEN_MINUS: {
|
|
|
|
this.state = State.SCRIPT_DATA_DOUBLE_ESCAPED_DASH;
|
|
|
|
this._emitChars('-');
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.LESS_THAN_SIGN: {
|
|
|
|
this.state = State.SCRIPT_DATA_DOUBLE_ESCAPED_LESS_THAN_SIGN;
|
|
|
|
this._emitChars('<');
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.NULL: {
|
|
|
|
this._err(error_codes_js_1.ERR.unexpectedNullCharacter);
|
|
|
|
this._emitChars(unicode_js_1.REPLACEMENT_CHARACTER);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._err(error_codes_js_1.ERR.eofInScriptHtmlCommentLikeText);
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
this._emitCodePoint(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Script data double escaped dash state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateScriptDataDoubleEscapedDash(cp) {
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.HYPHEN_MINUS: {
|
|
|
|
this.state = State.SCRIPT_DATA_DOUBLE_ESCAPED_DASH_DASH;
|
|
|
|
this._emitChars('-');
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.LESS_THAN_SIGN: {
|
|
|
|
this.state = State.SCRIPT_DATA_DOUBLE_ESCAPED_LESS_THAN_SIGN;
|
|
|
|
this._emitChars('<');
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.NULL: {
|
|
|
|
this._err(error_codes_js_1.ERR.unexpectedNullCharacter);
|
|
|
|
this.state = State.SCRIPT_DATA_DOUBLE_ESCAPED;
|
|
|
|
this._emitChars(unicode_js_1.REPLACEMENT_CHARACTER);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._err(error_codes_js_1.ERR.eofInScriptHtmlCommentLikeText);
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
this.state = State.SCRIPT_DATA_DOUBLE_ESCAPED;
|
|
|
|
this._emitCodePoint(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Script data double escaped dash dash state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateScriptDataDoubleEscapedDashDash(cp) {
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.HYPHEN_MINUS: {
|
|
|
|
this._emitChars('-');
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.LESS_THAN_SIGN: {
|
|
|
|
this.state = State.SCRIPT_DATA_DOUBLE_ESCAPED_LESS_THAN_SIGN;
|
|
|
|
this._emitChars('<');
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.GREATER_THAN_SIGN: {
|
|
|
|
this.state = State.SCRIPT_DATA;
|
|
|
|
this._emitChars('>');
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.NULL: {
|
|
|
|
this._err(error_codes_js_1.ERR.unexpectedNullCharacter);
|
|
|
|
this.state = State.SCRIPT_DATA_DOUBLE_ESCAPED;
|
|
|
|
this._emitChars(unicode_js_1.REPLACEMENT_CHARACTER);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._err(error_codes_js_1.ERR.eofInScriptHtmlCommentLikeText);
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
this.state = State.SCRIPT_DATA_DOUBLE_ESCAPED;
|
|
|
|
this._emitCodePoint(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Script data double escaped less-than sign state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateScriptDataDoubleEscapedLessThanSign(cp) {
|
|
|
|
if (cp === unicode_js_1.CODE_POINTS.SOLIDUS) {
|
|
|
|
this.state = State.SCRIPT_DATA_DOUBLE_ESCAPE_END;
|
2020-12-18 22:06:30 +00:00
|
|
|
this._emitChars('/');
|
2022-05-17 01:25:05 +00:00
|
|
|
}
|
|
|
|
else {
|
|
|
|
this.state = State.SCRIPT_DATA_DOUBLE_ESCAPED;
|
|
|
|
this._stateScriptDataDoubleEscaped(cp);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Script data double escape end state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateScriptDataDoubleEscapeEnd(cp) {
|
|
|
|
if (this.preprocessor.startsWith(unicode_js_1.SEQUENCES.SCRIPT, false) &&
|
|
|
|
isScriptDataDoubleEscapeSequenceEnd(this.preprocessor.peek(unicode_js_1.SEQUENCES.SCRIPT.length))) {
|
2020-12-18 22:06:30 +00:00
|
|
|
this._emitCodePoint(cp);
|
2022-05-17 01:25:05 +00:00
|
|
|
for (let i = 0; i < unicode_js_1.SEQUENCES.SCRIPT.length; i++) {
|
|
|
|
this._emitCodePoint(this._consume());
|
|
|
|
}
|
|
|
|
this.state = State.SCRIPT_DATA_ESCAPED;
|
|
|
|
}
|
|
|
|
else if (!this._ensureHibernation()) {
|
|
|
|
this.state = State.SCRIPT_DATA_DOUBLE_ESCAPED;
|
|
|
|
this._stateScriptDataDoubleEscaped(cp);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Before attribute name state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateBeforeAttributeName(cp) {
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.SPACE:
|
|
|
|
case unicode_js_1.CODE_POINTS.LINE_FEED:
|
|
|
|
case unicode_js_1.CODE_POINTS.TABULATION:
|
|
|
|
case unicode_js_1.CODE_POINTS.FORM_FEED: {
|
|
|
|
// Ignore whitespace
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.SOLIDUS:
|
|
|
|
case unicode_js_1.CODE_POINTS.GREATER_THAN_SIGN:
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this.state = State.AFTER_ATTRIBUTE_NAME;
|
|
|
|
this._stateAfterAttributeName(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EQUALS_SIGN: {
|
|
|
|
this._err(error_codes_js_1.ERR.unexpectedEqualsSignBeforeAttributeName);
|
|
|
|
this._createAttr('=');
|
|
|
|
this.state = State.ATTRIBUTE_NAME;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
this._createAttr('');
|
|
|
|
this.state = State.ATTRIBUTE_NAME;
|
|
|
|
this._stateAttributeName(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Attribute name state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateAttributeName(cp) {
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.SPACE:
|
|
|
|
case unicode_js_1.CODE_POINTS.LINE_FEED:
|
|
|
|
case unicode_js_1.CODE_POINTS.TABULATION:
|
|
|
|
case unicode_js_1.CODE_POINTS.FORM_FEED:
|
|
|
|
case unicode_js_1.CODE_POINTS.SOLIDUS:
|
|
|
|
case unicode_js_1.CODE_POINTS.GREATER_THAN_SIGN:
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._leaveAttrName();
|
|
|
|
this.state = State.AFTER_ATTRIBUTE_NAME;
|
|
|
|
this._stateAfterAttributeName(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EQUALS_SIGN: {
|
|
|
|
this._leaveAttrName();
|
|
|
|
this.state = State.BEFORE_ATTRIBUTE_VALUE;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.QUOTATION_MARK:
|
|
|
|
case unicode_js_1.CODE_POINTS.APOSTROPHE:
|
|
|
|
case unicode_js_1.CODE_POINTS.LESS_THAN_SIGN: {
|
|
|
|
this._err(error_codes_js_1.ERR.unexpectedCharacterInAttributeName);
|
|
|
|
this.currentAttr.name += String.fromCodePoint(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.NULL: {
|
|
|
|
this._err(error_codes_js_1.ERR.unexpectedNullCharacter);
|
|
|
|
this.currentAttr.name += unicode_js_1.REPLACEMENT_CHARACTER;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
this.currentAttr.name += String.fromCodePoint(isAsciiUpper(cp) ? toAsciiLower(cp) : cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// After attribute name state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateAfterAttributeName(cp) {
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.SPACE:
|
|
|
|
case unicode_js_1.CODE_POINTS.LINE_FEED:
|
|
|
|
case unicode_js_1.CODE_POINTS.TABULATION:
|
|
|
|
case unicode_js_1.CODE_POINTS.FORM_FEED: {
|
|
|
|
// Ignore whitespace
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.SOLIDUS: {
|
|
|
|
this.state = State.SELF_CLOSING_START_TAG;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EQUALS_SIGN: {
|
|
|
|
this.state = State.BEFORE_ATTRIBUTE_VALUE;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.GREATER_THAN_SIGN: {
|
|
|
|
this.state = State.DATA;
|
|
|
|
this.emitCurrentTagToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._err(error_codes_js_1.ERR.eofInTag);
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
this._createAttr('');
|
|
|
|
this.state = State.ATTRIBUTE_NAME;
|
|
|
|
this._stateAttributeName(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Before attribute value state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateBeforeAttributeValue(cp) {
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.SPACE:
|
|
|
|
case unicode_js_1.CODE_POINTS.LINE_FEED:
|
|
|
|
case unicode_js_1.CODE_POINTS.TABULATION:
|
|
|
|
case unicode_js_1.CODE_POINTS.FORM_FEED: {
|
|
|
|
// Ignore whitespace
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.QUOTATION_MARK: {
|
|
|
|
this.state = State.ATTRIBUTE_VALUE_DOUBLE_QUOTED;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.APOSTROPHE: {
|
|
|
|
this.state = State.ATTRIBUTE_VALUE_SINGLE_QUOTED;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.GREATER_THAN_SIGN: {
|
|
|
|
this._err(error_codes_js_1.ERR.missingAttributeValue);
|
|
|
|
this.state = State.DATA;
|
|
|
|
this.emitCurrentTagToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
this.state = State.ATTRIBUTE_VALUE_UNQUOTED;
|
|
|
|
this._stateAttributeValueUnquoted(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Attribute value (double-quoted) state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateAttributeValueDoubleQuoted(cp) {
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.QUOTATION_MARK: {
|
|
|
|
this.state = State.AFTER_ATTRIBUTE_VALUE_QUOTED;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.AMPERSAND: {
|
|
|
|
this.returnState = State.ATTRIBUTE_VALUE_DOUBLE_QUOTED;
|
|
|
|
this.state = State.CHARACTER_REFERENCE;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.NULL: {
|
|
|
|
this._err(error_codes_js_1.ERR.unexpectedNullCharacter);
|
|
|
|
this.currentAttr.value += unicode_js_1.REPLACEMENT_CHARACTER;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._err(error_codes_js_1.ERR.eofInTag);
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
this.currentAttr.value += String.fromCodePoint(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Attribute value (single-quoted) state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateAttributeValueSingleQuoted(cp) {
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.APOSTROPHE: {
|
|
|
|
this.state = State.AFTER_ATTRIBUTE_VALUE_QUOTED;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.AMPERSAND: {
|
|
|
|
this.returnState = State.ATTRIBUTE_VALUE_SINGLE_QUOTED;
|
|
|
|
this.state = State.CHARACTER_REFERENCE;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.NULL: {
|
|
|
|
this._err(error_codes_js_1.ERR.unexpectedNullCharacter);
|
|
|
|
this.currentAttr.value += unicode_js_1.REPLACEMENT_CHARACTER;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._err(error_codes_js_1.ERR.eofInTag);
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
this.currentAttr.value += String.fromCodePoint(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Attribute value (unquoted) state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateAttributeValueUnquoted(cp) {
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.SPACE:
|
|
|
|
case unicode_js_1.CODE_POINTS.LINE_FEED:
|
|
|
|
case unicode_js_1.CODE_POINTS.TABULATION:
|
|
|
|
case unicode_js_1.CODE_POINTS.FORM_FEED: {
|
|
|
|
this._leaveAttrValue();
|
|
|
|
this.state = State.BEFORE_ATTRIBUTE_NAME;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.AMPERSAND: {
|
|
|
|
this.returnState = State.ATTRIBUTE_VALUE_UNQUOTED;
|
|
|
|
this.state = State.CHARACTER_REFERENCE;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.GREATER_THAN_SIGN: {
|
|
|
|
this._leaveAttrValue();
|
|
|
|
this.state = State.DATA;
|
|
|
|
this.emitCurrentTagToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.NULL: {
|
|
|
|
this._err(error_codes_js_1.ERR.unexpectedNullCharacter);
|
|
|
|
this.currentAttr.value += unicode_js_1.REPLACEMENT_CHARACTER;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.QUOTATION_MARK:
|
|
|
|
case unicode_js_1.CODE_POINTS.APOSTROPHE:
|
|
|
|
case unicode_js_1.CODE_POINTS.LESS_THAN_SIGN:
|
|
|
|
case unicode_js_1.CODE_POINTS.EQUALS_SIGN:
|
|
|
|
case unicode_js_1.CODE_POINTS.GRAVE_ACCENT: {
|
|
|
|
this._err(error_codes_js_1.ERR.unexpectedCharacterInUnquotedAttributeValue);
|
|
|
|
this.currentAttr.value += String.fromCodePoint(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._err(error_codes_js_1.ERR.eofInTag);
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
this.currentAttr.value += String.fromCodePoint(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// After attribute value (quoted) state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateAfterAttributeValueQuoted(cp) {
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.SPACE:
|
|
|
|
case unicode_js_1.CODE_POINTS.LINE_FEED:
|
|
|
|
case unicode_js_1.CODE_POINTS.TABULATION:
|
|
|
|
case unicode_js_1.CODE_POINTS.FORM_FEED: {
|
|
|
|
this._leaveAttrValue();
|
|
|
|
this.state = State.BEFORE_ATTRIBUTE_NAME;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.SOLIDUS: {
|
|
|
|
this._leaveAttrValue();
|
|
|
|
this.state = State.SELF_CLOSING_START_TAG;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.GREATER_THAN_SIGN: {
|
|
|
|
this._leaveAttrValue();
|
|
|
|
this.state = State.DATA;
|
|
|
|
this.emitCurrentTagToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._err(error_codes_js_1.ERR.eofInTag);
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
this._err(error_codes_js_1.ERR.missingWhitespaceBetweenAttributes);
|
|
|
|
this.state = State.BEFORE_ATTRIBUTE_NAME;
|
|
|
|
this._stateBeforeAttributeName(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Self-closing start tag state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateSelfClosingStartTag(cp) {
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.GREATER_THAN_SIGN: {
|
|
|
|
const token = this.currentToken;
|
|
|
|
token.selfClosing = true;
|
|
|
|
this.state = State.DATA;
|
|
|
|
this.emitCurrentTagToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._err(error_codes_js_1.ERR.eofInTag);
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
this._err(error_codes_js_1.ERR.unexpectedSolidusInTag);
|
|
|
|
this.state = State.BEFORE_ATTRIBUTE_NAME;
|
|
|
|
this._stateBeforeAttributeName(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Bogus comment state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateBogusComment(cp) {
|
|
|
|
const token = this.currentToken;
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.GREATER_THAN_SIGN: {
|
|
|
|
this.state = State.DATA;
|
|
|
|
this.emitCurrentComment(token);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this.emitCurrentComment(token);
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.NULL: {
|
|
|
|
this._err(error_codes_js_1.ERR.unexpectedNullCharacter);
|
|
|
|
token.data += unicode_js_1.REPLACEMENT_CHARACTER;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
token.data += String.fromCodePoint(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Markup declaration open state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateMarkupDeclarationOpen(cp) {
|
|
|
|
if (this._consumeSequenceIfMatch(unicode_js_1.SEQUENCES.DASH_DASH, true)) {
|
|
|
|
this._createCommentToken(unicode_js_1.SEQUENCES.DASH_DASH.length + 1);
|
|
|
|
this.state = State.COMMENT_START;
|
|
|
|
}
|
|
|
|
else if (this._consumeSequenceIfMatch(unicode_js_1.SEQUENCES.DOCTYPE, false)) {
|
|
|
|
// NOTE: Doctypes tokens are created without fixed offsets. We keep track of the moment a doctype *might* start here.
|
|
|
|
this.currentLocation = this.getCurrentLocation(unicode_js_1.SEQUENCES.DOCTYPE.length + 1);
|
|
|
|
this.state = State.DOCTYPE;
|
|
|
|
}
|
|
|
|
else if (this._consumeSequenceIfMatch(unicode_js_1.SEQUENCES.CDATA_START, true)) {
|
|
|
|
if (this.inForeignNode) {
|
|
|
|
this.state = State.CDATA_SECTION;
|
|
|
|
}
|
|
|
|
else {
|
|
|
|
this._err(error_codes_js_1.ERR.cdataInHtmlContent);
|
|
|
|
this._createCommentToken(unicode_js_1.SEQUENCES.CDATA_START.length + 1);
|
2020-12-18 22:06:30 +00:00
|
|
|
this.currentToken.data = '[CDATA[';
|
2022-05-17 01:25:05 +00:00
|
|
|
this.state = State.BOGUS_COMMENT;
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
//NOTE: Sequence lookups can be abrupted by hibernation. In that case, lookup
|
2020-12-18 22:06:30 +00:00
|
|
|
//results are no longer valid and we will need to start over.
|
|
|
|
else if (!this._ensureHibernation()) {
|
2022-05-17 01:25:05 +00:00
|
|
|
this._err(error_codes_js_1.ERR.incorrectlyOpenedComment);
|
|
|
|
this._createCommentToken(2);
|
|
|
|
this.state = State.BOGUS_COMMENT;
|
|
|
|
this._stateBogusComment(cp);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Comment start state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateCommentStart(cp) {
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.HYPHEN_MINUS: {
|
|
|
|
this.state = State.COMMENT_START_DASH;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.GREATER_THAN_SIGN: {
|
|
|
|
this._err(error_codes_js_1.ERR.abruptClosingOfEmptyComment);
|
|
|
|
this.state = State.DATA;
|
|
|
|
const token = this.currentToken;
|
|
|
|
this.emitCurrentComment(token);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
this.state = State.COMMENT;
|
|
|
|
this._stateComment(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Comment start dash state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateCommentStartDash(cp) {
|
|
|
|
const token = this.currentToken;
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.HYPHEN_MINUS: {
|
|
|
|
this.state = State.COMMENT_END;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.GREATER_THAN_SIGN: {
|
|
|
|
this._err(error_codes_js_1.ERR.abruptClosingOfEmptyComment);
|
|
|
|
this.state = State.DATA;
|
|
|
|
this.emitCurrentComment(token);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._err(error_codes_js_1.ERR.eofInComment);
|
|
|
|
this.emitCurrentComment(token);
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
token.data += '-';
|
|
|
|
this.state = State.COMMENT;
|
|
|
|
this._stateComment(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Comment state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateComment(cp) {
|
|
|
|
const token = this.currentToken;
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.HYPHEN_MINUS: {
|
|
|
|
this.state = State.COMMENT_END_DASH;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.LESS_THAN_SIGN: {
|
|
|
|
token.data += '<';
|
|
|
|
this.state = State.COMMENT_LESS_THAN_SIGN;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.NULL: {
|
|
|
|
this._err(error_codes_js_1.ERR.unexpectedNullCharacter);
|
|
|
|
token.data += unicode_js_1.REPLACEMENT_CHARACTER;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._err(error_codes_js_1.ERR.eofInComment);
|
|
|
|
this.emitCurrentComment(token);
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
token.data += String.fromCodePoint(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Comment less-than sign state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateCommentLessThanSign(cp) {
|
|
|
|
const token = this.currentToken;
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.EXCLAMATION_MARK: {
|
|
|
|
token.data += '!';
|
|
|
|
this.state = State.COMMENT_LESS_THAN_SIGN_BANG;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.LESS_THAN_SIGN: {
|
|
|
|
token.data += '<';
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
this.state = State.COMMENT;
|
|
|
|
this._stateComment(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Comment less-than sign bang state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateCommentLessThanSignBang(cp) {
|
|
|
|
if (cp === unicode_js_1.CODE_POINTS.HYPHEN_MINUS) {
|
|
|
|
this.state = State.COMMENT_LESS_THAN_SIGN_BANG_DASH;
|
|
|
|
}
|
|
|
|
else {
|
|
|
|
this.state = State.COMMENT;
|
|
|
|
this._stateComment(cp);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Comment less-than sign bang dash state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateCommentLessThanSignBangDash(cp) {
|
|
|
|
if (cp === unicode_js_1.CODE_POINTS.HYPHEN_MINUS) {
|
|
|
|
this.state = State.COMMENT_LESS_THAN_SIGN_BANG_DASH_DASH;
|
|
|
|
}
|
|
|
|
else {
|
|
|
|
this.state = State.COMMENT_END_DASH;
|
|
|
|
this._stateCommentEndDash(cp);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Comment less-than sign bang dash dash state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateCommentLessThanSignBangDashDash(cp) {
|
|
|
|
if (cp !== unicode_js_1.CODE_POINTS.GREATER_THAN_SIGN && cp !== unicode_js_1.CODE_POINTS.EOF) {
|
|
|
|
this._err(error_codes_js_1.ERR.nestedComment);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
this.state = State.COMMENT_END;
|
|
|
|
this._stateCommentEnd(cp);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
// Comment end dash state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateCommentEndDash(cp) {
|
|
|
|
const token = this.currentToken;
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.HYPHEN_MINUS: {
|
|
|
|
this.state = State.COMMENT_END;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._err(error_codes_js_1.ERR.eofInComment);
|
|
|
|
this.emitCurrentComment(token);
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
token.data += '-';
|
|
|
|
this.state = State.COMMENT;
|
|
|
|
this._stateComment(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Comment end state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateCommentEnd(cp) {
|
|
|
|
const token = this.currentToken;
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.GREATER_THAN_SIGN: {
|
|
|
|
this.state = State.DATA;
|
|
|
|
this.emitCurrentComment(token);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EXCLAMATION_MARK: {
|
|
|
|
this.state = State.COMMENT_END_BANG;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.HYPHEN_MINUS: {
|
|
|
|
token.data += '-';
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._err(error_codes_js_1.ERR.eofInComment);
|
|
|
|
this.emitCurrentComment(token);
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
token.data += '--';
|
|
|
|
this.state = State.COMMENT;
|
|
|
|
this._stateComment(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Comment end bang state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateCommentEndBang(cp) {
|
|
|
|
const token = this.currentToken;
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.HYPHEN_MINUS: {
|
|
|
|
token.data += '--!';
|
|
|
|
this.state = State.COMMENT_END_DASH;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.GREATER_THAN_SIGN: {
|
|
|
|
this._err(error_codes_js_1.ERR.incorrectlyClosedComment);
|
|
|
|
this.state = State.DATA;
|
|
|
|
this.emitCurrentComment(token);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._err(error_codes_js_1.ERR.eofInComment);
|
|
|
|
this.emitCurrentComment(token);
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
token.data += '--!';
|
|
|
|
this.state = State.COMMENT;
|
|
|
|
this._stateComment(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// DOCTYPE state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateDoctype(cp) {
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.SPACE:
|
|
|
|
case unicode_js_1.CODE_POINTS.LINE_FEED:
|
|
|
|
case unicode_js_1.CODE_POINTS.TABULATION:
|
|
|
|
case unicode_js_1.CODE_POINTS.FORM_FEED: {
|
|
|
|
this.state = State.BEFORE_DOCTYPE_NAME;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.GREATER_THAN_SIGN: {
|
|
|
|
this.state = State.BEFORE_DOCTYPE_NAME;
|
|
|
|
this._stateBeforeDoctypeName(cp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._err(error_codes_js_1.ERR.eofInDoctype);
|
|
|
|
this._createDoctypeToken(null);
|
|
|
|
const token = this.currentToken;
|
|
|
|
token.forceQuirks = true;
|
|
|
|
this.emitCurrentDoctype(token);
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
this._err(error_codes_js_1.ERR.missingWhitespaceBeforeDoctypeName);
|
|
|
|
this.state = State.BEFORE_DOCTYPE_NAME;
|
|
|
|
this._stateBeforeDoctypeName(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Before DOCTYPE name state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateBeforeDoctypeName(cp) {
|
2020-12-18 22:06:30 +00:00
|
|
|
if (isAsciiUpper(cp)) {
|
2022-05-17 01:25:05 +00:00
|
|
|
this._createDoctypeToken(String.fromCharCode(toAsciiLower(cp)));
|
|
|
|
this.state = State.DOCTYPE_NAME;
|
|
|
|
}
|
|
|
|
else
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.SPACE:
|
|
|
|
case unicode_js_1.CODE_POINTS.LINE_FEED:
|
|
|
|
case unicode_js_1.CODE_POINTS.TABULATION:
|
|
|
|
case unicode_js_1.CODE_POINTS.FORM_FEED: {
|
|
|
|
// Ignore whitespace
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.NULL: {
|
|
|
|
this._err(error_codes_js_1.ERR.unexpectedNullCharacter);
|
|
|
|
this._createDoctypeToken(unicode_js_1.REPLACEMENT_CHARACTER);
|
|
|
|
this.state = State.DOCTYPE_NAME;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.GREATER_THAN_SIGN: {
|
|
|
|
this._err(error_codes_js_1.ERR.missingDoctypeName);
|
|
|
|
this._createDoctypeToken(null);
|
|
|
|
const token = this.currentToken;
|
|
|
|
token.forceQuirks = true;
|
|
|
|
this.emitCurrentDoctype(token);
|
|
|
|
this.state = State.DATA;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._err(error_codes_js_1.ERR.eofInDoctype);
|
|
|
|
this._createDoctypeToken(null);
|
|
|
|
const token = this.currentToken;
|
|
|
|
token.forceQuirks = true;
|
|
|
|
this.emitCurrentDoctype(token);
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
this._createDoctypeToken(String.fromCodePoint(cp));
|
|
|
|
this.state = State.DOCTYPE_NAME;
|
|
|
|
}
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
// DOCTYPE name state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateDoctypeName(cp) {
|
|
|
|
const token = this.currentToken;
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.SPACE:
|
|
|
|
case unicode_js_1.CODE_POINTS.LINE_FEED:
|
|
|
|
case unicode_js_1.CODE_POINTS.TABULATION:
|
|
|
|
case unicode_js_1.CODE_POINTS.FORM_FEED: {
|
|
|
|
this.state = State.AFTER_DOCTYPE_NAME;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.GREATER_THAN_SIGN: {
|
|
|
|
this.state = State.DATA;
|
|
|
|
this.emitCurrentDoctype(token);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.NULL: {
|
|
|
|
this._err(error_codes_js_1.ERR.unexpectedNullCharacter);
|
|
|
|
token.name += unicode_js_1.REPLACEMENT_CHARACTER;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._err(error_codes_js_1.ERR.eofInDoctype);
|
|
|
|
token.forceQuirks = true;
|
|
|
|
this.emitCurrentDoctype(token);
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
token.name += String.fromCodePoint(isAsciiUpper(cp) ? toAsciiLower(cp) : cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// After DOCTYPE name state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateAfterDoctypeName(cp) {
|
|
|
|
const token = this.currentToken;
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.SPACE:
|
|
|
|
case unicode_js_1.CODE_POINTS.LINE_FEED:
|
|
|
|
case unicode_js_1.CODE_POINTS.TABULATION:
|
|
|
|
case unicode_js_1.CODE_POINTS.FORM_FEED: {
|
|
|
|
// Ignore whitespace
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.GREATER_THAN_SIGN: {
|
|
|
|
this.state = State.DATA;
|
|
|
|
this.emitCurrentDoctype(token);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._err(error_codes_js_1.ERR.eofInDoctype);
|
|
|
|
token.forceQuirks = true;
|
|
|
|
this.emitCurrentDoctype(token);
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default:
|
|
|
|
if (this._consumeSequenceIfMatch(unicode_js_1.SEQUENCES.PUBLIC, false)) {
|
|
|
|
this.state = State.AFTER_DOCTYPE_PUBLIC_KEYWORD;
|
|
|
|
}
|
|
|
|
else if (this._consumeSequenceIfMatch(unicode_js_1.SEQUENCES.SYSTEM, false)) {
|
|
|
|
this.state = State.AFTER_DOCTYPE_SYSTEM_KEYWORD;
|
|
|
|
}
|
|
|
|
//NOTE: sequence lookup can be abrupted by hibernation. In that case lookup
|
|
|
|
//results are no longer valid and we will need to start over.
|
|
|
|
else if (!this._ensureHibernation()) {
|
|
|
|
this._err(error_codes_js_1.ERR.invalidCharacterSequenceAfterDoctypeName);
|
|
|
|
token.forceQuirks = true;
|
|
|
|
this.state = State.BOGUS_DOCTYPE;
|
|
|
|
this._stateBogusDoctype(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// After DOCTYPE public keyword state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateAfterDoctypePublicKeyword(cp) {
|
|
|
|
const token = this.currentToken;
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.SPACE:
|
|
|
|
case unicode_js_1.CODE_POINTS.LINE_FEED:
|
|
|
|
case unicode_js_1.CODE_POINTS.TABULATION:
|
|
|
|
case unicode_js_1.CODE_POINTS.FORM_FEED: {
|
|
|
|
this.state = State.BEFORE_DOCTYPE_PUBLIC_IDENTIFIER;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.QUOTATION_MARK: {
|
|
|
|
this._err(error_codes_js_1.ERR.missingWhitespaceAfterDoctypePublicKeyword);
|
|
|
|
token.publicId = '';
|
|
|
|
this.state = State.DOCTYPE_PUBLIC_IDENTIFIER_DOUBLE_QUOTED;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.APOSTROPHE: {
|
|
|
|
this._err(error_codes_js_1.ERR.missingWhitespaceAfterDoctypePublicKeyword);
|
|
|
|
token.publicId = '';
|
|
|
|
this.state = State.DOCTYPE_PUBLIC_IDENTIFIER_SINGLE_QUOTED;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.GREATER_THAN_SIGN: {
|
|
|
|
this._err(error_codes_js_1.ERR.missingDoctypePublicIdentifier);
|
|
|
|
token.forceQuirks = true;
|
|
|
|
this.state = State.DATA;
|
|
|
|
this.emitCurrentDoctype(token);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._err(error_codes_js_1.ERR.eofInDoctype);
|
|
|
|
token.forceQuirks = true;
|
|
|
|
this.emitCurrentDoctype(token);
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
this._err(error_codes_js_1.ERR.missingQuoteBeforeDoctypePublicIdentifier);
|
|
|
|
token.forceQuirks = true;
|
|
|
|
this.state = State.BOGUS_DOCTYPE;
|
|
|
|
this._stateBogusDoctype(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Before DOCTYPE public identifier state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateBeforeDoctypePublicIdentifier(cp) {
|
|
|
|
const token = this.currentToken;
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.SPACE:
|
|
|
|
case unicode_js_1.CODE_POINTS.LINE_FEED:
|
|
|
|
case unicode_js_1.CODE_POINTS.TABULATION:
|
|
|
|
case unicode_js_1.CODE_POINTS.FORM_FEED: {
|
|
|
|
// Ignore whitespace
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.QUOTATION_MARK: {
|
|
|
|
token.publicId = '';
|
|
|
|
this.state = State.DOCTYPE_PUBLIC_IDENTIFIER_DOUBLE_QUOTED;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.APOSTROPHE: {
|
|
|
|
token.publicId = '';
|
|
|
|
this.state = State.DOCTYPE_PUBLIC_IDENTIFIER_SINGLE_QUOTED;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.GREATER_THAN_SIGN: {
|
|
|
|
this._err(error_codes_js_1.ERR.missingDoctypePublicIdentifier);
|
|
|
|
token.forceQuirks = true;
|
|
|
|
this.state = State.DATA;
|
|
|
|
this.emitCurrentDoctype(token);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._err(error_codes_js_1.ERR.eofInDoctype);
|
|
|
|
token.forceQuirks = true;
|
|
|
|
this.emitCurrentDoctype(token);
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
this._err(error_codes_js_1.ERR.missingQuoteBeforeDoctypePublicIdentifier);
|
|
|
|
token.forceQuirks = true;
|
|
|
|
this.state = State.BOGUS_DOCTYPE;
|
|
|
|
this._stateBogusDoctype(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// DOCTYPE public identifier (double-quoted) state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateDoctypePublicIdentifierDoubleQuoted(cp) {
|
|
|
|
const token = this.currentToken;
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.QUOTATION_MARK: {
|
|
|
|
this.state = State.AFTER_DOCTYPE_PUBLIC_IDENTIFIER;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.NULL: {
|
|
|
|
this._err(error_codes_js_1.ERR.unexpectedNullCharacter);
|
|
|
|
token.publicId += unicode_js_1.REPLACEMENT_CHARACTER;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.GREATER_THAN_SIGN: {
|
|
|
|
this._err(error_codes_js_1.ERR.abruptDoctypePublicIdentifier);
|
|
|
|
token.forceQuirks = true;
|
|
|
|
this.emitCurrentDoctype(token);
|
|
|
|
this.state = State.DATA;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._err(error_codes_js_1.ERR.eofInDoctype);
|
|
|
|
token.forceQuirks = true;
|
|
|
|
this.emitCurrentDoctype(token);
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
token.publicId += String.fromCodePoint(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// DOCTYPE public identifier (single-quoted) state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateDoctypePublicIdentifierSingleQuoted(cp) {
|
|
|
|
const token = this.currentToken;
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.APOSTROPHE: {
|
|
|
|
this.state = State.AFTER_DOCTYPE_PUBLIC_IDENTIFIER;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.NULL: {
|
|
|
|
this._err(error_codes_js_1.ERR.unexpectedNullCharacter);
|
|
|
|
token.publicId += unicode_js_1.REPLACEMENT_CHARACTER;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.GREATER_THAN_SIGN: {
|
|
|
|
this._err(error_codes_js_1.ERR.abruptDoctypePublicIdentifier);
|
|
|
|
token.forceQuirks = true;
|
|
|
|
this.emitCurrentDoctype(token);
|
|
|
|
this.state = State.DATA;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._err(error_codes_js_1.ERR.eofInDoctype);
|
|
|
|
token.forceQuirks = true;
|
|
|
|
this.emitCurrentDoctype(token);
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
token.publicId += String.fromCodePoint(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// After DOCTYPE public identifier state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateAfterDoctypePublicIdentifier(cp) {
|
|
|
|
const token = this.currentToken;
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.SPACE:
|
|
|
|
case unicode_js_1.CODE_POINTS.LINE_FEED:
|
|
|
|
case unicode_js_1.CODE_POINTS.TABULATION:
|
|
|
|
case unicode_js_1.CODE_POINTS.FORM_FEED: {
|
|
|
|
this.state = State.BETWEEN_DOCTYPE_PUBLIC_AND_SYSTEM_IDENTIFIERS;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.GREATER_THAN_SIGN: {
|
|
|
|
this.state = State.DATA;
|
|
|
|
this.emitCurrentDoctype(token);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.QUOTATION_MARK: {
|
|
|
|
this._err(error_codes_js_1.ERR.missingWhitespaceBetweenDoctypePublicAndSystemIdentifiers);
|
|
|
|
token.systemId = '';
|
|
|
|
this.state = State.DOCTYPE_SYSTEM_IDENTIFIER_DOUBLE_QUOTED;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.APOSTROPHE: {
|
|
|
|
this._err(error_codes_js_1.ERR.missingWhitespaceBetweenDoctypePublicAndSystemIdentifiers);
|
|
|
|
token.systemId = '';
|
|
|
|
this.state = State.DOCTYPE_SYSTEM_IDENTIFIER_SINGLE_QUOTED;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._err(error_codes_js_1.ERR.eofInDoctype);
|
|
|
|
token.forceQuirks = true;
|
|
|
|
this.emitCurrentDoctype(token);
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
this._err(error_codes_js_1.ERR.missingQuoteBeforeDoctypeSystemIdentifier);
|
|
|
|
token.forceQuirks = true;
|
|
|
|
this.state = State.BOGUS_DOCTYPE;
|
|
|
|
this._stateBogusDoctype(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Between DOCTYPE public and system identifiers state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateBetweenDoctypePublicAndSystemIdentifiers(cp) {
|
|
|
|
const token = this.currentToken;
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.SPACE:
|
|
|
|
case unicode_js_1.CODE_POINTS.LINE_FEED:
|
|
|
|
case unicode_js_1.CODE_POINTS.TABULATION:
|
|
|
|
case unicode_js_1.CODE_POINTS.FORM_FEED: {
|
|
|
|
// Ignore whitespace
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.GREATER_THAN_SIGN: {
|
|
|
|
this.emitCurrentDoctype(token);
|
|
|
|
this.state = State.DATA;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.QUOTATION_MARK: {
|
|
|
|
token.systemId = '';
|
|
|
|
this.state = State.DOCTYPE_SYSTEM_IDENTIFIER_DOUBLE_QUOTED;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.APOSTROPHE: {
|
|
|
|
token.systemId = '';
|
|
|
|
this.state = State.DOCTYPE_SYSTEM_IDENTIFIER_SINGLE_QUOTED;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._err(error_codes_js_1.ERR.eofInDoctype);
|
|
|
|
token.forceQuirks = true;
|
|
|
|
this.emitCurrentDoctype(token);
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
this._err(error_codes_js_1.ERR.missingQuoteBeforeDoctypeSystemIdentifier);
|
|
|
|
token.forceQuirks = true;
|
|
|
|
this.state = State.BOGUS_DOCTYPE;
|
|
|
|
this._stateBogusDoctype(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// After DOCTYPE system keyword state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateAfterDoctypeSystemKeyword(cp) {
|
|
|
|
const token = this.currentToken;
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.SPACE:
|
|
|
|
case unicode_js_1.CODE_POINTS.LINE_FEED:
|
|
|
|
case unicode_js_1.CODE_POINTS.TABULATION:
|
|
|
|
case unicode_js_1.CODE_POINTS.FORM_FEED: {
|
|
|
|
this.state = State.BEFORE_DOCTYPE_SYSTEM_IDENTIFIER;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.QUOTATION_MARK: {
|
|
|
|
this._err(error_codes_js_1.ERR.missingWhitespaceAfterDoctypeSystemKeyword);
|
|
|
|
token.systemId = '';
|
|
|
|
this.state = State.DOCTYPE_SYSTEM_IDENTIFIER_DOUBLE_QUOTED;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.APOSTROPHE: {
|
|
|
|
this._err(error_codes_js_1.ERR.missingWhitespaceAfterDoctypeSystemKeyword);
|
|
|
|
token.systemId = '';
|
|
|
|
this.state = State.DOCTYPE_SYSTEM_IDENTIFIER_SINGLE_QUOTED;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.GREATER_THAN_SIGN: {
|
|
|
|
this._err(error_codes_js_1.ERR.missingDoctypeSystemIdentifier);
|
|
|
|
token.forceQuirks = true;
|
|
|
|
this.state = State.DATA;
|
|
|
|
this.emitCurrentDoctype(token);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._err(error_codes_js_1.ERR.eofInDoctype);
|
|
|
|
token.forceQuirks = true;
|
|
|
|
this.emitCurrentDoctype(token);
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
this._err(error_codes_js_1.ERR.missingQuoteBeforeDoctypeSystemIdentifier);
|
|
|
|
token.forceQuirks = true;
|
|
|
|
this.state = State.BOGUS_DOCTYPE;
|
|
|
|
this._stateBogusDoctype(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Before DOCTYPE system identifier state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateBeforeDoctypeSystemIdentifier(cp) {
|
|
|
|
const token = this.currentToken;
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.SPACE:
|
|
|
|
case unicode_js_1.CODE_POINTS.LINE_FEED:
|
|
|
|
case unicode_js_1.CODE_POINTS.TABULATION:
|
|
|
|
case unicode_js_1.CODE_POINTS.FORM_FEED: {
|
|
|
|
// Ignore whitespace
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.QUOTATION_MARK: {
|
|
|
|
token.systemId = '';
|
|
|
|
this.state = State.DOCTYPE_SYSTEM_IDENTIFIER_DOUBLE_QUOTED;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.APOSTROPHE: {
|
|
|
|
token.systemId = '';
|
|
|
|
this.state = State.DOCTYPE_SYSTEM_IDENTIFIER_SINGLE_QUOTED;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.GREATER_THAN_SIGN: {
|
|
|
|
this._err(error_codes_js_1.ERR.missingDoctypeSystemIdentifier);
|
|
|
|
token.forceQuirks = true;
|
|
|
|
this.state = State.DATA;
|
|
|
|
this.emitCurrentDoctype(token);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._err(error_codes_js_1.ERR.eofInDoctype);
|
|
|
|
token.forceQuirks = true;
|
|
|
|
this.emitCurrentDoctype(token);
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
this._err(error_codes_js_1.ERR.missingQuoteBeforeDoctypeSystemIdentifier);
|
|
|
|
token.forceQuirks = true;
|
|
|
|
this.state = State.BOGUS_DOCTYPE;
|
|
|
|
this._stateBogusDoctype(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// DOCTYPE system identifier (double-quoted) state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateDoctypeSystemIdentifierDoubleQuoted(cp) {
|
|
|
|
const token = this.currentToken;
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.QUOTATION_MARK: {
|
|
|
|
this.state = State.AFTER_DOCTYPE_SYSTEM_IDENTIFIER;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.NULL: {
|
|
|
|
this._err(error_codes_js_1.ERR.unexpectedNullCharacter);
|
|
|
|
token.systemId += unicode_js_1.REPLACEMENT_CHARACTER;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.GREATER_THAN_SIGN: {
|
|
|
|
this._err(error_codes_js_1.ERR.abruptDoctypeSystemIdentifier);
|
|
|
|
token.forceQuirks = true;
|
|
|
|
this.emitCurrentDoctype(token);
|
|
|
|
this.state = State.DATA;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._err(error_codes_js_1.ERR.eofInDoctype);
|
|
|
|
token.forceQuirks = true;
|
|
|
|
this.emitCurrentDoctype(token);
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
token.systemId += String.fromCodePoint(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// DOCTYPE system identifier (single-quoted) state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateDoctypeSystemIdentifierSingleQuoted(cp) {
|
|
|
|
const token = this.currentToken;
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.APOSTROPHE: {
|
|
|
|
this.state = State.AFTER_DOCTYPE_SYSTEM_IDENTIFIER;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.NULL: {
|
|
|
|
this._err(error_codes_js_1.ERR.unexpectedNullCharacter);
|
|
|
|
token.systemId += unicode_js_1.REPLACEMENT_CHARACTER;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.GREATER_THAN_SIGN: {
|
|
|
|
this._err(error_codes_js_1.ERR.abruptDoctypeSystemIdentifier);
|
|
|
|
token.forceQuirks = true;
|
|
|
|
this.emitCurrentDoctype(token);
|
|
|
|
this.state = State.DATA;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._err(error_codes_js_1.ERR.eofInDoctype);
|
|
|
|
token.forceQuirks = true;
|
|
|
|
this.emitCurrentDoctype(token);
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
token.systemId += String.fromCodePoint(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// After DOCTYPE system identifier state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateAfterDoctypeSystemIdentifier(cp) {
|
|
|
|
const token = this.currentToken;
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.SPACE:
|
|
|
|
case unicode_js_1.CODE_POINTS.LINE_FEED:
|
|
|
|
case unicode_js_1.CODE_POINTS.TABULATION:
|
|
|
|
case unicode_js_1.CODE_POINTS.FORM_FEED: {
|
|
|
|
// Ignore whitespace
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.GREATER_THAN_SIGN: {
|
|
|
|
this.emitCurrentDoctype(token);
|
|
|
|
this.state = State.DATA;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._err(error_codes_js_1.ERR.eofInDoctype);
|
|
|
|
token.forceQuirks = true;
|
|
|
|
this.emitCurrentDoctype(token);
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
this._err(error_codes_js_1.ERR.unexpectedCharacterAfterDoctypeSystemIdentifier);
|
|
|
|
this.state = State.BOGUS_DOCTYPE;
|
|
|
|
this._stateBogusDoctype(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Bogus DOCTYPE state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateBogusDoctype(cp) {
|
|
|
|
const token = this.currentToken;
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.GREATER_THAN_SIGN: {
|
|
|
|
this.emitCurrentDoctype(token);
|
|
|
|
this.state = State.DATA;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.NULL: {
|
|
|
|
this._err(error_codes_js_1.ERR.unexpectedNullCharacter);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this.emitCurrentDoctype(token);
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default:
|
|
|
|
// Do nothing
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// CDATA section state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateCdataSection(cp) {
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.RIGHT_SQUARE_BRACKET: {
|
|
|
|
this.state = State.CDATA_SECTION_BRACKET;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.EOF: {
|
|
|
|
this._err(error_codes_js_1.ERR.eofInCdata);
|
|
|
|
this._emitEOFToken();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
this._emitCodePoint(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// CDATA section bracket state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateCdataSectionBracket(cp) {
|
|
|
|
if (cp === unicode_js_1.CODE_POINTS.RIGHT_SQUARE_BRACKET) {
|
|
|
|
this.state = State.CDATA_SECTION_END;
|
|
|
|
}
|
|
|
|
else {
|
2020-12-18 22:06:30 +00:00
|
|
|
this._emitChars(']');
|
2022-05-17 01:25:05 +00:00
|
|
|
this.state = State.CDATA_SECTION;
|
|
|
|
this._stateCdataSection(cp);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// CDATA section end state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateCdataSectionEnd(cp) {
|
|
|
|
switch (cp) {
|
|
|
|
case unicode_js_1.CODE_POINTS.GREATER_THAN_SIGN: {
|
|
|
|
this.state = State.DATA;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case unicode_js_1.CODE_POINTS.RIGHT_SQUARE_BRACKET: {
|
|
|
|
this._emitChars(']');
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
this._emitChars(']]');
|
|
|
|
this.state = State.CDATA_SECTION;
|
|
|
|
this._stateCdataSection(cp);
|
|
|
|
}
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Character reference state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateCharacterReference(cp) {
|
|
|
|
if (cp === unicode_js_1.CODE_POINTS.NUMBER_SIGN) {
|
|
|
|
this.state = State.NUMERIC_CHARACTER_REFERENCE;
|
|
|
|
}
|
|
|
|
else if (isAsciiAlphaNumeric(cp)) {
|
|
|
|
this.state = State.NAMED_CHARACTER_REFERENCE;
|
|
|
|
this._stateNamedCharacterReference(cp);
|
|
|
|
}
|
|
|
|
else {
|
|
|
|
this._flushCodePointConsumedAsCharacterReference(unicode_js_1.CODE_POINTS.AMPERSAND);
|
2020-12-18 22:06:30 +00:00
|
|
|
this._reconsumeInState(this.returnState);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
// Named character reference state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateNamedCharacterReference(cp) {
|
2020-12-18 22:06:30 +00:00
|
|
|
const matchResult = this._matchNamedCharacterReference(cp);
|
2022-05-17 01:25:05 +00:00
|
|
|
//NOTE: Matching can be abrupted by hibernation. In that case, match
|
2020-12-18 22:06:30 +00:00
|
|
|
//results are no longer valid and we will need to start over.
|
|
|
|
if (this._ensureHibernation()) {
|
2022-05-17 01:25:05 +00:00
|
|
|
// Stay in the state, try again.
|
|
|
|
}
|
|
|
|
else if (matchResult) {
|
|
|
|
for (let i = 0; i < matchResult.length; i++) {
|
|
|
|
this._flushCodePointConsumedAsCharacterReference(matchResult[i]);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
this.state = this.returnState;
|
2022-05-17 01:25:05 +00:00
|
|
|
}
|
|
|
|
else {
|
|
|
|
this._flushCodePointConsumedAsCharacterReference(unicode_js_1.CODE_POINTS.AMPERSAND);
|
|
|
|
this.state = State.AMBIGUOUS_AMPERSAND;
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Ambiguous ampersand state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateAmbiguousAmpersand(cp) {
|
2020-12-18 22:06:30 +00:00
|
|
|
if (isAsciiAlphaNumeric(cp)) {
|
2022-05-17 01:25:05 +00:00
|
|
|
this._flushCodePointConsumedAsCharacterReference(cp);
|
|
|
|
}
|
|
|
|
else {
|
|
|
|
if (cp === unicode_js_1.CODE_POINTS.SEMICOLON) {
|
|
|
|
this._err(error_codes_js_1.ERR.unknownNamedCharacterReference);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
this._reconsumeInState(this.returnState);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
// Numeric character reference state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateNumericCharacterReference(cp) {
|
2020-12-18 22:06:30 +00:00
|
|
|
this.charRefCode = 0;
|
2022-05-17 01:25:05 +00:00
|
|
|
if (cp === unicode_js_1.CODE_POINTS.LATIN_SMALL_X || cp === unicode_js_1.CODE_POINTS.LATIN_CAPITAL_X) {
|
|
|
|
this.state = State.HEXADEMICAL_CHARACTER_REFERENCE_START;
|
|
|
|
}
|
|
|
|
else {
|
|
|
|
this.state = State.DECIMAL_CHARACTER_REFERENCE_START;
|
|
|
|
this._stateDecimalCharacterReferenceStart(cp);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Hexadecimal character reference start state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateHexademicalCharacterReferenceStart(cp) {
|
2020-12-18 22:06:30 +00:00
|
|
|
if (isAsciiHexDigit(cp)) {
|
2022-05-17 01:25:05 +00:00
|
|
|
this.state = State.HEXADEMICAL_CHARACTER_REFERENCE;
|
|
|
|
this._stateHexademicalCharacterReference(cp);
|
|
|
|
}
|
|
|
|
else {
|
|
|
|
this._err(error_codes_js_1.ERR.absenceOfDigitsInNumericCharacterReference);
|
|
|
|
this._flushCodePointConsumedAsCharacterReference(unicode_js_1.CODE_POINTS.AMPERSAND);
|
|
|
|
this._flushCodePointConsumedAsCharacterReference(unicode_js_1.CODE_POINTS.NUMBER_SIGN);
|
|
|
|
this._unconsume(2);
|
|
|
|
this.state = this.returnState;
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Decimal character reference start state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateDecimalCharacterReferenceStart(cp) {
|
2020-12-18 22:06:30 +00:00
|
|
|
if (isAsciiDigit(cp)) {
|
2022-05-17 01:25:05 +00:00
|
|
|
this.state = State.DECIMAL_CHARACTER_REFERENCE;
|
|
|
|
this._stateDecimalCharacterReference(cp);
|
|
|
|
}
|
|
|
|
else {
|
|
|
|
this._err(error_codes_js_1.ERR.absenceOfDigitsInNumericCharacterReference);
|
|
|
|
this._flushCodePointConsumedAsCharacterReference(unicode_js_1.CODE_POINTS.AMPERSAND);
|
|
|
|
this._flushCodePointConsumedAsCharacterReference(unicode_js_1.CODE_POINTS.NUMBER_SIGN);
|
2020-12-18 22:06:30 +00:00
|
|
|
this._reconsumeInState(this.returnState);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
// Hexadecimal character reference state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateHexademicalCharacterReference(cp) {
|
2020-12-18 22:06:30 +00:00
|
|
|
if (isAsciiUpperHexDigit(cp)) {
|
|
|
|
this.charRefCode = this.charRefCode * 16 + cp - 0x37;
|
2022-05-17 01:25:05 +00:00
|
|
|
}
|
|
|
|
else if (isAsciiLowerHexDigit(cp)) {
|
2020-12-18 22:06:30 +00:00
|
|
|
this.charRefCode = this.charRefCode * 16 + cp - 0x57;
|
2022-05-17 01:25:05 +00:00
|
|
|
}
|
|
|
|
else if (isAsciiDigit(cp)) {
|
2020-12-18 22:06:30 +00:00
|
|
|
this.charRefCode = this.charRefCode * 16 + cp - 0x30;
|
2022-05-17 01:25:05 +00:00
|
|
|
}
|
|
|
|
else if (cp === unicode_js_1.CODE_POINTS.SEMICOLON) {
|
|
|
|
this.state = State.NUMERIC_CHARACTER_REFERENCE_END;
|
|
|
|
}
|
|
|
|
else {
|
|
|
|
this._err(error_codes_js_1.ERR.missingSemicolonAfterCharacterReference);
|
|
|
|
this.state = State.NUMERIC_CHARACTER_REFERENCE_END;
|
|
|
|
this._stateNumericCharacterReferenceEnd();
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Decimal character reference state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateDecimalCharacterReference(cp) {
|
2020-12-18 22:06:30 +00:00
|
|
|
if (isAsciiDigit(cp)) {
|
|
|
|
this.charRefCode = this.charRefCode * 10 + cp - 0x30;
|
2022-05-17 01:25:05 +00:00
|
|
|
}
|
|
|
|
else if (cp === unicode_js_1.CODE_POINTS.SEMICOLON) {
|
|
|
|
this.state = State.NUMERIC_CHARACTER_REFERENCE_END;
|
|
|
|
}
|
|
|
|
else {
|
|
|
|
this._err(error_codes_js_1.ERR.missingSemicolonAfterCharacterReference);
|
|
|
|
this.state = State.NUMERIC_CHARACTER_REFERENCE_END;
|
|
|
|
this._stateNumericCharacterReferenceEnd();
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
// Numeric character reference end state
|
|
|
|
//------------------------------------------------------------------
|
2022-05-17 01:25:05 +00:00
|
|
|
_stateNumericCharacterReferenceEnd() {
|
|
|
|
if (this.charRefCode === unicode_js_1.CODE_POINTS.NULL) {
|
|
|
|
this._err(error_codes_js_1.ERR.nullCharacterReference);
|
|
|
|
this.charRefCode = unicode_js_1.CODE_POINTS.REPLACEMENT_CHARACTER;
|
|
|
|
}
|
|
|
|
else if (this.charRefCode > 1114111) {
|
|
|
|
this._err(error_codes_js_1.ERR.characterReferenceOutsideUnicodeRange);
|
|
|
|
this.charRefCode = unicode_js_1.CODE_POINTS.REPLACEMENT_CHARACTER;
|
|
|
|
}
|
|
|
|
else if ((0, unicode_js_1.isSurrogate)(this.charRefCode)) {
|
|
|
|
this._err(error_codes_js_1.ERR.surrogateCharacterReference);
|
|
|
|
this.charRefCode = unicode_js_1.CODE_POINTS.REPLACEMENT_CHARACTER;
|
|
|
|
}
|
|
|
|
else if ((0, unicode_js_1.isUndefinedCodePoint)(this.charRefCode)) {
|
|
|
|
this._err(error_codes_js_1.ERR.noncharacterCharacterReference);
|
|
|
|
}
|
|
|
|
else if ((0, unicode_js_1.isControlCodePoint)(this.charRefCode) || this.charRefCode === unicode_js_1.CODE_POINTS.CARRIAGE_RETURN) {
|
|
|
|
this._err(error_codes_js_1.ERR.controlCharacterReference);
|
|
|
|
const replacement = C1_CONTROLS_REFERENCE_REPLACEMENTS.get(this.charRefCode);
|
|
|
|
if (replacement !== undefined) {
|
2020-12-18 22:06:30 +00:00
|
|
|
this.charRefCode = replacement;
|
|
|
|
}
|
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
this._flushCodePointConsumedAsCharacterReference(this.charRefCode);
|
2020-12-18 22:06:30 +00:00
|
|
|
this._reconsumeInState(this.returnState);
|
|
|
|
}
|
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
exports.Tokenizer = Tokenizer;
|
2020-12-18 22:06:30 +00:00
|
|
|
|
2022-05-17 01:25:05 +00:00
|
|
|
},{"../common/error-codes.js":2,"../common/html.js":4,"../common/token.js":5,"../common/unicode.js":6,"./preprocessor.js":13,"entities/lib/decode.js":15}],13:[function(require,module,exports){
|
|
|
|
"use strict";
|
|
|
|
Object.defineProperty(exports, "__esModule", { value: true });
|
|
|
|
exports.Preprocessor = void 0;
|
|
|
|
const unicode_js_1 = require("../common/unicode.js");
|
|
|
|
const error_codes_js_1 = require("../common/error-codes.js");
|
2020-12-18 22:06:30 +00:00
|
|
|
//Const
|
|
|
|
const DEFAULT_BUFFER_WATERLINE = 1 << 16;
|
|
|
|
//Preprocessor
|
|
|
|
//NOTE: HTML input preprocessing
|
|
|
|
//(see: http://www.whatwg.org/specs/web-apps/current-work/multipage/parsing.html#preprocessing-the-input-stream)
|
|
|
|
/**
 * HTML input-stream preprocessor.
 *
 * Buffers written chunks in `html` and hands out one code point at a time via
 * `advance()`. It converts CR and CRLF to a single LF, combines UTF-16
 * surrogate pairs, tracks line / column / offset, and reports input-stream
 * parse errors to `handler.onParseError` when that callback is set.
 */
class Preprocessor {
    /**
     * @param {{onParseError?: ?Function}} handler Object whose optional
     *   `onParseError` callback receives error records built by `getError`.
     */
    constructor(handler) {
        this.handler = handler;
        this.html = '';
        this.pos = -1;
        // NOTE: Initial `lastGapPos` is -2, to ensure `col` on initialisation is 0
        this.lastGapPos = -2;
        this.gapStack = [];
        this.skipNextNewLine = false;
        this.lastChunkWritten = false;
        this.endOfChunkHit = false;
        this.bufferWaterline = DEFAULT_BUFFER_WATERLINE;
        this.isEol = false;
        this.lineStartPos = 0;
        this.droppedBufferSize = 0;
        this.line = 1;
        //NOTE: avoid reporting errors twice on advance/retreat
        this.lastErrOffset = -1;
    }
    /** The column on the current line. If we just saw a gap (eg. a surrogate pair), return the index before. */
    get col() {
        return this.pos - this.lineStartPos + Number(this.lastGapPos !== this.pos);
    }
    /** Position in the whole input, counting buffer prefixes that were already dropped. */
    get offset() {
        return this.droppedBufferSize + this.pos;
    }
    /**
     * Builds a zero-width error record at the current position.
     * @param {*} code Error code stored on the record.
     * @returns {Object} Record with `code` and identical start/end line, col and offset.
     */
    getError(code) {
        const { line, col, offset } = this;
        return {
            code,
            startLine: line,
            endLine: line,
            startCol: col,
            endCol: col,
            startOffset: offset,
            endOffset: offset,
        };
    }
    /**
     * Reports `code` to the handler, at most once per offset.
     * @param {*} code Error code to report.
     */
    _err(code) {
        if (this.handler.onParseError && this.lastErrOffset !== this.offset) {
            this.lastErrOffset = this.offset;
            this.handler.onParseError(this.getError(code));
        }
    }
    /** Records the current position as a gap that `retreat()` has to step over. */
    _addGap() {
        this.gapStack.push(this.lastGapPos);
        this.lastGapPos = this.pos;
    }
    /**
     * Handles a surrogate code unit found at the current position.
     * @param {number} cp The surrogate code unit.
     * @returns {number} The combined code point, EOF when more input is
     *   needed to decide, or `cp` itself for an isolated surrogate.
     */
    _processSurrogate(cp) {
        //NOTE: try to peek a surrogate pair
        if (this.pos !== this.html.length - 1) {
            const nextCp = this.html.charCodeAt(this.pos + 1);
            if ((0, unicode_js_1.isSurrogatePair)(nextCp)) {
                //NOTE: we have a surrogate pair. Peek pair character and recalculate code point.
                this.pos++;
                //NOTE: add a gap that should be avoided during retreat
                this._addGap();
                return (0, unicode_js_1.getSurrogatePairCodePoint)(cp, nextCp);
            }
        }
        //NOTE: we are at the end of a chunk, therefore we can't infer the surrogate pair yet.
        else if (!this.lastChunkWritten) {
            this.endOfChunkHit = true;
            return unicode_js_1.CODE_POINTS.EOF;
        }
        //NOTE: isolated surrogate
        this._err(error_codes_js_1.ERR.surrogateInInputStream);
        return cp;
    }
    /** @returns {boolean} True when `pos` has passed `bufferWaterline`. */
    willDropParsedChunk() {
        return this.pos > this.bufferWaterline;
    }
    /** Discards the already-consumed buffer prefix and rebases all positions on the remainder. */
    dropParsedChunk() {
        if (!this.willDropParsedChunk()) {
            return;
        }
        this.html = this.html.substring(this.pos);
        this.lineStartPos -= this.pos;
        this.droppedBufferSize += this.pos;
        this.pos = 0;
        // Recorded gaps refer to the old buffer, so they are reset.
        this.lastGapPos = -2;
        this.gapStack.length = 0;
    }
    /**
     * Appends a chunk of input.
     * @param {string} chunk Text to append.
     * @param {boolean} isLastChunk Whether no further chunks will follow.
     */
    write(chunk, isLastChunk) {
        if (this.html.length > 0) {
            this.html += chunk;
        }
        else {
            this.html = chunk;
        }
        this.endOfChunkHit = false;
        this.lastChunkWritten = isLastChunk;
    }
    /**
     * Inserts `chunk` right after the current position.
     * @param {string} chunk Text to insert.
     */
    insertHtmlAtCurrentPos(chunk) {
        const splitAt = this.pos + 1;
        this.html = this.html.substring(0, splitAt) + chunk + this.html.substring(splitAt);
        this.endOfChunkHit = false;
    }
    /**
     * Tests whether the buffer at the current position starts with `pattern`.
     * @param {string} pattern Text to match. The case-insensitive path sets
     *   bit 0x20 on each buffer code unit, so `pattern` has to be lower case.
     * @param {boolean} caseSensitive Whether to compare exactly.
     * @returns {boolean} True on a match; false also when the buffer is too short.
     */
    startsWith(pattern, caseSensitive) {
        // Check if our buffer has enough characters
        if (this.pos + pattern.length > this.html.length) {
            this.endOfChunkHit = !this.lastChunkWritten;
            return false;
        }
        if (caseSensitive) {
            return this.html.startsWith(pattern, this.pos);
        }
        for (let i = 0; i < pattern.length; i++) {
            const cp = this.html.charCodeAt(this.pos + i) | 0x20;
            if (cp !== pattern.charCodeAt(i)) {
                return false;
            }
        }
        return true;
    }
    /**
     * Reads the code unit `offset` positions ahead without consuming it.
     * @param {number} offset Distance from the current position.
     * @returns {number} The code unit, or EOF when it lies beyond the buffer.
     */
    peek(offset) {
        const pos = this.pos + offset;
        if (pos >= this.html.length) {
            this.endOfChunkHit = !this.lastChunkWritten;
            return unicode_js_1.CODE_POINTS.EOF;
        }
        return this.html.charCodeAt(pos);
    }
    /**
     * Consumes and returns the next code point.
     * @returns {number} The next code point (CR and CRLF yield one LF), or EOF.
     */
    advance() {
        this.pos++;
        //NOTE: LF should be in the last column of the line
        if (this.isEol) {
            this.isEol = false;
            this.line++;
            this.lineStartPos = this.pos;
        }
        if (this.pos >= this.html.length) {
            this.endOfChunkHit = !this.lastChunkWritten;
            return unicode_js_1.CODE_POINTS.EOF;
        }
        let cp = this.html.charCodeAt(this.pos);
        //NOTE: all U+000D CARRIAGE RETURN (CR) characters must be converted to U+000A LINE FEED (LF) characters
        if (cp === unicode_js_1.CODE_POINTS.CARRIAGE_RETURN) {
            this.isEol = true;
            this.skipNextNewLine = true;
            return unicode_js_1.CODE_POINTS.LINE_FEED;
        }
        //NOTE: any U+000A LINE FEED (LF) characters that immediately follow a U+000D CARRIAGE RETURN (CR) character
        //must be ignored.
        if (cp === unicode_js_1.CODE_POINTS.LINE_FEED) {
            this.isEol = true;
            if (this.skipNextNewLine) {
                // `line` will be bumped again in the recursive call.
                this.line--;
                this.skipNextNewLine = false;
                this._addGap();
                return this.advance();
            }
        }
        this.skipNextNewLine = false;
        if ((0, unicode_js_1.isSurrogate)(cp)) {
            cp = this._processSurrogate(cp);
        }
        //OPTIMIZATION: first check if code point is in the common allowed
        //range (ASCII alphanumeric, whitespaces, big chunk of BMP)
        //before going into detailed performance cost validation.
        // `== null` also covers a handler that leaves `onParseError` undefined;
        // `_err` reports nothing in that case, so the detailed check is wasted work.
        const isCommonValidRange = this.handler.onParseError == null ||
            (cp > 0x1f && cp < 0x7f) ||
            cp === unicode_js_1.CODE_POINTS.LINE_FEED ||
            cp === unicode_js_1.CODE_POINTS.CARRIAGE_RETURN ||
            (cp > 0x9f && cp < 64976);
        if (!isCommonValidRange) {
            this._checkForProblematicCharacters(cp);
        }
        return cp;
    }
    /**
     * Reports control characters and noncharacters found in the input stream.
     * @param {number} cp Code point to classify.
     */
    _checkForProblematicCharacters(cp) {
        if ((0, unicode_js_1.isControlCodePoint)(cp)) {
            this._err(error_codes_js_1.ERR.controlCharacterInInputStream);
        }
        else if ((0, unicode_js_1.isUndefinedCodePoint)(cp)) {
            this._err(error_codes_js_1.ERR.noncharacterInInputStream);
        }
    }
    /**
     * Moves the position back by `count` code points, stepping one extra
     * position for every recorded gap that is crossed.
     * @param {number} count Number of code points to un-consume.
     */
    retreat(count) {
        this.pos -= count;
        while (this.pos < this.lastGapPos) {
            this.lastGapPos = this.gapStack.pop();
            this.pos--;
        }
        this.isEol = false;
    }
}
|
2022-05-17 01:25:05 +00:00
|
|
|
exports.Preprocessor = Preprocessor;
|
|
|
|
|
|
|
|
},{"../common/error-codes.js":2,"../common/unicode.js":6}],14:[function(require,module,exports){
|
|
|
|
"use strict";
|
|
|
|
Object.defineProperty(exports, "__esModule", { value: true });
|
|
|
|
exports.defaultTreeAdapter = exports.NodeType = void 0;
|
|
|
|
const html_js_1 = require("../common/html.js");
|
|
|
|
/**
 * `nodeName` values used by the default tree adapter for non-element nodes.
 * Merged into `exports.NodeType` (created on first use).
 */
var NodeType;
(function (NodeType) {
    NodeType["Document"] = "#document";
    NodeType["DocumentFragment"] = "#document-fragment";
    NodeType["Comment"] = "#comment";
    NodeType["Text"] = "#text";
    NodeType["DocumentType"] = "#documentType";
})(NodeType = exports.NodeType || (exports.NodeType = {}));
|
|
|
|
/**
 * Creates a detached text node.
 *
 * @param {string} value Text content of the node.
 * @returns {{nodeName: string, value: string, parentNode: null}} New node with no parent.
 */
function createTextNode(value) {
    return {
        nodeName: NodeType.Text,
        value,
        parentNode: null,
    };
}
|
|
|
|
exports.defaultTreeAdapter = {
|
|
|
|
//Node construction
|
|
|
|
createDocument() {
|
|
|
|
return {
|
|
|
|
nodeName: NodeType.Document,
|
|
|
|
mode: html_js_1.DOCUMENT_MODE.NO_QUIRKS,
|
|
|
|
childNodes: [],
|
|
|
|
};
|
|
|
|
},
|
|
|
|
createDocumentFragment() {
|
|
|
|
return {
|
|
|
|
nodeName: NodeType.DocumentFragment,
|
|
|
|
childNodes: [],
|
|
|
|
};
|
|
|
|
},
|
|
|
|
createElement(tagName, namespaceURI, attrs) {
|
|
|
|
return {
|
|
|
|
nodeName: tagName,
|
|
|
|
tagName,
|
|
|
|
attrs,
|
|
|
|
namespaceURI,
|
|
|
|
childNodes: [],
|
|
|
|
parentNode: null,
|
|
|
|
};
|
|
|
|
},
|
|
|
|
createCommentNode(data) {
|
|
|
|
return {
|
|
|
|
nodeName: NodeType.Comment,
|
|
|
|
data,
|
|
|
|
parentNode: null,
|
|
|
|
};
|
|
|
|
},
|
|
|
|
//Tree mutation
|
|
|
|
appendChild(parentNode, newNode) {
|
|
|
|
parentNode.childNodes.push(newNode);
|
|
|
|
newNode.parentNode = parentNode;
|
|
|
|
},
|
|
|
|
insertBefore(parentNode, newNode, referenceNode) {
|
|
|
|
const insertionIdx = parentNode.childNodes.indexOf(referenceNode);
|
|
|
|
parentNode.childNodes.splice(insertionIdx, 0, newNode);
|
|
|
|
newNode.parentNode = parentNode;
|
|
|
|
},
|
|
|
|
setTemplateContent(templateElement, contentElement) {
|
|
|
|
templateElement.content = contentElement;
|
|
|
|
},
|
|
|
|
getTemplateContent(templateElement) {
|
|
|
|
return templateElement.content;
|
|
|
|
},
|
|
|
|
setDocumentType(document, name, publicId, systemId) {
|
|
|
|
const doctypeNode = document.childNodes.find((node) => node.nodeName === NodeType.DocumentType);
|
|
|
|
if (doctypeNode) {
|
|
|
|
doctypeNode.name = name;
|
|
|
|
doctypeNode.publicId = publicId;
|
|
|
|
doctypeNode.systemId = systemId;
|
|
|
|
}
|
|
|
|
else {
|
|
|
|
const node = {
|
|
|
|
nodeName: NodeType.DocumentType,
|
|
|
|
name,
|
|
|
|
publicId,
|
|
|
|
systemId,
|
|
|
|
parentNode: null,
|
|
|
|
};
|
|
|
|
exports.defaultTreeAdapter.appendChild(document, node);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
},
|
|
|
|
setDocumentMode(document, mode) {
|
|
|
|
document.mode = mode;
|
|
|
|
},
|
|
|
|
getDocumentMode(document) {
|
|
|
|
return document.mode;
|
|
|
|
},
|
|
|
|
detachNode(node) {
|
|
|
|
if (node.parentNode) {
|
|
|
|
const idx = node.parentNode.childNodes.indexOf(node);
|
|
|
|
node.parentNode.childNodes.splice(idx, 1);
|
|
|
|
node.parentNode = null;
|
|
|
|
}
|
|
|
|
},
|
|
|
|
insertText(parentNode, text) {
|
|
|
|
if (parentNode.childNodes.length > 0) {
|
|
|
|
const prevNode = parentNode.childNodes[parentNode.childNodes.length - 1];
|
|
|
|
if (exports.defaultTreeAdapter.isTextNode(prevNode)) {
|
|
|
|
prevNode.value += text;
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
exports.defaultTreeAdapter.appendChild(parentNode, createTextNode(text));
|
|
|
|
},
|
|
|
|
insertTextBefore(parentNode, text, referenceNode) {
|
|
|
|
const prevNode = parentNode.childNodes[parentNode.childNodes.indexOf(referenceNode) - 1];
|
|
|
|
if (prevNode && exports.defaultTreeAdapter.isTextNode(prevNode)) {
|
2020-12-18 22:06:30 +00:00
|
|
|
prevNode.value += text;
|
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
else {
|
|
|
|
exports.defaultTreeAdapter.insertBefore(parentNode, createTextNode(text), referenceNode);
|
2020-12-18 22:06:30 +00:00
|
|
|
}
|
2022-05-17 01:25:05 +00:00
|
|
|
},
|
|
|
|
adoptAttributes(recipient, attrs) {
|
|
|
|
const recipientAttrsMap = new Set(recipient.attrs.map((attr) => attr.name));
|
|
|
|
for (let j = 0; j < attrs.length; j++) {
|
|
|
|
if (!recipientAttrsMap.has(attrs[j].name)) {
|
|
|
|
recipient.attrs.push(attrs[j]);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
},
|
|
|
|
//Tree traversing
|
|
|
|
getFirstChild(node) {
|
|
|
|
return node.childNodes[0];
|
|
|
|
},
|
|
|
|
getChildNodes(node) {
|
|
|
|
return node.childNodes;
|
|
|
|
},
|
|
|
|
getParentNode(node) {
|
|
|
|
return node.parentNode;
|
|
|
|
},
|
|
|
|
getAttrList(element) {
|
|
|
|
return element.attrs;
|
|
|
|
},
|
|
|
|
//Node data
|
|
|
|
getTagName(element) {
|
|
|
|
return element.tagName;
|
|
|
|
},
|
|
|
|
getNamespaceURI(element) {
|
|
|
|
return element.namespaceURI;
|
|
|
|
},
|
|
|
|
getTextNodeContent(textNode) {
|
|
|
|
return textNode.value;
|
|
|
|
},
|
|
|
|
getCommentNodeContent(commentNode) {
|
|
|
|
return commentNode.data;
|
|
|
|
},
|
|
|
|
getDocumentTypeNodeName(doctypeNode) {
|
|
|
|
return doctypeNode.name;
|
|
|
|
},
|
|
|
|
getDocumentTypeNodePublicId(doctypeNode) {
|
|
|
|
return doctypeNode.publicId;
|
|
|
|
},
|
|
|
|
getDocumentTypeNodeSystemId(doctypeNode) {
|
|
|
|
return doctypeNode.systemId;
|
|
|
|
},
|
|
|
|
//Node types
|
|
|
|
isTextNode(node) {
|
|
|
|
return node.nodeName === '#text';
|
|
|
|
},
|
|
|
|
isCommentNode(node) {
|
|
|
|
return node.nodeName === '#comment';
|
|
|
|
},
|
|
|
|
isDocumentTypeNode(node) {
|
|
|
|
return node.nodeName === NodeType.DocumentType;
|
|
|
|
},
|
|
|
|
isElementNode(node) {
|
|
|
|
return Object.prototype.hasOwnProperty.call(node, 'tagName');
|
|
|
|
},
|
|
|
|
// Source code location
|
|
|
|
setNodeSourceCodeLocation(node, location) {
|
|
|
|
node.sourceCodeLocation = location;
|
|
|
|
},
|
|
|
|
getNodeSourceCodeLocation(node) {
|
|
|
|
return node.sourceCodeLocation;
|
|
|
|
},
|
|
|
|
updateNodeSourceCodeLocation(node, endLocation) {
|
|
|
|
node.sourceCodeLocation = Object.assign(Object.assign({}, node.sourceCodeLocation), endLocation);
|
|
|
|
},
|
2020-12-18 22:06:30 +00:00
|
|
|
};
|
|
|
|
|
2022-05-17 01:25:05 +00:00
|
|
|
},{"../common/html.js":4}],15:[function(require,module,exports){
|
|
|
|
"use strict";
|
|
|
|
// Module-interop helper: reuses `this.__importDefault` when present; otherwise
// returns ES-module objects as-is and wraps anything else as `{ default: mod }`.
var __importDefault = (this && this.__importDefault) || function (mod) {
    return (mod && mod.__esModule) ? mod : { "default": mod };
};
|
2022-05-17 01:25:05 +00:00
|
|
|
Object.defineProperty(exports, "__esModule", { value: true });
|
|
|
|
exports.decodeXML = exports.decodeHTMLStrict = exports.decodeHTML = exports.determineBranch = exports.BinTrieFlags = exports.fromCodePoint = exports.replaceCodePoint = exports.decodeCodePoint = exports.xmlDecodeTree = exports.htmlDecodeTree = void 0;
|
|
|
|
var decode_data_html_js_1 = __importDefault(require("./generated/decode-data-html.js"));
|
|
|
|
exports.htmlDecodeTree = decode_data_html_js_1.default;
|
|
|
|
var decode_data_xml_js_1 = __importDefault(require("./generated/decode-data-xml.js"));
|
|
|
|
exports.xmlDecodeTree = decode_data_xml_js_1.default;
|
|
|
|
var decode_codepoint_js_1 = __importDefault(require("./decode_codepoint.js"));
|
|
|
|
exports.decodeCodePoint = decode_codepoint_js_1.default;
|
|
|
|
var decode_codepoint_js_2 = require("./decode_codepoint.js");
|
|
|
|
Object.defineProperty(exports, "replaceCodePoint", { enumerable: true, get: function () { return decode_codepoint_js_2.replaceCodePoint; } });
|
|
|
|
Object.defineProperty(exports, "fromCodePoint", { enumerable: true, get: function () { return decode_codepoint_js_2.fromCodePoint; } });
|
|
|
|
// Character codes used by the decoder, stored both name -> code and code -> name.
var CharCodes;
(function (CharCodes) {
    CharCodes[CharCodes["NUM"] = 35] = "NUM"; // "#"
    CharCodes[CharCodes["SEMI"] = 59] = "SEMI"; // ";"
    CharCodes[CharCodes["ZERO"] = 48] = "ZERO"; // "0"
    CharCodes[CharCodes["NINE"] = 57] = "NINE"; // "9"
    CharCodes[CharCodes["LOWER_A"] = 97] = "LOWER_A"; // "a"
    CharCodes[CharCodes["LOWER_F"] = 102] = "LOWER_F"; // "f"
    CharCodes[CharCodes["LOWER_X"] = 120] = "LOWER_X"; // "x"
    /** Bit that needs to be set to convert an upper case ASCII character to lower case */
    CharCodes[CharCodes["To_LOWER_BIT"] = 32] = "To_LOWER_BIT";
})(CharCodes || (CharCodes = {}));
|
|
|
|
// Bit masks for one 16-bit trie node, merged into `exports.BinTrieFlags`.
var BinTrieFlags;
(function (BinTrieFlags) {
    // 0xC000: top two bits.
    BinTrieFlags[BinTrieFlags["VALUE_LENGTH"] = 49152] = "VALUE_LENGTH";
    // 0x3F80: the seven bits below that.
    BinTrieFlags[BinTrieFlags["BRANCH_LENGTH"] = 16256] = "BRANCH_LENGTH";
    // 0x007F: low seven bits.
    BinTrieFlags[BinTrieFlags["JUMP_TABLE"] = 127] = "JUMP_TABLE";
})(BinTrieFlags = exports.BinTrieFlags || (exports.BinTrieFlags = {}));
|
|
|
|
/**
 * Builds an entity decoder backed by a binary trie.
 *
 * @param {Uint16Array} decodeTree Trie of named entities, walked with `determineBranch`.
 * @returns {function(string, boolean): string} `decode(str, strict)`; in
 *   strict mode an entity is decoded only when it ends with a semicolon.
 */
function getDecoder(decodeTree) {
    return function decodeHTMLBinary(str, strict) {
        let ret = "";
        let lastIdx = 0;
        let strIdx = 0;
        while ((strIdx = str.indexOf("&", strIdx)) >= 0) {
            ret += str.slice(lastIdx, strIdx);
            lastIdx = strIdx;
            // Skip the "&"
            strIdx += 1;
            // If we have a numeric entity, handle this separately.
            if (str.charCodeAt(strIdx) === CharCodes.NUM) {
                // Skip the leading "&#". For hex entities, also skip the leading "x".
                let start = strIdx + 1;
                let base = 10;
                let cp = str.charCodeAt(start);
                if ((cp | CharCodes.To_LOWER_BIT) === CharCodes.LOWER_X) {
                    base = 16;
                    strIdx += 1;
                    start += 1;
                }
                // Advance past every digit that is valid in `base`.
                do {
                    cp = str.charCodeAt(++strIdx);
                } while ((cp >= CharCodes.ZERO && cp <= CharCodes.NINE) ||
                    (base === 16 &&
                        (cp | CharCodes.To_LOWER_BIT) >= CharCodes.LOWER_A &&
                        (cp | CharCodes.To_LOWER_BIT) <= CharCodes.LOWER_F));
                // Decode only when at least one digit was found.
                if (start !== strIdx) {
                    const entity = str.substring(start, strIdx);
                    const parsed = parseInt(entity, base);
                    if (str.charCodeAt(strIdx) === CharCodes.SEMI) {
                        strIdx += 1;
                    }
                    else if (strict) {
                        // Leave the text untouched: `lastIdx` still points at the "&".
                        continue;
                    }
                    ret += (0, decode_codepoint_js_1.default)(parsed);
                    lastIdx = strIdx;
                }
                continue;
            }
            let resultIdx = 0;
            let excess = 1;
            let treeIdx = 0;
            let current = decodeTree[treeIdx];
            for (; strIdx < str.length; strIdx++, excess++) {
                treeIdx = determineBranch(decodeTree, current, treeIdx + 1, str.charCodeAt(strIdx));
                if (treeIdx < 0) {
                    break;
                }
                current = decodeTree[treeIdx];
                const masked = current & BinTrieFlags.VALUE_LENGTH;
                // If the branch is a value, store it and continue
                if (masked) {
                    // If we have a legacy entity while parsing strictly, just skip the number of bytes
                    if (!strict || str.charCodeAt(strIdx) === CharCodes.SEMI) {
                        resultIdx = treeIdx;
                        excess = 0;
                    }
                    // The mask is the number of bytes of the value, including the current byte.
                    const skip = (masked >> 14) - 1;
                    if (skip === 0) {
                        break;
                    }
                    treeIdx += skip;
                }
            }
            if (resultIdx !== 0) {
                const valueLength = (decodeTree[resultIdx] & BinTrieFlags.VALUE_LENGTH) >> 14;
                if (valueLength === 1) {
                    // The value shares the node with the flag bits.
                    ret += String.fromCharCode(decodeTree[resultIdx] & ~BinTrieFlags.VALUE_LENGTH);
                }
                else if (valueLength === 2) {
                    ret += String.fromCharCode(decodeTree[resultIdx + 1]);
                }
                else {
                    ret += String.fromCharCode(decodeTree[resultIdx + 1], decodeTree[resultIdx + 2]);
                }
                // `excess` counts characters consumed after the last accepted match.
                lastIdx = strIdx - excess + 1;
            }
        }
        return ret + str.slice(lastIdx);
    };
}
|
2022-05-17 01:25:05 +00:00
|
|
|
/**
 * Finds the trie node reached from the current node by following `char`.
 *
 * @param {Uint16Array} decodeTree The trie.
 * @param {number} current Value of the current node (flags and branch info).
 * @param {number} nodeIdx Index of the slot right after the current node.
 * @param {number} char Character code to follow.
 * @returns {number} Index of the next node, or -1 when there is no branch for `char`.
 */
function determineBranch(decodeTree, current, nodeIdx, char) {
    const branchCount = (current & BinTrieFlags.BRANCH_LENGTH) >> 7;
    const jumpOffset = current & BinTrieFlags.JUMP_TABLE;
    // Case 1: Single branch encoded in jump offset
    if (branchCount === 0) {
        return jumpOffset !== 0 && char === jumpOffset ? nodeIdx : -1;
    }
    // Case 2: Multiple branches encoded in jump table
    if (jumpOffset) {
        const value = char - jumpOffset;
        // The table holds `branchCount` slots (indices 0 .. branchCount - 1).
        // `value === branchCount` is already past the end, so the bound is `>=`.
        return value < 0 || value >= branchCount
            ? -1
            : decodeTree[nodeIdx + value] - 1;
    }
    // Case 3: Multiple branches encoded in dictionary
    // Binary search for the character; keys are followed by `branchCount` targets.
    let lo = nodeIdx;
    let hi = lo + branchCount - 1;
    while (lo <= hi) {
        const mid = (lo + hi) >>> 1;
        const midVal = decodeTree[mid];
        if (midVal < char) {
            lo = mid + 1;
        }
        else if (midVal > char) {
            hi = mid - 1;
        }
        else {
            return decodeTree[mid + branchCount];
        }
    }
    return -1;
}
|
|
|
|
exports.determineBranch = determineBranch;
|
|
|
|
var htmlDecoder = getDecoder(decode_data_html_js_1.default);
|
|
|
|
var xmlDecoder = getDecoder(decode_data_xml_js_1.default);
|
|
|
|
/**
 * Decodes entities in `str` with the HTML decoder in non-strict mode.
 *
 * @param {string} str Text to decode.
 * @returns {string} Decoded text.
 */
function decodeHTML(str) {
    return htmlDecoder(str, false);
}
|
|
|
|
exports.decodeHTML = decodeHTML;
|
|
|
|
/**
 * Decodes entities in `str` with the HTML decoder in strict mode.
 *
 * @param {string} str Text to decode.
 * @returns {string} Decoded text.
 */
function decodeHTMLStrict(str) {
    return htmlDecoder(str, true);
}
|
|
|
|
exports.decodeHTMLStrict = decodeHTMLStrict;
|
|
|
|
/**
 * Decodes entities in `str` with the XML decoder, always in strict mode.
 *
 * @param {string} str Text to decode.
 * @returns {string} Decoded text.
 */
function decodeXML(str) {
    return xmlDecoder(str, true);
}
|
|
|
|
exports.decodeXML = decodeXML;
|
|
|
|
|
|
|
|
},{"./decode_codepoint.js":16,"./generated/decode-data-html.js":18,"./generated/decode-data-xml.js":19}],16:[function(require,module,exports){
|
|
|
|
"use strict";
|
|
|
|
// Adapted from https://github.com/mathiasbynens/he/blob/36afe179392226cf1b6ccdb16ebbb7a5a844d93a/src/he.js#L106-L134
|
|
|
|
var _a;
|
|
|
|
Object.defineProperty(exports, "__esModule", { value: true });
|
|
|
|
exports.replaceCodePoint = exports.fromCodePoint = void 0;
|
|
|
|
// Replacement code points for numeric references to 0 and to the 128-159
// range; code points without an entry are left unchanged by replaceCodePoint.
var decodeMap = new Map([
    [0, 65533],
    [128, 8364],
    [130, 8218],
    [131, 402],
    [132, 8222],
    [133, 8230],
    [134, 8224],
    [135, 8225],
    [136, 710],
    [137, 8240],
    [138, 352],
    [139, 8249],
    [140, 338],
    [142, 381],
    [145, 8216],
    [146, 8217],
    [147, 8220],
    [148, 8221],
    [149, 8226],
    [150, 8211],
    [151, 8212],
    [152, 732],
    [153, 8482],
    [154, 353],
    [155, 8250],
    [156, 339],
    [158, 382],
    [159, 376],
]);
|
|
|
|
// Uses the native `String.fromCodePoint` when it exists; otherwise falls back
// to building the UTF-16 code units by hand.
exports.fromCodePoint =
    // eslint-disable-next-line @typescript-eslint/no-unnecessary-condition, node/no-unsupported-features/es-builtins
    String.fromCodePoint != null
        ? String.fromCodePoint
        : function (codePoint) {
            var output = "";
            if (codePoint > 0xffff) {
                // Emit the high surrogate, then reduce to the low surrogate.
                codePoint -= 0x10000;
                output += String.fromCharCode(((codePoint >>> 10) & 0x3ff) | 0xd800);
                codePoint = 0xdc00 | (codePoint & 0x3ff);
            }
            output += String.fromCharCode(codePoint);
            return output;
        };
|
2022-05-17 01:25:05 +00:00
|
|
|
/**
 * Maps a numeric-reference code point to the code point that should be emitted.
 *
 * @param {number} codePoint Code point taken from a numeric reference.
 * @returns {number} 0xFFFD for surrogates and values above 0x10FFFF, the
 *   `decodeMap` entry when one exists, otherwise `codePoint` unchanged.
 */
function replaceCodePoint(codePoint) {
    const isSurrogate = codePoint >= 0xd800 && codePoint <= 0xdfff;
    if (isSurrogate || codePoint > 0x10ffff) {
        return 0xfffd;
    }
    const replacement = decodeMap.get(codePoint);
    return replacement != null ? replacement : codePoint;
}
|
|
|
|
exports.replaceCodePoint = replaceCodePoint;
|
|
|
|
/**
 * Converts a numeric-reference code point to a string, after passing it
 * through `replaceCodePoint`.
 *
 * @param {number} codePoint Code point taken from a numeric reference.
 * @returns {string} The resulting character(s).
 */
function decodeCodePoint(codePoint) {
    const replaced = replaceCodePoint(codePoint);
    return (0, exports.fromCodePoint)(replaced);
}
|
|
|
|
exports.default = decodeCodePoint;
|
|
|
|
|
|
|
|
},{}],17:[function(require,module,exports){
|
|
|
|
"use strict";
|
|
|
|
Object.defineProperty(exports, "__esModule", { value: true });
|
|
|
|
exports.escapeText = exports.escapeAttribute = exports.escapeUTF8 = exports.escape = exports.encodeXML = exports.getCodePoint = exports.xmlReplacer = void 0;
|
|
|
|
exports.xmlReplacer = /["&'<>$\x80-\uFFFF]/g;
|
|
|
|
// Character code -> XML entity for the five characters with a named XML
// entity. The values must be the entity text itself, not the character.
var xmlCodeMap = new Map([
    [34, "&quot;"],
    [38, "&amp;"],
    [39, "&apos;"],
    [60, "&lt;"],
    [62, "&gt;"],
]);
|
|
|
|
// For compatibility with node < 4, we wrap `codePointAt`
|
|
|
|
// Returns the code point at `index`: via the native `codePointAt` when
// available, otherwise by combining a high surrogate with the unit after it.
exports.getCodePoint =
    // eslint-disable-next-line @typescript-eslint/no-unnecessary-condition
    String.prototype.codePointAt != null
        ? function (str, index) { return str.codePointAt(index); }
        : // http://mathiasbynens.be/notes/javascript-encoding#surrogate-formulae
            function (c, index) {
                var unit = c.charCodeAt(index);
                // Anything that is not a high surrogate is already a full code point.
                if ((unit & 0xfc00) !== 0xd800) {
                    return unit;
                }
                return (unit - 0xd800) * 0x400 +
                    c.charCodeAt(index + 1) -
                    0xdc00 +
                    0x10000;
            };
|
|
|
|
/**
 * Encodes all non-ASCII characters, as well as characters not valid in XML
 * documents using XML entities.
 *
 * If a character has no equivalent entity, a
 * numeric hexadecimal reference (eg. `&#xfc;`) will be used.
 *
 * @param {string} str String to encode.
 * @returns {string} Encoded string.
 */
function encodeXML(str) {
    let ret = "";
    let lastIdx = 0;
    let match;
    // `exports.xmlReplacer` is a global regex, so `exec` resumes at its `lastIndex`.
    while ((match = exports.xmlReplacer.exec(str)) !== null) {
        const i = match.index;
        const char = str.charCodeAt(i);
        const next = xmlCodeMap.get(char);
        if (next !== undefined) {
            ret += str.substring(lastIdx, i) + next;
            lastIdx = i + 1;
        }
        else {
            ret += "".concat(str.substring(lastIdx, i), "&#x").concat((0, exports.getCodePoint)(str, i).toString(16), ";");
            // Increase by 1 if we have a surrogate pair
            lastIdx = exports.xmlReplacer.lastIndex += Number((char & 0xfc00) === 0xd800);
        }
    }
    return ret + str.substring(lastIdx);
}
|
|
|
|
exports.encodeXML = encodeXML;
|
|
|
|
/**
|
|
|
|
* Encodes all non-ASCII characters, as well as characters not valid in XML
|
|
|
|
* documents using numeric hexadecimal reference (eg. `&#xfc;`).
|
|
|
|
*
|
|
|
|
* Have a look at `escapeUTF8` if you want a more concise output at the expense
|
|
|
|
* of reduced transportability.
|
|
|
|
*
|
|
|
|
* @param data String to escape.
|
|
|
|
*/
|
|
|
|
exports.escape = encodeXML;
|
|
|
|
/**
 * Creates an escaping function from a regex and a replacement table.
 *
 * @param {RegExp} regex Global regex matching single characters to escape.
 * @param {Map<number, string>} map Replacement text keyed by character code;
 *   it is expected to hold an entry for every character `regex` can match.
 * @returns {function(string): string} Function that escapes its argument.
 */
function getEscaper(regex, map) {
    return function escape(data) {
        let match;
        let lastIdx = 0;
        let result = "";
        while ((match = regex.exec(data))) {
            // Copy the untouched text between the previous match and this one.
            if (lastIdx !== match.index) {
                result += data.substring(lastIdx, match.index);
            }
            // We know that this character will be in the map.
            result += map.get(match[0].charCodeAt(0));
            // Every match will be of length 1
            lastIdx = match.index + 1;
        }
        return result + data.substring(lastIdx);
    };
}
|
|
|
|
/**
|
|
|
|
* Encodes all characters not valid in XML documents using XML entities.
|
|
|
|
*
|
|
|
|
* Note that the output will be character-set dependent.
|
|
|
|
*
|
|
|
|
* @param data String to escape.
|
|
|
|
*/
|
|
|
|
exports.escapeUTF8 = getEscaper(/[&<>'"]/g, xmlCodeMap);
|
|
|
|
/**
|
|
|
|
* Encodes all characters that have to be escaped in HTML attributes,
|
|
|
|
* following {@link https://html.spec.whatwg.org/multipage/parsing.html#escapingString}.
|
|
|
|
*
|
|
|
|
* @param data String to escape.
|
|
|
|
*/
|
|
|
|
exports.escapeAttribute = getEscaper(/["&\u00A0]/g, new Map([
|
|
|
|
[34, """],
|
|
|
|
[38, "&"],
|
|
|
|
[160, " "],
|
|
|
|
]));
|
|
|
|
/**
|
|
|
|
* Encodes all characters that have to be escaped in HTML text,
|
|
|
|
* following {@link https://html.spec.whatwg.org/multipage/parsing.html#escapingString}.
|
|
|
|
*
|
|
|
|
* @param data String to escape.
|
|
|
|
*/
|
|
|
|
exports.escapeText = getEscaper(/[&<>\u00A0]/g, new Map([
|
|
|
|
[38, "&"],
|
|
|
|
[60, "<"],
|
|
|
|
[62, ">"],
|
|
|
|
[160, " "],
|
|
|
|
]));
|
|
|
|
|
|
|
|
},{}],18:[function(require,module,exports){
|
|
|
|
"use strict";
|
|
|
|
Object.defineProperty(exports, "__esModule", { value: true });
|
|
|
|
// Generated using scripts/write-decode-map.ts
|
|
|
|
// prettier-ignore
|
|
|
|
exports.default = new Uint16Array([7489, 60, 213, 305, 650, 1181, 1403, 1488, 1653, 1758, 1954, 2006, 2063, 2634, 2705, 3489, 3693, 3849, 3878, 4298, 4648, 4833, 5141, 5277, 5315, 5343, 5413, 0, 0, 0, 0, 0, 0, 5483, 5837, 6541, 7186, 7645, 8062, 8288, 8624, 8845, 9152, 9211, 9282, 10276, 10514, 11528, 11848, 12238, 12310, 12986, 13881, 14252, 14590, 14888, 14961, 15072, 15150, 2048, 69, 77, 97, 98, 99, 102, 103, 108, 109, 110, 111, 112, 114, 115, 116, 117, 92, 98, 102, 109, 115, 127, 132, 139, 144, 149, 152, 166, 179, 185, 200, 207, 108, 105, 103, 32827, 198, 16582, 80, 32827, 38, 16422, 99, 117, 116, 101, 32827, 193, 16577, 114, 101, 118, 101, 59, 16642, 256, 105, 121, 120, 125, 114, 99, 32827, 194, 16578, 59, 17424, 114, 59, 49152, 55349, 56580, 114, 97, 118, 101, 32827, 192, 16576, 112, 104, 97, 59, 17297, 97, 99, 114, 59, 16640, 100, 59, 27219, 256, 103, 112, 157, 161, 111, 110, 59, 16644, 102, 59, 49152, 55349, 56632, 112, 108, 121, 70, 117, 110, 99, 116, 105, 111, 110, 59, 24673, 105, 110, 103, 32827, 197, 16581, 256, 99, 115, 190, 195, 114, 59, 49152, 55349, 56476, 105, 103, 110, 59, 25172, 105, 108, 100, 101, 32827, 195, 16579, 109, 108, 32827, 196, 16580, 1024, 97, 99, 101, 102, 111, 114, 115, 117, 229, 251, 254, 279, 284, 290, 295, 298, 256, 99, 114, 234, 242, 107, 115, 108, 97, 115, 104, 59, 25110, 374, 246, 248, 59, 27367, 101, 100, 59, 25350, 121, 59, 17425, 384, 99, 114, 116, 261, 267, 276, 97, 117, 115, 101, 59, 25141, 110, 111, 117, 108, 108, 105, 115, 59, 24876, 97, 59, 17298, 114, 59, 49152, 55349, 56581, 112, 102, 59, 49152, 55349, 56633, 101, 118, 101, 59, 17112, 99, 242, 275, 109, 112, 101, 113, 59, 25166, 1792, 72, 79, 97, 99, 100, 101, 102, 104, 105, 108, 111, 114, 115, 117, 333, 337, 342, 384, 414, 418, 437, 439, 442, 476, 533, 627, 632, 638, 99, 121, 59, 17447, 80, 89, 32827, 169, 16553, 384, 99, 112, 121, 349, 354, 378, 117, 116, 101, 59, 16646, 256, 59, 105, 359, 360, 25298, 116, 97, 108, 68, 105, 102, 102, 101, 114, 101, 110, 116, 105, 
97, 108, 68, 59, 24901, 108, 101, 121, 115, 59, 24877, 512, 97, 101, 105, 111, 393, 398, 404, 408, 114, 111, 110, 59, 16652, 100, 105, 108, 32827, 199, 16583, 114, 99, 59, 16648, 110, 105, 110, 116, 59, 25136, 111, 116, 59, 16650, 256, 100, 110, 423, 429, 105, 108, 108, 97, 59, 16568, 116, 101, 114, 68, 111, 116, 59, 16567, 242, 383, 105, 59, 17319, 114, 99, 108, 101, 512, 68, 77, 80, 84, 455, 459, 465, 470, 111, 116, 59, 25241, 105, 110, 117, 115, 59, 25238, 108, 117, 115, 59, 25237, 105, 109, 101, 115, 59, 25239, 111, 256, 99, 115, 482, 504, 107, 119, 105, 115, 101, 67, 111, 110, 116, 111, 117, 114, 73, 110, 116, 101, 103, 114, 97, 108, 59, 25138, 101, 67, 117, 114, 108, 121, 256, 68, 81, 515, 527, 111, 117, 98, 108, 101, 81, 117, 111, 116, 101, 59, 24605, 117, 111, 116, 101, 59, 24601, 512, 108, 110, 112, 117, 542, 552, 583, 597, 111, 110, 256, 59, 101, 549, 550, 25143, 59, 27252, 384, 103, 105, 116, 559, 566, 570, 114, 117, 101, 110, 116, 59, 25185, 110, 116, 59, 25135, 111, 117, 114, 73, 110, 116, 101, 103, 114, 97, 108, 59, 25134, 256, 102, 114, 588, 590, 59, 24834, 111, 100, 117, 99, 116, 59, 25104, 110, 116, 101, 114, 67, 108, 111, 99, 107, 119, 105, 115, 101, 67, 111, 110, 116, 111, 117, 114, 73, 110, 116, 101, 103, 114, 97, 108, 59, 25139, 111, 115, 115, 59, 27183, 99, 114, 59, 49152, 55349, 56478, 112, 256, 59, 67, 644, 645, 25299, 97, 112, 59, 25165, 1408, 68, 74, 83, 90, 97, 99, 101, 102, 105, 111, 115, 672, 684, 688, 692, 696, 715, 727, 737, 742, 819, 1165, 256, 59, 111, 377, 677, 116, 114, 97, 104, 100, 59, 26897, 99, 121, 59, 17410, 99, 121, 59, 17413, 99, 121, 59, 17423, 384, 103, 114, 115, 703, 708, 711, 103, 101, 114, 59, 24609, 114, 59, 24993, 104, 118, 59, 27364, 256, 97, 121, 720, 725, 114, 111, 110, 59, 16654, 59, 17428, 108, 256, 59, 116, 733, 734, 25095, 97, 59, 17300, 114, 59, 49152, 55349, 56583, 256, 97, 102, 747, 807, 256, 99, 109, 752, 802, 114, 105, 116, 105, 99, 97, 108, 512, 65, 68, 71, 84, 768, 774, 790, 796, 99, 117, 116, 101, 59, 
16564, 111, 372, 779, 781, 59, 17113, 98, 108, 101, 65, 99, 117, 116, 101, 59, 17117, 114, 97, 11
|
|
|
|
|
|
|
|
},{}],19:[function(require,module,exports){
|
|
|
|
"use strict";
|
|
|
|
Object.defineProperty(exports, "__esModule", { value: true });
|
|
|
|
// Generated using scripts/write-decode-map.ts
|
|
|
|
// prettier-ignore
|
|
|
|
// NOTE(review): machine-generated packed table; do not edit by hand. Several
// entries are ASCII char codes (97 "a", 103 "g", 108 "l", 113 "q", 59 ";"),
// and the values >= 16384 have low bits equal to 38, 39, 62, 60 and 34
// ("&", "'", ">", "<", '"'). This looks like the lookup data for the five XML
// entities (amp, apos, gt, lt, quot) — confirm against the generator script
// and the decoder that reads this module before relying on that layout.
exports.default = new Uint16Array([512, 97, 103, 108, 113, 9, 21, 24, 27, 621, 15, 0, 0, 18, 112, 59, 16422, 111, 115, 59, 16423, 116, 59, 16446, 116, 59, 16444, 117, 111, 116, 59, 16418]);
|
|
|
|
|
|
|
|
},{}]},{},[7])(7)
|
2020-12-18 22:06:30 +00:00
|
|
|
});
|
|
|
|
|
2022-05-17 01:25:05 +00:00
|
|
|
//# sourceMappingURL=data:application/json;charset=utf-8;base64,eyJ2ZXJzaW9uIjozLCJzb3VyY2VzIjpbIi4uLy4uLy4uL2Jyb3dzZXItcGFjay9fcHJlbHVkZS5qcyIsImNvbW1vbi9kb2N0eXBlLmpzIiwiY29tbW9uL2Vycm9yLWNvZGVzLmpzIiwiY29tbW9uL2ZvcmVpZ24tY29udGVudC5qcyIsImNvbW1vbi9odG1sLmpzIiwiY29tbW9uL3Rva2VuLmpzIiwiY29tbW9uL3VuaWNvZGUuanMiLCJpbmRleC5qcyIsInBhcnNlci9mb3JtYXR0aW5nLWVsZW1lbnQtbGlzdC5qcyIsInBhcnNlci9pbmRleC5qcyIsInBhcnNlci9vcGVuLWVsZW1lbnQtc3RhY2suanMiLCJzZXJpYWxpemVyL2luZGV4LmpzIiwidG9rZW5pemVyL2luZGV4LmpzIiwidG9rZW5pemVyL3ByZXByb2Nlc3Nvci5qcyIsInRyZWUtYWRhcHRlcnMvZGVmYXVsdC5qcyIsIi4uLy4uL25vZGVfbW9kdWxlcy9lbnRpdGllcy9saWIvZGVjb2RlLmpzIiwiLi4vLi4vbm9kZV9tb2R1bGVzL2VudGl0aWVzL2xpYi9kZWNvZGVfY29kZXBvaW50LmpzIiwiLi4vLi4vbm9kZV9tb2R1bGVzL2VudGl0aWVzL2xpYi9lc2NhcGUuanMiLCIuLi8uLi9ub2RlX21vZHVsZXMvZW50aXRpZXMvbGliL2dlbmVyYXRlZC9kZWNvZGUtZGF0YS1odG1sLmpzIiwiLi4vLi4vbm9kZV9tb2R1bGVzL2VudGl0aWVzL2xpYi9nZW5lcmF0ZWQvZGVjb2RlLWRhdGEteG1sLmpzIl0sIm5hbWVzIjpbXSwibWFwcGluZ3MiOiJBQUFBO0FDQUE7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBOztBQ3ZIQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtB
QUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTs7QUNsRUE7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTs7QUM5T0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FB
Q0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUNBO0FBQ0E7QUFDQTtBQUN
|