'use strict'; Object.defineProperty(exports, '__esModule', { value: true }); var CleanCSS = require('clean-css'); var entities = require('entities'); var RelateURL = require('relateurl'); var terser = require('terser'); async function replaceAsync(str, regex, asyncFn) { const promises = []; str.replace(regex, (match, ...args) => { const promise = asyncFn(match, ...args); promises.push(promise); }); const data = await Promise.all(promises); return str.replace(regex, () => data.shift()); } /*! * HTML Parser By John Resig (ejohn.org) * Modified by Juriy "kangax" Zaytsev * Original code by Erik Arvidsson, Mozilla Public License * http://erik.eae.net/simplehtmlparser/simplehtmlparser.js */ class CaseInsensitiveSet extends Set { has(str) { return super.has(str.toLowerCase()); } } // Regular Expressions for parsing tags and attributes const singleAttrIdentifier = /([^\s"'<>/=]+)/; const singleAttrAssigns = [/=/]; const singleAttrValues = [ // attr value double quotes /"([^"]*)"+/.source, // attr value, single quotes /'([^']*)'+/.source, // attr value, no quotes /([^ \t\n\f\r"'`=<>]+)/.source ]; // https://www.w3.org/TR/1999/REC-xml-names-19990114/#NT-QName const qnameCapture = (function () { // based on https://www.npmjs.com/package/ncname const combiningChar = '\\u0300-\\u0345\\u0360\\u0361\\u0483-\\u0486\\u0591-\\u05A1\\u05A3-\\u05B9\\u05BB-\\u05BD\\u05BF\\u05C1\\u05C2\\u05C4\\u064B-\\u0652\\u0670\\u06D6-\\u06E4\\u06E7\\u06E8\\u06EA-\\u06ED\\u0901-\\u0903\\u093C\\u093E-\\u094D\\u0951-\\u0954\\u0962\\u0963\\u0981-\\u0983\\u09BC\\u09BE-\\u09C4\\u09C7\\u09C8\\u09CB-\\u09CD\\u09D7\\u09E2\\u09E3\\u0A02\\u0A3C\\u0A3E-\\u0A42\\u0A47\\u0A48\\u0A4B-\\u0A4D\\u0A70\\u0A71\\u0A81-\\u0A83\\u0ABC\\u0ABE-\\u0AC5\\u0AC7-\\u0AC9\\u0ACB-\\u0ACD\\u0B01-\\u0B03\\u0B3C\\u0B3E-\\u0B43\\u0B47\\u0B48\\u0B4B-\\u0B4D\\u0B56\\u0B57\\u0B82\\u0B83\\u0BBE-\\u0BC2\\u0BC6-\\u0BC8\\u0BCA-\\u0BCD\\u0BD7\\u0C01-\\u0C03\\u0C3E-\\u0C44\\u0C46-\\u0C48\\u0C4A-\\u0C4D\\u0C55\\u0C56\\u0C82\\u0C83\\u0CBE-\\u0CC4\\u0CC6-\\u0CC8\\u0CCA-\\u0CCD\\u0CD5\\u0CD6\\u0D02\\u0D03\\u0D3E-\\u0D43\\u0D46-\\u0D48\\u0D4A-\\u0D4D\\u0D57\\u0E31\\u0E34-\\u0E3A\\u0E47-\\u0E4E\\u0EB1\\u0EB4-\\u0EB9\\u0EBB\\u0EBC\\u0EC8-\\u0ECD\\u0F18\\u0F19\\u0F35\\u0F37\\u0F39\\u0F3E\\u0F3F\\u0F71-\\u0F84\\u0F86-\\u0F8B\\u0F90-\\u0F95\\u0F97\\u0F99-\\u0FAD\\u0FB1-\\u0FB7\\u0FB9\\u20D0-\\u20DC\\u20E1\\u302A-\\u302F\\u3099\\u309A'; const digit = '0-9\\u0660-\\u0669\\u06F0-\\u06F9\\u0966-\\u096F\\u09E6-\\u09EF\\u0A66-\\u0A6F\\u0AE6-\\u0AEF\\u0B66-\\u0B6F\\u0BE7-\\u0BEF\\u0C66-\\u0C6F\\u0CE6-\\u0CEF\\u0D66-\\u0D6F\\u0E50-\\u0E59\\u0ED0-\\u0ED9\\u0F20-\\u0F29'; const extender = '\\xB7\\u02D0\\u02D1\\u0387\\u0640\\u0E46\\u0EC6\\u3005\\u3031-\\u3035\\u309D\\u309E\\u30FC-\\u30FE'; const letter = 'A-Za-z\\xC0-\\xD6\\xD8-\\xF6\\xF8-\\u0131\\u0134-\\u013E\\u0141-\\u0148\\u014A-\\u017E\\u0180-\\u01C3\\u01CD-\\u01F0\\u01F4\\u01F5\\u01FA-\\u0217\\u0250-\\u02A8\\u02BB-\\u02C1\\u0386\\u0388-\\u038A\\u038C\\u038E-\\u03A1\\u03A3-\\u03CE\\u03D0-\\u03D6\\u03DA\\u03DC\\u03DE\\u03E0\\u03E2-\\u03F3\\u0401-\\u040C\\u040E-\\u044F\\u0451-\\u045C\\u045E-\\u0481\\u0490-\\u04C4\\u04C7\\u04C8\\u04CB\\u04CC\\u04D0-\\u04EB\\u04EE-\\u04F5\\u04F8\\u04F9\\u0531-\\u0556\\u0559\\u0561-\\u0586\\u05D0-\\u05EA\\u05F0-\\u05F2\\u0621-\\u063A\\u0641-\\u064A\\u0671-\\u06B7\\u06BA-\\u06BE\\u06C0-\\u06CE\\u06D0-\\u06D3\\u06D5\\u06E5\\u06E6\\u0905-\\u0939\\u093D\\u0958-\\u0961\\u0985-\\u098C\\u098F\\u0990\\u0993-\\u09A8\\u09AA-\\u09B0\\u09B2\\u09B6-\\u09B9\\u09DC\\u09DD\\u09DF-\\u09E1\\u09F0\\u09F1\\u0A05-\\u0A0A\\u0A0F\\u0A10\\u0A13-\\u0A28\\u0A2A-\\u0A30\\u0A32\\u0A33\\u0A35\\u0A36\\u0A38\\u0A39\\u0A59-\\u0A5C\\u0A5E\\u0A72-\\u0A74\\u0A85-\\u0A8B\\u0A8D\\u0A8F-\\u0A91\\u0A93-\\u0AA8\\u0AAA-\\u0AB0\\u0AB2\\u0AB3\\u0AB5-\\u0AB9\\u0ABD\\u0AE0\\u0B05-\\u0B0C\\u0B0F\\u0B10\\u0B13-\\u0B28\\u0B2A-\\u0B30\\u0B32\\u0B33\\u0B36-\\u0B39\\u0B3D\\u0B5C\\u0B5D\\u0B5F-\\u0B61\\u0B85-\\u0B8A\\u0B8E-\\u0B90\\u0B92-\\u0B95\\u0B99\\u0B9A\\u0B9C\\u0B9E\\u0B9F\\u0BA3\\u0BA4\\u0BA8-\\u0BAA\\u0BAE-\\u0BB5\\u0BB7-\\u0BB9\\u0C05-\\u0C0C\\u0C0E-\\u0C10\\u0C12-\\u0C28\\u0C2A-\\u0C33\\u0C35-\\u0C39\\u0C60\\u0C61\\u0C85-\\u0C8C\\u0C8E-\\u0C90\\u0C92-\\u0CA8\\u0CAA-\\u0CB3\\u0CB5-\\u0CB9\\u0CDE\\u0CE0\\u0CE1\\u0D05-\\u0D0C\\u0D0E-\\u0D10\\u0D12-\\u0D28\\u0D2A-\\u0D39\\u0D60\\u0D61\\u0E01-\\u0E2E\\u0E30\\u0E32\\u0E33\\u0E40-\\u0E45\\u0E81\\u0E82\\u0E84\\u0E87\\u0E88\\u0E8A\\u0E8D\\u0E94-\\u0E97\\u0E99-\\u0E9F\\u0EA1-\\u0EA3\\u0EA5\\u0EA7\\u0EAA\\u0EAB\\u0EAD\\u0EAE\\u0EB0\\u0EB2\\u0EB3\\u0EBD\\u0EC0-\\u0EC4\\u0F40-\\u0F47\\u0F49-\\u0F69\\u10A0-\\u10C5\\u10D0-\\u10F6\\u1100\\u1102\\u1103\\u1105-\\u1107\\u1109\\u110B\\u110C\\u110E-\\u1112\\u113C\\u113E\\u1140\\u114C\\u114E\\u1150\\u1154\\u1155\\u1159\\u115F-\\u1161\\u1163\\u1165\\u1167\\u1169\\u116D\\u116E\\u1172\\u1173\\u1175\\u119E\\u11A8\\u11AB\\u11AE\\u11AF\\u11B7\\u11B8\\u11BA\\u11BC-\\u11C2\\u11EB\\u11F0\\u11F9\\u1E00-\\u1E9B\\u1EA0-\\u1EF9\\u1F00-\\u1F15\\u1F18-\\u1F1D\\u1F20-\\u1F45\\u1F48-\\u1F4D\\u1F50-\\u1F57\\u1F59\\u1F5B\\u1F5D\\u1F5F-\\u1F7D\\u1F80-\\u1FB4\\u1FB6-\\u1FBC\\u1FBE\\u1FC2-\\u1FC4\\u1FC6-\\u1FCC\\u1FD0-\\u1FD3\\u1FD6-\\u1FDB\\u1FE0-\\u1FEC\\u1FF2-\\u1FF4\\u1FF6-\\u1FFC\\u2126\\u212A\\u212B\\u212E\\u2180-\\u2182\\u3007\\u3021-\\u3029\\u3041-\\u3094\\u30A1-\\u30FA\\u3105-\\u312C\\u4E00-\\u9FA5\\uAC00-\\uD7A3'; const ncname = '[' + letter + '_][' + letter + digit + '\\.\\-_' + combiningChar + extender + ']*'; return '((?:' + ncname + '\\:)?' + ncname + ')'; })(); const startTagOpen = new RegExp('^<' + qnameCapture); const startTagClose = /^\s*(\/?)>/; const endTag = new RegExp('^<\\/' + qnameCapture + '[^>]*>'); const doctype = /^]+>/i; let IS_REGEX_CAPTURING_BROKEN = false; 'x'.replace(/x(.)?/g, function (m, g) { IS_REGEX_CAPTURING_BROKEN = g === ''; }); // Empty Elements const empty = new CaseInsensitiveSet(['area', 'base', 'basefont', 'br', 'col', 'embed', 'frame', 'hr', 'img', 'input', 'isindex', 'keygen', 'link', 'meta', 'param', 'source', 'track', 'wbr']); // Inline Elements const inline = new CaseInsensitiveSet(['a', 'abbr', 'acronym', 'applet', 'b', 'basefont', 'bdo', 'big', 'br', 'button', 'cite', 'code', 'del', 'dfn', 'em', 'font', 'i', 'iframe', 'img', 'input', 'ins', 'kbd', 'label', 'map', 'noscript', 'object', 'q', 's', 'samp', 'script', 'select', 'small', 'span', 'strike', 'strong', 'sub', 'sup', 'svg', 'textarea', 'tt', 'u', 'var']); // Elements that you can, intentionally, leave open // (and which close themselves) const closeSelf = new CaseInsensitiveSet(['colgroup', 'dd', 'dt', 'li', 'option', 'p', 'td', 'tfoot', 'th', 'thead', 'tr', 'source']); // Attributes that have their values filled in disabled='disabled' const fillAttrs = new CaseInsensitiveSet(['checked', 'compact', 'declare', 'defer', 'disabled', 'ismap', 'multiple', 'nohref', 'noresize', 'noshade', 'nowrap', 'readonly', 'selected']); // Special Elements (can contain anything) const special = new CaseInsensitiveSet(['script', 'style']); // HTML5 tags https://html.spec.whatwg.org/multipage/indices.html#elements-3 // Phrasing Content https://html.spec.whatwg.org/multipage/dom.html#phrasing-content const nonPhrasing = new CaseInsensitiveSet(['address', 'article', 'aside', 'base', 'blockquote', 'body', 'caption', 'col', 'colgroup', 'dd', 'details', 'dialog', 'div', 'dl', 'dt', 'fieldset', 'figcaption', 'figure', 'footer', 'form', 'h1', 'h2', 'h3', 'h4', 'h5', 'h6', 'head', 'header', 'hgroup', 'hr', 'html', 'legend', 'li', 'menuitem', 'meta', 'ol', 'optgroup', 'option', 'param', 'rp', 'rt', 'source', 'style', 'summary', 'tbody', 'td', 'tfoot', 'th', 'thead', 'title', 'tr', 'track', 'ul']); const reCache = {}; function attrForHandler(handler) { let pattern = singleAttrIdentifier.source + '(?:\\s*(' + joinSingleAttrAssigns(handler) + ')' + '[ \\t\\n\\f\\r]*(?:' + singleAttrValues.join('|') + '))?'; if (handler.customAttrSurround) { const attrClauses = []; for (let i = handler.customAttrSurround.length - 1; i >= 0; i--) { attrClauses[i] = '(?:' + '(' + handler.customAttrSurround[i][0].source + ')\\s*' + pattern + '\\s*(' + handler.customAttrSurround[i][1].source + ')' + ')'; } attrClauses.push('(?:' + pattern + ')'); pattern = '(?:' + attrClauses.join('|') + ')'; } return new RegExp('^\\s*' + pattern); } function joinSingleAttrAssigns(handler) { return singleAttrAssigns.concat( handler.customAttrAssign || [] ).map(function (assign) { return '(?:' + assign.source + ')'; }).join('|'); } class HTMLParser { constructor(html, handler) { this.html = html; this.handler = handler; } async parse() { let html = this.html; const handler = this.handler; const stack = []; let lastTag; const attribute = attrForHandler(handler); let last, prevTag, nextTag; while (html) { last = html; // Make sure we're not in a script or style element if (!lastTag || !special.has(lastTag)) { let textEnd = html.indexOf('<'); if (textEnd === 0) { // Comment: if (/^'); if (commentEnd >= 0) { if (handler.comment) { await handler.comment(html.substring(4, commentEnd)); } html = html.substring(commentEnd + 3); prevTag = ''; continue; } } // https://en.wikipedia.org/wiki/Conditional_comment#Downlevel-revealed_conditional_comment if (/^'); if (conditionalEnd >= 0) { if (handler.comment) { await handler.comment(html.substring(2, conditionalEnd + 1), true /* non-standard */); } html = html.substring(conditionalEnd + 2); prevTag = ''; continue; } } // Doctype: const doctypeMatch = html.match(doctype); if (doctypeMatch) { if (handler.doctype) { handler.doctype(doctypeMatch[0]); } html = html.substring(doctypeMatch[0].length); prevTag = ''; continue; } // End tag: const endTagMatch = html.match(endTag); if (endTagMatch) { html = html.substring(endTagMatch[0].length); await replaceAsync(endTagMatch[0], endTag, parseEndTag); prevTag = '/' + endTagMatch[1].toLowerCase(); continue; } // Start tag: const startTagMatch = parseStartTag(html); if (startTagMatch) { html = startTagMatch.rest; await handleStartTag(startTagMatch); prevTag = startTagMatch.tagName.toLowerCase(); continue; } // Treat `<` as text if (handler.continueOnParseError) { textEnd = html.indexOf('<', 1); } } let text; if (textEnd >= 0) { text = html.substring(0, textEnd); html = html.substring(textEnd); } else { text = html; html = ''; } // next tag let nextTagMatch = parseStartTag(html); if (nextTagMatch) { nextTag = nextTagMatch.tagName; } else { nextTagMatch = html.match(endTag); if (nextTagMatch) { nextTag = '/' + nextTagMatch[1]; } else { nextTag = ''; } } if (handler.chars) { await handler.chars(text, prevTag, nextTag); } prevTag = ''; } else { const stackedTag = lastTag.toLowerCase(); const reStackedTag = reCache[stackedTag] || (reCache[stackedTag] = new RegExp('([\\s\\S]*?)' + stackedTag + '[^>]*>', 'i')); html = await replaceAsync(html, reStackedTag, async (_, text) => { if (stackedTag !== 'script' && stackedTag !== 'style' && stackedTag !== 'noscript') { text = text .replace(//g, '$1') .replace(//g, '$1'); } if (handler.chars) { await handler.chars(text); } return ''; }); await parseEndTag('' + stackedTag + '>', stackedTag); } if (html === last) { throw new Error('Parse Error: ' + html); } } if (!handler.partialMarkup) { // Clean up any remaining tags await parseEndTag(); } function parseStartTag(input) { const start = input.match(startTagOpen); if (start) { const match = { tagName: start[1], attrs: [] }; input = input.slice(start[0].length); let end, attr; while (!(end = input.match(startTagClose)) && (attr = input.match(attribute))) { input = input.slice(attr[0].length); match.attrs.push(attr); } if (end) { match.unarySlash = end[1]; match.rest = input.slice(end[0].length); return match; } } } async function closeIfFound(tagName) { if (findTag(tagName) >= 0) { await parseEndTag('', tagName); return true; } } async function handleStartTag(match) { const tagName = match.tagName; let unarySlash = match.unarySlash; if (handler.html5) { if (lastTag === 'p' && nonPhrasing.has(tagName)) { await parseEndTag('', lastTag); } else if (tagName === 'tbody') { await closeIfFound('thead'); } else if (tagName === 'tfoot') { if (!await closeIfFound('tbody')) { await closeIfFound('thead'); } } if (tagName === 'col' && findTag('colgroup') < 0) { lastTag = 'colgroup'; stack.push({ tag: lastTag, attrs: [] }); if (handler.start) { await handler.start(lastTag, [], false, ''); } } } if (!handler.html5 && !inline.has(tagName)) { while (lastTag && inline.has(lastTag)) { await parseEndTag('', lastTag); } } if (closeSelf.has(tagName) && lastTag === tagName) { await parseEndTag('', tagName); } const unary = empty.has(tagName) || (tagName === 'html' && lastTag === 'head') || !!unarySlash; const attrs = match.attrs.map(function (args) { let name, value, customOpen, customClose, customAssign, quote; const ncp = 7; // number of captured parts, scalar // hackish work around FF bug https://bugzilla.mozilla.org/show_bug.cgi?id=369778 if (IS_REGEX_CAPTURING_BROKEN && args[0].indexOf('""') === -1) { if (args[3] === '') { delete args[3]; } if (args[4] === '') { delete args[4]; } if (args[5] === '') { delete args[5]; } } function populate(index) { customAssign = args[index]; value = args[index + 1]; if (typeof value !== 'undefined') { return '"'; } value = args[index + 2]; if (typeof value !== 'undefined') { return '\''; } value = args[index + 3]; if (typeof value === 'undefined' && fillAttrs.has(name)) { value = name; } return ''; } let j = 1; if (handler.customAttrSurround) { for (let i = 0, l = handler.customAttrSurround.length; i < l; i++, j += ncp) { name = args[j + 1]; if (name) { quote = populate(j + 2); customOpen = args[j]; customClose = args[j + 6]; break; } } } if (!name && (name = args[j])) { quote = populate(j + 1); } return { name, value, customAssign: customAssign || '=', customOpen: customOpen || '', customClose: customClose || '', quote: quote || '' }; }); if (!unary) { stack.push({ tag: tagName, attrs }); lastTag = tagName; unarySlash = ''; } if (handler.start) { await handler.start(tagName, attrs, unary, unarySlash); } } function findTag(tagName) { let pos; const needle = tagName.toLowerCase(); for (pos = stack.length - 1; pos >= 0; pos--) { if (stack[pos].tag.toLowerCase() === needle) { break; } } return pos; } async function parseEndTag(tag, tagName) { let pos; // Find the closest opened tag of the same type if (tagName) { pos = findTag(tagName); } else { // If no tag name is provided, clean shop pos = 0; } if (pos >= 0) { // Close all the open elements, up the stack for (let i = stack.length - 1; i >= pos; i--) { if (handler.end) { handler.end(stack[i].tag, stack[i].attrs, i > pos || !tag); } } // Remove the open elements from the stack stack.length = pos; lastTag = pos && stack[pos - 1].tag; } else if (tagName.toLowerCase() === 'br') { if (handler.start) { await handler.start(tagName, [], true, ''); } } else if (tagName.toLowerCase() === 'p') { if (handler.start) { await handler.start(tagName, [], false, '', true); } if (handler.end) { handler.end(tagName, []); } } } } } class Sorter { sort(tokens, fromIndex = 0) { for (let i = 0, len = this.keys.length; i < len; i++) { const key = this.keys[i]; const token = key.slice(1); let index = tokens.indexOf(token, fromIndex); if (index !== -1) { do { if (index !== fromIndex) { tokens.splice(index, 1); tokens.splice(fromIndex, 0, token); } fromIndex++; } while ((index = tokens.indexOf(token, fromIndex)) !== -1); return this[key].sort(tokens, fromIndex); } } return tokens; } } class TokenChain { add(tokens) { tokens.forEach((token) => { const key = '$' + token; if (!this[key]) { this[key] = []; this[key].processed = 0; } this[key].push(tokens); }); } createSorter() { const sorter = new Sorter(); sorter.keys = Object.keys(this).sort((j, k) => { const m = this[j].length; const n = this[k].length; return m < n ? 1 : m > n ? -1 : j < k ? -1 : j > k ? 1 : 0; }).filter((key) => { if (this[key].processed < this[key].length) { const token = key.slice(1); const chain = new TokenChain(); this[key].forEach((tokens) => { let index; while ((index = tokens.indexOf(token)) !== -1) { tokens.splice(index, 1); } tokens.forEach((token) => { this['$' + token].processed++; }); chain.add(tokens.slice(0)); }); sorter[key] = chain.createSorter(); return true; } return false; }); return sorter; } } function trimWhitespace(str) { return str && str.replace(/^[ \n\r\t\f]+/, '').replace(/[ \n\r\t\f]+$/, ''); } function collapseWhitespaceAll(str) { // Non-breaking space is specifically handled inside the replacer function here: return str && str.replace(/[ \n\r\t\f\xA0]+/g, function (spaces) { return spaces === '\t' ? '\t' : spaces.replace(/(^|\xA0+)[^\xA0]+/g, '$1 '); }); } function collapseWhitespace(str, options, trimLeft, trimRight, collapseAll) { let lineBreakBefore = ''; let lineBreakAfter = ''; if (options.preserveLineBreaks) { str = str.replace(/^[ \n\r\t\f]*?[\n\r][ \n\r\t\f]*/, function () { lineBreakBefore = '\n'; return ''; }).replace(/[ \n\r\t\f]*?[\n\r][ \n\r\t\f]*$/, function () { lineBreakAfter = '\n'; return ''; }); } if (trimLeft) { // Non-breaking space is specifically handled inside the replacer function here: str = str.replace(/^[ \n\r\t\f\xA0]+/, function (spaces) { const conservative = !lineBreakBefore && options.conservativeCollapse; if (conservative && spaces === '\t') { return '\t'; } return spaces.replace(/^[^\xA0]+/, '').replace(/(\xA0+)[^\xA0]+/g, '$1 ') || (conservative ? ' ' : ''); }); } if (trimRight) { // Non-breaking space is specifically handled inside the replacer function here: str = str.replace(/[ \n\r\t\f\xA0]+$/, function (spaces) { const conservative = !lineBreakAfter && options.conservativeCollapse; if (conservative && spaces === '\t') { return '\t'; } return spaces.replace(/[^\xA0]+(\xA0+)/g, ' $1').replace(/[^\xA0]+$/, '') || (conservative ? ' ' : ''); }); } if (collapseAll) { // strip non space whitespace then compress spaces to one str = collapseWhitespaceAll(str); } return lineBreakBefore + str + lineBreakAfter; } // non-empty tags that will maintain whitespace around them const inlineTags = new Set(['a', 'abbr', 'acronym', 'b', 'bdi', 'bdo', 'big', 'button', 'cite', 'code', 'del', 'dfn', 'em', 'font', 'i', 'ins', 'kbd', 'label', 'mark', 'math', 'nobr', 'object', 'q', 'rp', 'rt', 'rtc', 'ruby', 's', 'samp', 'select', 'small', 'span', 'strike', 'strong', 'sub', 'sup', 'svg', 'textarea', 'time', 'tt', 'u', 'var']); // non-empty tags that will maintain whitespace within them const inlineTextTags = new Set(['a', 'abbr', 'acronym', 'b', 'big', 'del', 'em', 'font', 'i', 'ins', 'kbd', 'mark', 'nobr', 'rp', 's', 'samp', 'small', 'span', 'strike', 'strong', 'sub', 'sup', 'time', 'tt', 'u', 'var']); // self-closing tags that will maintain whitespace around them const selfClosingInlineTags = new Set(['comment', 'img', 'input', 'wbr']); function collapseWhitespaceSmart(str, prevTag, nextTag, options) { let trimLeft = prevTag && !selfClosingInlineTags.has(prevTag); if (trimLeft && !options.collapseInlineTagWhitespace) { trimLeft = prevTag.charAt(0) === '/' ? !inlineTags.has(prevTag.slice(1)) : !inlineTextTags.has(prevTag); } let trimRight = nextTag && !selfClosingInlineTags.has(nextTag); if (trimRight && !options.collapseInlineTagWhitespace) { trimRight = nextTag.charAt(0) === '/' ? !inlineTextTags.has(nextTag.slice(1)) : !inlineTags.has(nextTag); } return collapseWhitespace(str, options, trimLeft, trimRight, prevTag && nextTag); } function isConditionalComment(text) { return /^\[if\s[^\]]+]|\[endif]$/.test(text); } function isIgnoredComment(text, options) { for (let i = 0, len = options.ignoreCustomComments.length; i < len; i++) { if (options.ignoreCustomComments[i].test(text)) { return true; } } return false; } function isEventAttribute(attrName, options) { const patterns = options.customEventAttributes; if (patterns) { for (let i = patterns.length; i--;) { if (patterns[i].test(attrName)) { return true; } } return false; } return /^on[a-z]{3,}$/.test(attrName); } function canRemoveAttributeQuotes(value) { // https://mathiasbynens.be/notes/unquoted-attribute-values return /^[^ \t\n\f\r"'`=<>]+$/.test(value); } function attributesInclude(attributes, attribute) { for (let i = attributes.length; i--;) { if (attributes[i].name.toLowerCase() === attribute) { return true; } } return false; } function isAttributeRedundant(tag, attrName, attrValue, attrs) { attrValue = attrValue ? trimWhitespace(attrValue.toLowerCase()) : ''; return ( (tag === 'script' && attrName === 'language' && attrValue === 'javascript') || (tag === 'form' && attrName === 'method' && attrValue === 'get') || (tag === 'input' && attrName === 'type' && attrValue === 'text') || (tag === 'script' && attrName === 'charset' && !attributesInclude(attrs, 'src')) || (tag === 'a' && attrName === 'name' && attributesInclude(attrs, 'id')) || (tag === 'area' && attrName === 'shape' && attrValue === 'rect') ); } // https://mathiasbynens.be/demo/javascript-mime-type // https://developer.mozilla.org/en/docs/Web/HTML/Element/script#attr-type const executableScriptsMimetypes = new Set([ 'text/javascript', 'text/ecmascript', 'text/jscript', 'application/javascript', 'application/x-javascript', 'application/ecmascript', 'module' ]); const keepScriptsMimetypes = new Set([ 'module' ]); function isScriptTypeAttribute(attrValue = '') { attrValue = trimWhitespace(attrValue.split(/;/, 2)[0]).toLowerCase(); return attrValue === '' || executableScriptsMimetypes.has(attrValue); } function keepScriptTypeAttribute(attrValue = '') { attrValue = trimWhitespace(attrValue.split(/;/, 2)[0]).toLowerCase(); return keepScriptsMimetypes.has(attrValue); } function isExecutableScript(tag, attrs) { if (tag !== 'script') { return false; } for (let i = 0, len = attrs.length; i < len; i++) { const attrName = attrs[i].name.toLowerCase(); if (attrName === 'type') { return isScriptTypeAttribute(attrs[i].value); } } return true; } function isStyleLinkTypeAttribute(attrValue = '') { attrValue = trimWhitespace(attrValue).toLowerCase(); return attrValue === '' || attrValue === 'text/css'; } function isStyleSheet(tag, attrs) { if (tag !== 'style') { return false; } for (let i = 0, len = attrs.length; i < len; i++) { const attrName = attrs[i].name.toLowerCase(); if (attrName === 'type') { return isStyleLinkTypeAttribute(attrs[i].value); } } return true; } const isSimpleBoolean = new Set(['allowfullscreen', 'async', 'autofocus', 'autoplay', 'checked', 'compact', 'controls', 'declare', 'default', 'defaultchecked', 'defaultmuted', 'defaultselected', 'defer', 'disabled', 'enabled', 'formnovalidate', 'hidden', 'indeterminate', 'inert', 'ismap', 'itemscope', 'loop', 'multiple', 'muted', 'nohref', 'noresize', 'noshade', 'novalidate', 'nowrap', 'open', 'pauseonexit', 'readonly', 'required', 'reversed', 'scoped', 'seamless', 'selected', 'sortable', 'truespeed', 'typemustmatch', 'visible']); const isBooleanValue = new Set(['true', 'false']); function isBooleanAttribute(attrName, attrValue) { return isSimpleBoolean.has(attrName) || (attrName === 'draggable' && !isBooleanValue.has(attrValue)); } function isUriTypeAttribute(attrName, tag) { return ( (/^(?:a|area|link|base)$/.test(tag) && attrName === 'href') || (tag === 'img' && /^(?:src|longdesc|usemap)$/.test(attrName)) || (tag === 'object' && /^(?:classid|codebase|data|usemap)$/.test(attrName)) || (tag === 'q' && attrName === 'cite') || (tag === 'blockquote' && attrName === 'cite') || ((tag === 'ins' || tag === 'del') && attrName === 'cite') || (tag === 'form' && attrName === 'action') || (tag === 'input' && (attrName === 'src' || attrName === 'usemap')) || (tag === 'head' && attrName === 'profile') || (tag === 'script' && (attrName === 'src' || attrName === 'for')) ); } function isNumberTypeAttribute(attrName, tag) { return ( (/^(?:a|area|object|button)$/.test(tag) && attrName === 'tabindex') || (tag === 'input' && (attrName === 'maxlength' || attrName === 'tabindex')) || (tag === 'select' && (attrName === 'size' || attrName === 'tabindex')) || (tag === 'textarea' && /^(?:rows|cols|tabindex)$/.test(attrName)) || (tag === 'colgroup' && attrName === 'span') || (tag === 'col' && attrName === 'span') || ((tag === 'th' || tag === 'td') && (attrName === 'rowspan' || attrName === 'colspan')) ); } function isLinkType(tag, attrs, value) { if (tag !== 'link') { return false; } for (let i = 0, len = attrs.length; i < len; i++) { if (attrs[i].name === 'rel' && attrs[i].value === value) { return true; } } } function isMediaQuery(tag, attrs, attrName) { return attrName === 'media' && (isLinkType(tag, attrs, 'stylesheet') || isStyleSheet(tag, attrs)); } const srcsetTags = new Set(['img', 'source']); function isSrcset(attrName, tag) { return attrName === 'srcset' && srcsetTags.has(tag); } async function cleanAttributeValue(tag, attrName, attrValue, options, attrs) { if (isEventAttribute(attrName, options)) { attrValue = trimWhitespace(attrValue).replace(/^javascript:\s*/i, ''); return options.minifyJS(attrValue, true); } else if (attrName === 'class') { attrValue = trimWhitespace(attrValue); if (options.sortClassName) { attrValue = options.sortClassName(attrValue); } else { attrValue = collapseWhitespaceAll(attrValue); } return attrValue; } else if (isUriTypeAttribute(attrName, tag)) { attrValue = trimWhitespace(attrValue); return isLinkType(tag, attrs, 'canonical') ? attrValue : options.minifyURLs(attrValue); } else if (isNumberTypeAttribute(attrName, tag)) { return trimWhitespace(attrValue); } else if (attrName === 'style') { attrValue = trimWhitespace(attrValue); if (attrValue) { if (/;$/.test(attrValue) && !/?[0-9a-zA-Z]+;$/.test(attrValue)) { attrValue = attrValue.replace(/\s*;$/, ';'); } attrValue = await options.minifyCSS(attrValue, 'inline'); } return attrValue; } else if (isSrcset(attrName, tag)) { // https://html.spec.whatwg.org/multipage/embedded-content.html#attr-img-srcset attrValue = trimWhitespace(attrValue).split(/\s+,\s*|\s*,\s+/).map(function (candidate) { let url = candidate; let descriptor = ''; const match = candidate.match(/\s+([1-9][0-9]*w|[0-9]+(?:\.[0-9]+)?x)$/); if (match) { url = url.slice(0, -match[0].length); const num = +match[1].slice(0, -1); const suffix = match[1].slice(-1); if (num !== 1 || suffix !== 'x') { descriptor = ' ' + num + suffix; } } return options.minifyURLs(url) + descriptor; }).join(', '); } else if (isMetaViewport(tag, attrs) && attrName === 'content') { attrValue = attrValue.replace(/\s+/g, '').replace(/[0-9]+\.[0-9]+/g, function (numString) { // "0.90000" -> "0.9" // "1.0" -> "1" // "1.0001" -> "1.0001" (unchanged) return (+numString).toString(); }); } else if (isContentSecurityPolicy(tag, attrs) && attrName.toLowerCase() === 'content') { return collapseWhitespaceAll(attrValue); } else if (options.customAttrCollapse && options.customAttrCollapse.test(attrName)) { attrValue = trimWhitespace(attrValue.replace(/ ?[\n\r]+ ?/g, '').replace(/\s{2,}/g, options.conservativeCollapse ? ' ' : '')); } else if (tag === 'script' && attrName === 'type') { attrValue = trimWhitespace(attrValue.replace(/\s*;\s*/g, ';')); } else if (isMediaQuery(tag, attrs, attrName)) { attrValue = trimWhitespace(attrValue); return options.minifyCSS(attrValue, 'media'); } return attrValue; } function isMetaViewport(tag, attrs) { if (tag !== 'meta') { return false; } for (let i = 0, len = attrs.length; i < len; i++) { if (attrs[i].name === 'name' && attrs[i].value === 'viewport') { return true; } } } function isContentSecurityPolicy(tag, attrs) { if (tag !== 'meta') { return false; } for (let i = 0, len = attrs.length; i < len; i++) { if (attrs[i].name.toLowerCase() === 'http-equiv' && attrs[i].value.toLowerCase() === 'content-security-policy') { return true; } } } function ignoreCSS(id) { return '/* clean-css ignore:start */' + id + '/* clean-css ignore:end */'; } // Wrap CSS declarations for CleanCSS > 3.x // See https://github.com/jakubpawlowicz/clean-css/issues/418 function wrapCSS(text, type) { switch (type) { case 'inline': return '*{' + text + '}'; case 'media': return '@media ' + text + '{a{top:0}}'; default: return text; } } function unwrapCSS(text, type) { let matches; switch (type) { case 'inline': matches = text.match(/^\*\{([\s\S]*)\}$/); break; case 'media': matches = text.match(/^@media ([\s\S]*?)\s*{[\s\S]*}$/); break; } return matches ? matches[1] : text; } async function cleanConditionalComment(comment, options) { return options.processConditionalComments ? await replaceAsync(comment, /^(\[if\s[^\]]+]>)([\s\S]*?)( -1) { return await minifyHTML(text, options); } } return text; } // Tag omission rules from https://html.spec.whatwg.org/multipage/syntax.html#optional-tags // with the following deviations: // - retain
if followed by