mirror of
https://github.com/Snigdha-OS/documentation.git
synced 2025-09-07 19:25:13 +02:00
1367 lines
47 KiB
JavaScript
1367 lines
47 KiB
JavaScript
import CleanCSS from 'clean-css';
|
|
import { decodeHTMLStrict, decodeHTML } from 'entities';
|
|
import RelateURL from 'relateurl';
|
|
import { minify as terser } from 'terser';
|
|
|
|
import { HTMLParser, endTag } from './htmlparser.js';
|
|
import TokenChain from './tokenchain.js';
|
|
import { replaceAsync } from './utils.js';
|
|
|
|
function trimWhitespace(str) {
|
|
return str && str.replace(/^[ \n\r\t\f]+/, '').replace(/[ \n\r\t\f]+$/, '');
|
|
}
|
|
|
|
function collapseWhitespaceAll(str) {
|
|
// Non-breaking space is specifically handled inside the replacer function here:
|
|
return str && str.replace(/[ \n\r\t\f\xA0]+/g, function (spaces) {
|
|
return spaces === '\t' ? '\t' : spaces.replace(/(^|\xA0+)[^\xA0]+/g, '$1 ');
|
|
});
|
|
}
|
|
|
|
function collapseWhitespace(str, options, trimLeft, trimRight, collapseAll) {
|
|
let lineBreakBefore = ''; let lineBreakAfter = '';
|
|
|
|
if (options.preserveLineBreaks) {
|
|
str = str.replace(/^[ \n\r\t\f]*?[\n\r][ \n\r\t\f]*/, function () {
|
|
lineBreakBefore = '\n';
|
|
return '';
|
|
}).replace(/[ \n\r\t\f]*?[\n\r][ \n\r\t\f]*$/, function () {
|
|
lineBreakAfter = '\n';
|
|
return '';
|
|
});
|
|
}
|
|
|
|
if (trimLeft) {
|
|
// Non-breaking space is specifically handled inside the replacer function here:
|
|
str = str.replace(/^[ \n\r\t\f\xA0]+/, function (spaces) {
|
|
const conservative = !lineBreakBefore && options.conservativeCollapse;
|
|
if (conservative && spaces === '\t') {
|
|
return '\t';
|
|
}
|
|
return spaces.replace(/^[^\xA0]+/, '').replace(/(\xA0+)[^\xA0]+/g, '$1 ') || (conservative ? ' ' : '');
|
|
});
|
|
}
|
|
|
|
if (trimRight) {
|
|
// Non-breaking space is specifically handled inside the replacer function here:
|
|
str = str.replace(/[ \n\r\t\f\xA0]+$/, function (spaces) {
|
|
const conservative = !lineBreakAfter && options.conservativeCollapse;
|
|
if (conservative && spaces === '\t') {
|
|
return '\t';
|
|
}
|
|
return spaces.replace(/[^\xA0]+(\xA0+)/g, ' $1').replace(/[^\xA0]+$/, '') || (conservative ? ' ' : '');
|
|
});
|
|
}
|
|
|
|
if (collapseAll) {
|
|
// strip non space whitespace then compress spaces to one
|
|
str = collapseWhitespaceAll(str);
|
|
}
|
|
|
|
return lineBreakBefore + str + lineBreakAfter;
|
|
}
|
|
|
|
// non-empty tags that will maintain whitespace around them
|
|
const inlineTags = new Set(['a', 'abbr', 'acronym', 'b', 'bdi', 'bdo', 'big', 'button', 'cite', 'code', 'del', 'dfn', 'em', 'font', 'i', 'ins', 'kbd', 'label', 'mark', 'math', 'nobr', 'object', 'q', 'rp', 'rt', 'rtc', 'ruby', 's', 'samp', 'select', 'small', 'span', 'strike', 'strong', 'sub', 'sup', 'svg', 'textarea', 'time', 'tt', 'u', 'var']);
|
|
// non-empty tags that will maintain whitespace within them
|
|
const inlineTextTags = new Set(['a', 'abbr', 'acronym', 'b', 'big', 'del', 'em', 'font', 'i', 'ins', 'kbd', 'mark', 'nobr', 'rp', 's', 'samp', 'small', 'span', 'strike', 'strong', 'sub', 'sup', 'time', 'tt', 'u', 'var']);
|
|
// self-closing tags that will maintain whitespace around them
|
|
const selfClosingInlineTags = new Set(['comment', 'img', 'input', 'wbr']);
|
|
|
|
function collapseWhitespaceSmart(str, prevTag, nextTag, options) {
|
|
let trimLeft = prevTag && !selfClosingInlineTags.has(prevTag);
|
|
if (trimLeft && !options.collapseInlineTagWhitespace) {
|
|
trimLeft = prevTag.charAt(0) === '/' ? !inlineTags.has(prevTag.slice(1)) : !inlineTextTags.has(prevTag);
|
|
}
|
|
let trimRight = nextTag && !selfClosingInlineTags.has(nextTag);
|
|
if (trimRight && !options.collapseInlineTagWhitespace) {
|
|
trimRight = nextTag.charAt(0) === '/' ? !inlineTextTags.has(nextTag.slice(1)) : !inlineTags.has(nextTag);
|
|
}
|
|
return collapseWhitespace(str, options, trimLeft, trimRight, prevTag && nextTag);
|
|
}
|
|
|
|
function isConditionalComment(text) {
|
|
return /^\[if\s[^\]]+]|\[endif]$/.test(text);
|
|
}
|
|
|
|
function isIgnoredComment(text, options) {
|
|
for (let i = 0, len = options.ignoreCustomComments.length; i < len; i++) {
|
|
if (options.ignoreCustomComments[i].test(text)) {
|
|
return true;
|
|
}
|
|
}
|
|
return false;
|
|
}
|
|
|
|
function isEventAttribute(attrName, options) {
|
|
const patterns = options.customEventAttributes;
|
|
if (patterns) {
|
|
for (let i = patterns.length; i--;) {
|
|
if (patterns[i].test(attrName)) {
|
|
return true;
|
|
}
|
|
}
|
|
return false;
|
|
}
|
|
return /^on[a-z]{3,}$/.test(attrName);
|
|
}
|
|
|
|
function canRemoveAttributeQuotes(value) {
|
|
// https://mathiasbynens.be/notes/unquoted-attribute-values
|
|
return /^[^ \t\n\f\r"'`=<>]+$/.test(value);
|
|
}
|
|
|
|
function attributesInclude(attributes, attribute) {
|
|
for (let i = attributes.length; i--;) {
|
|
if (attributes[i].name.toLowerCase() === attribute) {
|
|
return true;
|
|
}
|
|
}
|
|
return false;
|
|
}
|
|
|
|
function isAttributeRedundant(tag, attrName, attrValue, attrs) {
|
|
attrValue = attrValue ? trimWhitespace(attrValue.toLowerCase()) : '';
|
|
|
|
return (
|
|
(tag === 'script' &&
|
|
attrName === 'language' &&
|
|
attrValue === 'javascript') ||
|
|
|
|
(tag === 'form' &&
|
|
attrName === 'method' &&
|
|
attrValue === 'get') ||
|
|
|
|
(tag === 'input' &&
|
|
attrName === 'type' &&
|
|
attrValue === 'text') ||
|
|
|
|
(tag === 'script' &&
|
|
attrName === 'charset' &&
|
|
!attributesInclude(attrs, 'src')) ||
|
|
|
|
(tag === 'a' &&
|
|
attrName === 'name' &&
|
|
attributesInclude(attrs, 'id')) ||
|
|
|
|
(tag === 'area' &&
|
|
attrName === 'shape' &&
|
|
attrValue === 'rect')
|
|
);
|
|
}
|
|
|
|
// https://mathiasbynens.be/demo/javascript-mime-type
|
|
// https://developer.mozilla.org/en/docs/Web/HTML/Element/script#attr-type
|
|
const executableScriptsMimetypes = new Set([
|
|
'text/javascript',
|
|
'text/ecmascript',
|
|
'text/jscript',
|
|
'application/javascript',
|
|
'application/x-javascript',
|
|
'application/ecmascript',
|
|
'module'
|
|
]);
|
|
|
|
const keepScriptsMimetypes = new Set([
|
|
'module'
|
|
]);
|
|
|
|
function isScriptTypeAttribute(attrValue = '') {
|
|
attrValue = trimWhitespace(attrValue.split(/;/, 2)[0]).toLowerCase();
|
|
return attrValue === '' || executableScriptsMimetypes.has(attrValue);
|
|
}
|
|
|
|
function keepScriptTypeAttribute(attrValue = '') {
|
|
attrValue = trimWhitespace(attrValue.split(/;/, 2)[0]).toLowerCase();
|
|
return keepScriptsMimetypes.has(attrValue);
|
|
}
|
|
|
|
function isExecutableScript(tag, attrs) {
|
|
if (tag !== 'script') {
|
|
return false;
|
|
}
|
|
for (let i = 0, len = attrs.length; i < len; i++) {
|
|
const attrName = attrs[i].name.toLowerCase();
|
|
if (attrName === 'type') {
|
|
return isScriptTypeAttribute(attrs[i].value);
|
|
}
|
|
}
|
|
return true;
|
|
}
|
|
|
|
function isStyleLinkTypeAttribute(attrValue = '') {
|
|
attrValue = trimWhitespace(attrValue).toLowerCase();
|
|
return attrValue === '' || attrValue === 'text/css';
|
|
}
|
|
|
|
function isStyleSheet(tag, attrs) {
|
|
if (tag !== 'style') {
|
|
return false;
|
|
}
|
|
for (let i = 0, len = attrs.length; i < len; i++) {
|
|
const attrName = attrs[i].name.toLowerCase();
|
|
if (attrName === 'type') {
|
|
return isStyleLinkTypeAttribute(attrs[i].value);
|
|
}
|
|
}
|
|
return true;
|
|
}
|
|
|
|
const isSimpleBoolean = new Set(['allowfullscreen', 'async', 'autofocus', 'autoplay', 'checked', 'compact', 'controls', 'declare', 'default', 'defaultchecked', 'defaultmuted', 'defaultselected', 'defer', 'disabled', 'enabled', 'formnovalidate', 'hidden', 'indeterminate', 'inert', 'ismap', 'itemscope', 'loop', 'multiple', 'muted', 'nohref', 'noresize', 'noshade', 'novalidate', 'nowrap', 'open', 'pauseonexit', 'readonly', 'required', 'reversed', 'scoped', 'seamless', 'selected', 'sortable', 'truespeed', 'typemustmatch', 'visible']);
|
|
const isBooleanValue = new Set(['true', 'false']);
|
|
|
|
function isBooleanAttribute(attrName, attrValue) {
|
|
return isSimpleBoolean.has(attrName) || (attrName === 'draggable' && !isBooleanValue.has(attrValue));
|
|
}
|
|
|
|
function isUriTypeAttribute(attrName, tag) {
|
|
return (
|
|
(/^(?:a|area|link|base)$/.test(tag) && attrName === 'href') ||
|
|
(tag === 'img' && /^(?:src|longdesc|usemap)$/.test(attrName)) ||
|
|
(tag === 'object' && /^(?:classid|codebase|data|usemap)$/.test(attrName)) ||
|
|
(tag === 'q' && attrName === 'cite') ||
|
|
(tag === 'blockquote' && attrName === 'cite') ||
|
|
((tag === 'ins' || tag === 'del') && attrName === 'cite') ||
|
|
(tag === 'form' && attrName === 'action') ||
|
|
(tag === 'input' && (attrName === 'src' || attrName === 'usemap')) ||
|
|
(tag === 'head' && attrName === 'profile') ||
|
|
(tag === 'script' && (attrName === 'src' || attrName === 'for'))
|
|
);
|
|
}
|
|
|
|
function isNumberTypeAttribute(attrName, tag) {
|
|
return (
|
|
(/^(?:a|area|object|button)$/.test(tag) && attrName === 'tabindex') ||
|
|
(tag === 'input' && (attrName === 'maxlength' || attrName === 'tabindex')) ||
|
|
(tag === 'select' && (attrName === 'size' || attrName === 'tabindex')) ||
|
|
(tag === 'textarea' && /^(?:rows|cols|tabindex)$/.test(attrName)) ||
|
|
(tag === 'colgroup' && attrName === 'span') ||
|
|
(tag === 'col' && attrName === 'span') ||
|
|
((tag === 'th' || tag === 'td') && (attrName === 'rowspan' || attrName === 'colspan'))
|
|
);
|
|
}
|
|
|
|
function isLinkType(tag, attrs, value) {
|
|
if (tag !== 'link') {
|
|
return false;
|
|
}
|
|
for (let i = 0, len = attrs.length; i < len; i++) {
|
|
if (attrs[i].name === 'rel' && attrs[i].value === value) {
|
|
return true;
|
|
}
|
|
}
|
|
}
|
|
|
|
function isMediaQuery(tag, attrs, attrName) {
|
|
return attrName === 'media' && (isLinkType(tag, attrs, 'stylesheet') || isStyleSheet(tag, attrs));
|
|
}
|
|
|
|
const srcsetTags = new Set(['img', 'source']);
|
|
|
|
function isSrcset(attrName, tag) {
|
|
return attrName === 'srcset' && srcsetTags.has(tag);
|
|
}
|
|
|
|
async function cleanAttributeValue(tag, attrName, attrValue, options, attrs) {
|
|
if (isEventAttribute(attrName, options)) {
|
|
attrValue = trimWhitespace(attrValue).replace(/^javascript:\s*/i, '');
|
|
return options.minifyJS(attrValue, true);
|
|
} else if (attrName === 'class') {
|
|
attrValue = trimWhitespace(attrValue);
|
|
if (options.sortClassName) {
|
|
attrValue = options.sortClassName(attrValue);
|
|
} else {
|
|
attrValue = collapseWhitespaceAll(attrValue);
|
|
}
|
|
return attrValue;
|
|
} else if (isUriTypeAttribute(attrName, tag)) {
|
|
attrValue = trimWhitespace(attrValue);
|
|
return isLinkType(tag, attrs, 'canonical') ? attrValue : options.minifyURLs(attrValue);
|
|
} else if (isNumberTypeAttribute(attrName, tag)) {
|
|
return trimWhitespace(attrValue);
|
|
} else if (attrName === 'style') {
|
|
attrValue = trimWhitespace(attrValue);
|
|
if (attrValue) {
|
|
if (/;$/.test(attrValue) && !/&#?[0-9a-zA-Z]+;$/.test(attrValue)) {
|
|
attrValue = attrValue.replace(/\s*;$/, ';');
|
|
}
|
|
attrValue = await options.minifyCSS(attrValue, 'inline');
|
|
}
|
|
return attrValue;
|
|
} else if (isSrcset(attrName, tag)) {
|
|
// https://html.spec.whatwg.org/multipage/embedded-content.html#attr-img-srcset
|
|
attrValue = trimWhitespace(attrValue).split(/\s+,\s*|\s*,\s+/).map(function (candidate) {
|
|
let url = candidate;
|
|
let descriptor = '';
|
|
const match = candidate.match(/\s+([1-9][0-9]*w|[0-9]+(?:\.[0-9]+)?x)$/);
|
|
if (match) {
|
|
url = url.slice(0, -match[0].length);
|
|
const num = +match[1].slice(0, -1);
|
|
const suffix = match[1].slice(-1);
|
|
if (num !== 1 || suffix !== 'x') {
|
|
descriptor = ' ' + num + suffix;
|
|
}
|
|
}
|
|
return options.minifyURLs(url) + descriptor;
|
|
}).join(', ');
|
|
} else if (isMetaViewport(tag, attrs) && attrName === 'content') {
|
|
attrValue = attrValue.replace(/\s+/g, '').replace(/[0-9]+\.[0-9]+/g, function (numString) {
|
|
// "0.90000" -> "0.9"
|
|
// "1.0" -> "1"
|
|
// "1.0001" -> "1.0001" (unchanged)
|
|
return (+numString).toString();
|
|
});
|
|
} else if (isContentSecurityPolicy(tag, attrs) && attrName.toLowerCase() === 'content') {
|
|
return collapseWhitespaceAll(attrValue);
|
|
} else if (options.customAttrCollapse && options.customAttrCollapse.test(attrName)) {
|
|
attrValue = trimWhitespace(attrValue.replace(/ ?[\n\r]+ ?/g, '').replace(/\s{2,}/g, options.conservativeCollapse ? ' ' : ''));
|
|
} else if (tag === 'script' && attrName === 'type') {
|
|
attrValue = trimWhitespace(attrValue.replace(/\s*;\s*/g, ';'));
|
|
} else if (isMediaQuery(tag, attrs, attrName)) {
|
|
attrValue = trimWhitespace(attrValue);
|
|
return options.minifyCSS(attrValue, 'media');
|
|
}
|
|
return attrValue;
|
|
}
|
|
|
|
function isMetaViewport(tag, attrs) {
|
|
if (tag !== 'meta') {
|
|
return false;
|
|
}
|
|
for (let i = 0, len = attrs.length; i < len; i++) {
|
|
if (attrs[i].name === 'name' && attrs[i].value === 'viewport') {
|
|
return true;
|
|
}
|
|
}
|
|
}
|
|
|
|
function isContentSecurityPolicy(tag, attrs) {
|
|
if (tag !== 'meta') {
|
|
return false;
|
|
}
|
|
for (let i = 0, len = attrs.length; i < len; i++) {
|
|
if (attrs[i].name.toLowerCase() === 'http-equiv' && attrs[i].value.toLowerCase() === 'content-security-policy') {
|
|
return true;
|
|
}
|
|
}
|
|
}
|
|
|
|
function ignoreCSS(id) {
|
|
return '/* clean-css ignore:start */' + id + '/* clean-css ignore:end */';
|
|
}
|
|
|
|
// Wrap CSS declarations for CleanCSS > 3.x
|
|
// See https://github.com/jakubpawlowicz/clean-css/issues/418
|
|
function wrapCSS(text, type) {
|
|
switch (type) {
|
|
case 'inline':
|
|
return '*{' + text + '}';
|
|
case 'media':
|
|
return '@media ' + text + '{a{top:0}}';
|
|
default:
|
|
return text;
|
|
}
|
|
}
|
|
|
|
function unwrapCSS(text, type) {
|
|
let matches;
|
|
switch (type) {
|
|
case 'inline':
|
|
matches = text.match(/^\*\{([\s\S]*)\}$/);
|
|
break;
|
|
case 'media':
|
|
matches = text.match(/^@media ([\s\S]*?)\s*{[\s\S]*}$/);
|
|
break;
|
|
}
|
|
return matches ? matches[1] : text;
|
|
}
|
|
|
|
async function cleanConditionalComment(comment, options) {
|
|
return options.processConditionalComments
|
|
? await replaceAsync(comment, /^(\[if\s[^\]]+]>)([\s\S]*?)(<!\[endif])$/, async function (match, prefix, text, suffix) {
|
|
return prefix + await minifyHTML(text, options, true) + suffix;
|
|
})
|
|
: comment;
|
|
}
|
|
|
|
async function processScript(text, options, currentAttrs) {
|
|
for (let i = 0, len = currentAttrs.length; i < len; i++) {
|
|
if (currentAttrs[i].name.toLowerCase() === 'type' &&
|
|
options.processScripts.indexOf(currentAttrs[i].value) > -1) {
|
|
return await minifyHTML(text, options);
|
|
}
|
|
}
|
|
return text;
|
|
}
|
|
|
|
// Tag omission rules from https://html.spec.whatwg.org/multipage/syntax.html#optional-tags
|
|
// with the following deviations:
|
|
// - retain <body> if followed by <noscript>
|
|
// - </rb>, </rt>, </rtc>, </rp> & </tfoot> follow https://www.w3.org/TR/html5/syntax.html#optional-tags
|
|
// - retain all tags which are adjacent to non-standard HTML tags
|
|
const optionalStartTags = new Set(['html', 'head', 'body', 'colgroup', 'tbody']);
|
|
const optionalEndTags = new Set(['html', 'head', 'body', 'li', 'dt', 'dd', 'p', 'rb', 'rt', 'rtc', 'rp', 'optgroup', 'option', 'colgroup', 'caption', 'thead', 'tbody', 'tfoot', 'tr', 'td', 'th']);
|
|
const headerTags = new Set(['meta', 'link', 'script', 'style', 'template', 'noscript']);
|
|
const descriptionTags = new Set(['dt', 'dd']);
|
|
const pBlockTags = new Set(['address', 'article', 'aside', 'blockquote', 'details', 'div', 'dl', 'fieldset', 'figcaption', 'figure', 'footer', 'form', 'h1', 'h2', 'h3', 'h4', 'h5', 'h6', 'header', 'hgroup', 'hr', 'main', 'menu', 'nav', 'ol', 'p', 'pre', 'section', 'table', 'ul']);
|
|
const pInlineTags = new Set(['a', 'audio', 'del', 'ins', 'map', 'noscript', 'video']);
|
|
const rubyTags = new Set(['rb', 'rt', 'rtc', 'rp']);
|
|
const rtcTag = new Set(['rb', 'rtc', 'rp']);
|
|
const optionTag = new Set(['option', 'optgroup']);
|
|
const tableContentTags = new Set(['tbody', 'tfoot']);
|
|
const tableSectionTags = new Set(['thead', 'tbody', 'tfoot']);
|
|
const cellTags = new Set(['td', 'th']);
|
|
const topLevelTags = new Set(['html', 'head', 'body']);
|
|
const compactTags = new Set(['html', 'body']);
|
|
const looseTags = new Set(['head', 'colgroup', 'caption']);
|
|
const trailingTags = new Set(['dt', 'thead']);
|
|
const htmlTags = new Set(['a', 'abbr', 'acronym', 'address', 'applet', 'area', 'article', 'aside', 'audio', 'b', 'base', 'basefont', 'bdi', 'bdo', 'bgsound', 'big', 'blink', 'blockquote', 'body', 'br', 'button', 'canvas', 'caption', 'center', 'cite', 'code', 'col', 'colgroup', 'command', 'content', 'data', 'datalist', 'dd', 'del', 'details', 'dfn', 'dialog', 'dir', 'div', 'dl', 'dt', 'element', 'em', 'embed', 'fieldset', 'figcaption', 'figure', 'font', 'footer', 'form', 'frame', 'frameset', 'h1', 'h2', 'h3', 'h4', 'h5', 'h6', 'head', 'header', 'hgroup', 'hr', 'html', 'i', 'iframe', 'image', 'img', 'input', 'ins', 'isindex', 'kbd', 'keygen', 'label', 'legend', 'li', 'link', 'listing', 'main', 'map', 'mark', 'marquee', 'menu', 'menuitem', 'meta', 'meter', 'multicol', 'nav', 'nobr', 'noembed', 'noframes', 'noscript', 'object', 'ol', 'optgroup', 'option', 'output', 'p', 'param', 'picture', 'plaintext', 'pre', 'progress', 'q', 'rb', 'rp', 'rt', 'rtc', 'ruby', 's', 'samp', 'script', 'section', 'select', 'shadow', 'small', 'source', 'spacer', 'span', 'strike', 'strong', 'style', 'sub', 'summary', 'sup', 'table', 'tbody', 'td', 'template', 'textarea', 'tfoot', 'th', 'thead', 'time', 'title', 'tr', 'track', 'tt', 'u', 'ul', 'var', 'video', 'wbr', 'xmp']);
|
|
|
|
function canRemoveParentTag(optionalStartTag, tag) {
|
|
switch (optionalStartTag) {
|
|
case 'html':
|
|
case 'head':
|
|
return true;
|
|
case 'body':
|
|
return !headerTags.has(tag);
|
|
case 'colgroup':
|
|
return tag === 'col';
|
|
case 'tbody':
|
|
return tag === 'tr';
|
|
}
|
|
return false;
|
|
}
|
|
|
|
function isStartTagMandatory(optionalEndTag, tag) {
|
|
switch (tag) {
|
|
case 'colgroup':
|
|
return optionalEndTag === 'colgroup';
|
|
case 'tbody':
|
|
return tableSectionTags.has(optionalEndTag);
|
|
}
|
|
return false;
|
|
}
|
|
|
|
function canRemovePrecedingTag(optionalEndTag, tag) {
|
|
switch (optionalEndTag) {
|
|
case 'html':
|
|
case 'head':
|
|
case 'body':
|
|
case 'colgroup':
|
|
case 'caption':
|
|
return true;
|
|
case 'li':
|
|
case 'optgroup':
|
|
case 'tr':
|
|
return tag === optionalEndTag;
|
|
case 'dt':
|
|
case 'dd':
|
|
return descriptionTags.has(tag);
|
|
case 'p':
|
|
return pBlockTags.has(tag);
|
|
case 'rb':
|
|
case 'rt':
|
|
case 'rp':
|
|
return rubyTags.has(tag);
|
|
case 'rtc':
|
|
return rtcTag.has(tag);
|
|
case 'option':
|
|
return optionTag.has(tag);
|
|
case 'thead':
|
|
case 'tbody':
|
|
return tableContentTags.has(tag);
|
|
case 'tfoot':
|
|
return tag === 'tbody';
|
|
case 'td':
|
|
case 'th':
|
|
return cellTags.has(tag);
|
|
}
|
|
return false;
|
|
}
|
|
|
|
const reEmptyAttribute = new RegExp(
|
|
'^(?:class|id|style|title|lang|dir|on(?:focus|blur|change|click|dblclick|mouse(' +
|
|
'?:down|up|over|move|out)|key(?:press|down|up)))$');
|
|
|
|
function canDeleteEmptyAttribute(tag, attrName, attrValue, options) {
|
|
const isValueEmpty = !attrValue || /^\s*$/.test(attrValue);
|
|
if (!isValueEmpty) {
|
|
return false;
|
|
}
|
|
if (typeof options.removeEmptyAttributes === 'function') {
|
|
return options.removeEmptyAttributes(attrName, tag);
|
|
}
|
|
return (tag === 'input' && attrName === 'value') || reEmptyAttribute.test(attrName);
|
|
}
|
|
|
|
function hasAttrName(name, attrs) {
|
|
for (let i = attrs.length - 1; i >= 0; i--) {
|
|
if (attrs[i].name === name) {
|
|
return true;
|
|
}
|
|
}
|
|
return false;
|
|
}
|
|
|
|
function canRemoveElement(tag, attrs) {
|
|
switch (tag) {
|
|
case 'textarea':
|
|
return false;
|
|
case 'audio':
|
|
case 'script':
|
|
case 'video':
|
|
if (hasAttrName('src', attrs)) {
|
|
return false;
|
|
}
|
|
break;
|
|
case 'iframe':
|
|
if (hasAttrName('src', attrs) || hasAttrName('srcdoc', attrs)) {
|
|
return false;
|
|
}
|
|
break;
|
|
case 'object':
|
|
if (hasAttrName('data', attrs)) {
|
|
return false;
|
|
}
|
|
break;
|
|
case 'applet':
|
|
if (hasAttrName('code', attrs)) {
|
|
return false;
|
|
}
|
|
break;
|
|
}
|
|
return true;
|
|
}
|
|
|
|
function canCollapseWhitespace(tag) {
|
|
return !/^(?:script|style|pre|textarea)$/.test(tag);
|
|
}
|
|
|
|
function canTrimWhitespace(tag) {
|
|
return !/^(?:pre|textarea)$/.test(tag);
|
|
}
|
|
|
|
async function normalizeAttr(attr, attrs, tag, options) {
|
|
const attrName = options.name(attr.name);
|
|
let attrValue = attr.value;
|
|
|
|
if (options.decodeEntities && attrValue) {
|
|
attrValue = decodeHTMLStrict(attrValue);
|
|
}
|
|
|
|
if ((options.removeRedundantAttributes &&
|
|
isAttributeRedundant(tag, attrName, attrValue, attrs)) ||
|
|
(options.removeScriptTypeAttributes && tag === 'script' &&
|
|
attrName === 'type' && isScriptTypeAttribute(attrValue) && !keepScriptTypeAttribute(attrValue)) ||
|
|
(options.removeStyleLinkTypeAttributes && (tag === 'style' || tag === 'link') &&
|
|
attrName === 'type' && isStyleLinkTypeAttribute(attrValue))) {
|
|
return;
|
|
}
|
|
|
|
if (attrValue) {
|
|
attrValue = await cleanAttributeValue(tag, attrName, attrValue, options, attrs);
|
|
}
|
|
|
|
if (options.removeEmptyAttributes &&
|
|
canDeleteEmptyAttribute(tag, attrName, attrValue, options)) {
|
|
return;
|
|
}
|
|
|
|
if (options.decodeEntities && attrValue) {
|
|
attrValue = attrValue.replace(/&(#?[0-9a-zA-Z]+;)/g, '&$1');
|
|
}
|
|
|
|
return {
|
|
attr,
|
|
name: attrName,
|
|
value: attrValue
|
|
};
|
|
}
|
|
|
|
function buildAttr(normalized, hasUnarySlash, options, isLast, uidAttr) {
|
|
const attrName = normalized.name;
|
|
let attrValue = normalized.value;
|
|
const attr = normalized.attr;
|
|
let attrQuote = attr.quote;
|
|
let attrFragment;
|
|
let emittedAttrValue;
|
|
|
|
if (typeof attrValue !== 'undefined' && (!options.removeAttributeQuotes ||
|
|
~attrValue.indexOf(uidAttr) || !canRemoveAttributeQuotes(attrValue))) {
|
|
if (!options.preventAttributesEscaping) {
|
|
if (typeof options.quoteCharacter === 'undefined') {
|
|
const apos = (attrValue.match(/'/g) || []).length;
|
|
const quot = (attrValue.match(/"/g) || []).length;
|
|
attrQuote = apos < quot ? '\'' : '"';
|
|
} else {
|
|
attrQuote = options.quoteCharacter === '\'' ? '\'' : '"';
|
|
}
|
|
if (attrQuote === '"') {
|
|
attrValue = attrValue.replace(/"/g, '"');
|
|
} else {
|
|
attrValue = attrValue.replace(/'/g, ''');
|
|
}
|
|
}
|
|
emittedAttrValue = attrQuote + attrValue + attrQuote;
|
|
if (!isLast && !options.removeTagWhitespace) {
|
|
emittedAttrValue += ' ';
|
|
}
|
|
} else if (isLast && !hasUnarySlash && !/\/$/.test(attrValue)) {
|
|
// make sure trailing slash is not interpreted as HTML self-closing tag
|
|
emittedAttrValue = attrValue;
|
|
} else {
|
|
emittedAttrValue = attrValue + ' ';
|
|
}
|
|
|
|
if (typeof attrValue === 'undefined' || (options.collapseBooleanAttributes &&
|
|
isBooleanAttribute(attrName.toLowerCase(), attrValue.toLowerCase()))) {
|
|
attrFragment = attrName;
|
|
if (!isLast) {
|
|
attrFragment += ' ';
|
|
}
|
|
} else {
|
|
attrFragment = attrName + attr.customAssign + emittedAttrValue;
|
|
}
|
|
|
|
return attr.customOpen + attrFragment + attr.customClose;
|
|
}
|
|
|
|
function identity(value) {
|
|
return value;
|
|
}
|
|
|
|
function identityAsync(value) {
|
|
return Promise.resolve(value);
|
|
}
|
|
|
|
const processOptions = (inputOptions) => {
|
|
const options = {
|
|
name: function (name) {
|
|
return name.toLowerCase();
|
|
},
|
|
canCollapseWhitespace,
|
|
canTrimWhitespace,
|
|
html5: true,
|
|
ignoreCustomComments: [
|
|
/^!/,
|
|
/^\s*#/
|
|
],
|
|
ignoreCustomFragments: [
|
|
/<%[\s\S]*?%>/,
|
|
/<\?[\s\S]*?\?>/
|
|
],
|
|
includeAutoGeneratedTags: true,
|
|
log: identity,
|
|
minifyCSS: identityAsync,
|
|
minifyJS: identity,
|
|
minifyURLs: identity
|
|
};
|
|
|
|
Object.keys(inputOptions).forEach(function (key) {
|
|
const option = inputOptions[key];
|
|
|
|
if (key === 'caseSensitive') {
|
|
if (option) {
|
|
options.name = identity;
|
|
}
|
|
} else if (key === 'log') {
|
|
if (typeof option === 'function') {
|
|
options.log = option;
|
|
}
|
|
} else if (key === 'minifyCSS' && typeof option !== 'function') {
|
|
if (!option) {
|
|
return;
|
|
}
|
|
|
|
const cleanCssOptions = typeof option === 'object' ? option : {};
|
|
|
|
options.minifyCSS = async function (text, type) {
|
|
text = text.replace(/(url\s*\(\s*)("|'|)(.*?)\2(\s*\))/ig, function (match, prefix, quote, url, suffix) {
|
|
return prefix + quote + options.minifyURLs(url) + quote + suffix;
|
|
});
|
|
|
|
const inputCSS = wrapCSS(text, type);
|
|
|
|
return new Promise((resolve) => {
|
|
new CleanCSS(cleanCssOptions).minify(inputCSS, (_err, output) => {
|
|
if (output.errors.length > 0) {
|
|
output.errors.forEach(options.log);
|
|
resolve(text);
|
|
}
|
|
|
|
const outputCSS = unwrapCSS(output.styles, type);
|
|
resolve(outputCSS);
|
|
});
|
|
});
|
|
};
|
|
} else if (key === 'minifyJS' && typeof option !== 'function') {
|
|
if (!option) {
|
|
return;
|
|
}
|
|
|
|
const terserOptions = typeof option === 'object' ? option : {};
|
|
|
|
terserOptions.parse = {
|
|
...terserOptions.parse,
|
|
bare_returns: false
|
|
};
|
|
|
|
options.minifyJS = async function (text, inline) {
|
|
const start = text.match(/^\s*<!--.*/);
|
|
const code = start ? text.slice(start[0].length).replace(/\n\s*-->\s*$/, '') : text;
|
|
|
|
terserOptions.parse.bare_returns = inline;
|
|
|
|
try {
|
|
const result = await terser(code, terserOptions);
|
|
return result.code.replace(/;$/, '');
|
|
} catch (error) {
|
|
options.log(error);
|
|
return text;
|
|
}
|
|
};
|
|
} else if (key === 'minifyURLs' && typeof option !== 'function') {
|
|
if (!option) {
|
|
return;
|
|
}
|
|
|
|
let relateUrlOptions = option;
|
|
|
|
if (typeof option === 'string') {
|
|
relateUrlOptions = { site: option };
|
|
} else if (typeof option !== 'object') {
|
|
relateUrlOptions = {};
|
|
}
|
|
|
|
options.minifyURLs = function (text) {
|
|
try {
|
|
return RelateURL.relate(text, relateUrlOptions);
|
|
} catch (err) {
|
|
options.log(err);
|
|
return text;
|
|
}
|
|
};
|
|
} else {
|
|
options[key] = option;
|
|
}
|
|
});
|
|
return options;
|
|
};
|
|
|
|
function uniqueId(value) {
|
|
let id;
|
|
do {
|
|
id = Math.random().toString(36).replace(/^0\.[0-9]*/, '');
|
|
} while (~value.indexOf(id));
|
|
return id;
|
|
}
|
|
|
|
const specialContentTags = new Set(['script', 'style']);
|
|
|
|
async function createSortFns(value, options, uidIgnore, uidAttr) {
|
|
const attrChains = options.sortAttributes && Object.create(null);
|
|
const classChain = options.sortClassName && new TokenChain();
|
|
|
|
function attrNames(attrs) {
|
|
return attrs.map(function (attr) {
|
|
return options.name(attr.name);
|
|
});
|
|
}
|
|
|
|
function shouldSkipUID(token, uid) {
|
|
return !uid || token.indexOf(uid) === -1;
|
|
}
|
|
|
|
function shouldSkipUIDs(token) {
|
|
return shouldSkipUID(token, uidIgnore) && shouldSkipUID(token, uidAttr);
|
|
}
|
|
|
|
async function scan(input) {
|
|
let currentTag, currentType;
|
|
const parser = new HTMLParser(input, {
|
|
start: function (tag, attrs) {
|
|
if (attrChains) {
|
|
if (!attrChains[tag]) {
|
|
attrChains[tag] = new TokenChain();
|
|
}
|
|
attrChains[tag].add(attrNames(attrs).filter(shouldSkipUIDs));
|
|
}
|
|
for (let i = 0, len = attrs.length; i < len; i++) {
|
|
const attr = attrs[i];
|
|
if (classChain && attr.value && options.name(attr.name) === 'class') {
|
|
classChain.add(trimWhitespace(attr.value).split(/[ \t\n\f\r]+/).filter(shouldSkipUIDs));
|
|
} else if (options.processScripts && attr.name.toLowerCase() === 'type') {
|
|
currentTag = tag;
|
|
currentType = attr.value;
|
|
}
|
|
}
|
|
},
|
|
end: function () {
|
|
currentTag = '';
|
|
},
|
|
chars: async function (text) {
|
|
if (options.processScripts && specialContentTags.has(currentTag) &&
|
|
options.processScripts.indexOf(currentType) > -1) {
|
|
await scan(text);
|
|
}
|
|
}
|
|
});
|
|
|
|
await parser.parse();
|
|
}
|
|
|
|
const log = options.log;
|
|
options.log = identity;
|
|
options.sortAttributes = false;
|
|
options.sortClassName = false;
|
|
await scan(await minifyHTML(value, options));
|
|
options.log = log;
|
|
if (attrChains) {
|
|
const attrSorters = Object.create(null);
|
|
for (const tag in attrChains) {
|
|
attrSorters[tag] = attrChains[tag].createSorter();
|
|
}
|
|
options.sortAttributes = function (tag, attrs) {
|
|
const sorter = attrSorters[tag];
|
|
if (sorter) {
|
|
const attrMap = Object.create(null);
|
|
const names = attrNames(attrs);
|
|
names.forEach(function (name, index) {
|
|
(attrMap[name] || (attrMap[name] = [])).push(attrs[index]);
|
|
});
|
|
sorter.sort(names).forEach(function (name, index) {
|
|
attrs[index] = attrMap[name].shift();
|
|
});
|
|
}
|
|
};
|
|
}
|
|
if (classChain) {
|
|
const sorter = classChain.createSorter();
|
|
options.sortClassName = function (value) {
|
|
return sorter.sort(value.split(/[ \n\f\r]+/)).join(' ');
|
|
};
|
|
}
|
|
}
|
|
|
|
async function minifyHTML(value, options, partialMarkup) {
|
|
if (options.collapseWhitespace) {
|
|
value = collapseWhitespace(value, options, true, true);
|
|
}
|
|
|
|
const buffer = [];
|
|
let charsPrevTag;
|
|
let currentChars = '';
|
|
let hasChars;
|
|
let currentTag = '';
|
|
let currentAttrs = [];
|
|
const stackNoTrimWhitespace = [];
|
|
const stackNoCollapseWhitespace = [];
|
|
let optionalStartTag = '';
|
|
let optionalEndTag = '';
|
|
const ignoredMarkupChunks = [];
|
|
const ignoredCustomMarkupChunks = [];
|
|
let uidIgnore;
|
|
let uidAttr;
|
|
let uidPattern;
|
|
|
|
// temporarily replace ignored chunks with comments,
|
|
// so that we don't have to worry what's there.
|
|
// for all we care there might be
|
|
// completely-horribly-broken-alien-non-html-emoj-cthulhu-filled content
|
|
value = value.replace(/<!-- htmlmin:ignore -->([\s\S]*?)<!-- htmlmin:ignore -->/g, function (match, group1) {
|
|
if (!uidIgnore) {
|
|
uidIgnore = uniqueId(value);
|
|
const pattern = new RegExp('^' + uidIgnore + '([0-9]+)$');
|
|
if (options.ignoreCustomComments) {
|
|
options.ignoreCustomComments = options.ignoreCustomComments.slice();
|
|
} else {
|
|
options.ignoreCustomComments = [];
|
|
}
|
|
options.ignoreCustomComments.push(pattern);
|
|
}
|
|
const token = '<!--' + uidIgnore + ignoredMarkupChunks.length + '-->';
|
|
ignoredMarkupChunks.push(group1);
|
|
return token;
|
|
});
|
|
|
|
const customFragments = options.ignoreCustomFragments.map(function (re) {
|
|
return re.source;
|
|
});
|
|
if (customFragments.length) {
|
|
const reCustomIgnore = new RegExp('\\s*(?:' + customFragments.join('|') + ')+\\s*', 'g');
|
|
// temporarily replace custom ignored fragments with unique attributes
|
|
value = value.replace(reCustomIgnore, function (match) {
|
|
if (!uidAttr) {
|
|
uidAttr = uniqueId(value);
|
|
uidPattern = new RegExp('(\\s*)' + uidAttr + '([0-9]+)' + uidAttr + '(\\s*)', 'g');
|
|
|
|
if (options.minifyCSS) {
|
|
options.minifyCSS = (function (fn) {
|
|
return function (text, type) {
|
|
text = text.replace(uidPattern, function (match, prefix, index) {
|
|
const chunks = ignoredCustomMarkupChunks[+index];
|
|
return chunks[1] + uidAttr + index + uidAttr + chunks[2];
|
|
});
|
|
|
|
const ids = [];
|
|
new CleanCSS().minify(wrapCSS(text, type)).warnings.forEach(function (warning) {
|
|
const match = uidPattern.exec(warning);
|
|
if (match) {
|
|
const id = uidAttr + match[2] + uidAttr;
|
|
text = text.replace(id, ignoreCSS(id));
|
|
ids.push(id);
|
|
}
|
|
});
|
|
|
|
return fn(text, type).then(chunk => {
|
|
ids.forEach(function (id) {
|
|
chunk = chunk.replace(ignoreCSS(id), id);
|
|
});
|
|
|
|
return chunk;
|
|
});
|
|
};
|
|
})(options.minifyCSS);
|
|
}
|
|
|
|
if (options.minifyJS) {
|
|
options.minifyJS = (function (fn) {
|
|
return function (text, type) {
|
|
return fn(text.replace(uidPattern, function (match, prefix, index) {
|
|
const chunks = ignoredCustomMarkupChunks[+index];
|
|
return chunks[1] + uidAttr + index + uidAttr + chunks[2];
|
|
}), type);
|
|
};
|
|
})(options.minifyJS);
|
|
}
|
|
}
|
|
|
|
const token = uidAttr + ignoredCustomMarkupChunks.length + uidAttr;
|
|
ignoredCustomMarkupChunks.push(/^(\s*)[\s\S]*?(\s*)$/.exec(match));
|
|
return '\t' + token + '\t';
|
|
});
|
|
}
|
|
|
|
if ((options.sortAttributes && typeof options.sortAttributes !== 'function') ||
|
|
(options.sortClassName && typeof options.sortClassName !== 'function')) {
|
|
await createSortFns(value, options, uidIgnore, uidAttr);
|
|
}
|
|
|
|
function _canCollapseWhitespace(tag, attrs) {
|
|
return options.canCollapseWhitespace(tag, attrs, canCollapseWhitespace);
|
|
}
|
|
|
|
function _canTrimWhitespace(tag, attrs) {
|
|
return options.canTrimWhitespace(tag, attrs, canTrimWhitespace);
|
|
}
|
|
|
|
function removeStartTag() {
|
|
let index = buffer.length - 1;
|
|
while (index > 0 && !/^<[^/!]/.test(buffer[index])) {
|
|
index--;
|
|
}
|
|
buffer.length = Math.max(0, index);
|
|
}
|
|
|
|
function removeEndTag() {
|
|
let index = buffer.length - 1;
|
|
while (index > 0 && !/^<\//.test(buffer[index])) {
|
|
index--;
|
|
}
|
|
buffer.length = Math.max(0, index);
|
|
}
|
|
|
|
// look for trailing whitespaces, bypass any inline tags
|
|
function trimTrailingWhitespace(index, nextTag) {
|
|
for (let endTag = null; index >= 0 && _canTrimWhitespace(endTag); index--) {
|
|
const str = buffer[index];
|
|
const match = str.match(/^<\/([\w:-]+)>$/);
|
|
if (match) {
|
|
endTag = match[1];
|
|
} else if (/>$/.test(str) || (buffer[index] = collapseWhitespaceSmart(str, null, nextTag, options))) {
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
|
|
// look for trailing whitespaces from previously processed text
|
|
// which may not be trimmed due to a following comment or an empty
|
|
// element which has now been removed
|
|
function squashTrailingWhitespace(nextTag) {
|
|
let charsIndex = buffer.length - 1;
|
|
if (buffer.length > 1) {
|
|
const item = buffer[buffer.length - 1];
|
|
if (/^(?:<!|$)/.test(item) && item.indexOf(uidIgnore) === -1) {
|
|
charsIndex--;
|
|
}
|
|
}
|
|
trimTrailingWhitespace(charsIndex, nextTag);
|
|
}
|
|
|
|
const parser = new HTMLParser(value, {
|
|
partialMarkup,
|
|
continueOnParseError: options.continueOnParseError,
|
|
customAttrAssign: options.customAttrAssign,
|
|
customAttrSurround: options.customAttrSurround,
|
|
html5: options.html5,
|
|
|
|
start: async function (tag, attrs, unary, unarySlash, autoGenerated) {
|
|
if (tag.toLowerCase() === 'svg') {
|
|
options = Object.create(options);
|
|
options.caseSensitive = true;
|
|
options.keepClosingSlash = true;
|
|
options.name = identity;
|
|
}
|
|
tag = options.name(tag);
|
|
currentTag = tag;
|
|
charsPrevTag = tag;
|
|
if (!inlineTextTags.has(tag)) {
|
|
currentChars = '';
|
|
}
|
|
hasChars = false;
|
|
currentAttrs = attrs;
|
|
|
|
let optional = options.removeOptionalTags;
|
|
if (optional) {
|
|
const htmlTag = htmlTags.has(tag);
|
|
// <html> may be omitted if first thing inside is not comment
|
|
// <head> may be omitted if first thing inside is an element
|
|
// <body> may be omitted if first thing inside is not space, comment, <meta>, <link>, <script>, <style> or <template>
|
|
// <colgroup> may be omitted if first thing inside is <col>
|
|
// <tbody> may be omitted if first thing inside is <tr>
|
|
if (htmlTag && canRemoveParentTag(optionalStartTag, tag)) {
|
|
removeStartTag();
|
|
}
|
|
optionalStartTag = '';
|
|
// end-tag-followed-by-start-tag omission rules
|
|
if (htmlTag && canRemovePrecedingTag(optionalEndTag, tag)) {
|
|
removeEndTag();
|
|
// <colgroup> cannot be omitted if preceding </colgroup> is omitted
|
|
// <tbody> cannot be omitted if preceding </tbody>, </thead> or </tfoot> is omitted
|
|
optional = !isStartTagMandatory(optionalEndTag, tag);
|
|
}
|
|
optionalEndTag = '';
|
|
}
|
|
|
|
// set whitespace flags for nested tags (eg. <code> within a <pre>)
|
|
if (options.collapseWhitespace) {
|
|
if (!stackNoTrimWhitespace.length) {
|
|
squashTrailingWhitespace(tag);
|
|
}
|
|
if (!unary) {
|
|
if (!_canTrimWhitespace(tag, attrs) || stackNoTrimWhitespace.length) {
|
|
stackNoTrimWhitespace.push(tag);
|
|
}
|
|
if (!_canCollapseWhitespace(tag, attrs) || stackNoCollapseWhitespace.length) {
|
|
stackNoCollapseWhitespace.push(tag);
|
|
}
|
|
}
|
|
}
|
|
|
|
const openTag = '<' + tag;
|
|
const hasUnarySlash = unarySlash && options.keepClosingSlash;
|
|
|
|
buffer.push(openTag);
|
|
|
|
if (options.sortAttributes) {
|
|
options.sortAttributes(tag, attrs);
|
|
}
|
|
|
|
const parts = [];
|
|
for (let i = attrs.length, isLast = true; --i >= 0;) {
|
|
const normalized = await normalizeAttr(attrs[i], attrs, tag, options);
|
|
if (normalized) {
|
|
parts.unshift(buildAttr(normalized, hasUnarySlash, options, isLast, uidAttr));
|
|
isLast = false;
|
|
}
|
|
}
|
|
if (parts.length > 0) {
|
|
buffer.push(' ');
|
|
buffer.push.apply(buffer, parts);
|
|
} else if (optional && optionalStartTags.has(tag)) {
|
|
// start tag must never be omitted if it has any attributes
|
|
optionalStartTag = tag;
|
|
}
|
|
|
|
buffer.push(buffer.pop() + (hasUnarySlash ? '/' : '') + '>');
|
|
|
|
if (autoGenerated && !options.includeAutoGeneratedTags) {
|
|
removeStartTag();
|
|
optionalStartTag = '';
|
|
}
|
|
},
|
|
end: function (tag, attrs, autoGenerated) {
|
|
if (tag.toLowerCase() === 'svg') {
|
|
options = Object.getPrototypeOf(options);
|
|
}
|
|
tag = options.name(tag);
|
|
|
|
// check if current tag is in a whitespace stack
|
|
if (options.collapseWhitespace) {
|
|
if (stackNoTrimWhitespace.length) {
|
|
if (tag === stackNoTrimWhitespace[stackNoTrimWhitespace.length - 1]) {
|
|
stackNoTrimWhitespace.pop();
|
|
}
|
|
} else {
|
|
squashTrailingWhitespace('/' + tag);
|
|
}
|
|
if (stackNoCollapseWhitespace.length &&
|
|
tag === stackNoCollapseWhitespace[stackNoCollapseWhitespace.length - 1]) {
|
|
stackNoCollapseWhitespace.pop();
|
|
}
|
|
}
|
|
|
|
let isElementEmpty = false;
|
|
if (tag === currentTag) {
|
|
currentTag = '';
|
|
isElementEmpty = !hasChars;
|
|
}
|
|
|
|
if (options.removeOptionalTags) {
|
|
// <html>, <head> or <body> may be omitted if the element is empty
|
|
if (isElementEmpty && topLevelTags.has(optionalStartTag)) {
|
|
removeStartTag();
|
|
}
|
|
optionalStartTag = '';
|
|
// </html> or </body> may be omitted if not followed by comment
|
|
// </head> may be omitted if not followed by space or comment
|
|
// </p> may be omitted if no more content in non-</a> parent
|
|
// except for </dt> or </thead>, end tags may be omitted if no more content in parent element
|
|
if (htmlTags.has(tag) && optionalEndTag && !trailingTags.has(optionalEndTag) && (optionalEndTag !== 'p' || !pInlineTags.has(tag))) {
|
|
removeEndTag();
|
|
}
|
|
optionalEndTag = optionalEndTags.has(tag) ? tag : '';
|
|
}
|
|
|
|
if (options.removeEmptyElements && isElementEmpty && canRemoveElement(tag, attrs)) {
|
|
// remove last "element" from buffer
|
|
removeStartTag();
|
|
optionalStartTag = '';
|
|
optionalEndTag = '';
|
|
} else {
|
|
if (autoGenerated && !options.includeAutoGeneratedTags) {
|
|
optionalEndTag = '';
|
|
} else {
|
|
buffer.push('</' + tag + '>');
|
|
}
|
|
charsPrevTag = '/' + tag;
|
|
if (!inlineTags.has(tag)) {
|
|
currentChars = '';
|
|
} else if (isElementEmpty) {
|
|
currentChars += '|';
|
|
}
|
|
}
|
|
},
|
|
chars: async function (text, prevTag, nextTag) {
|
|
prevTag = prevTag === '' ? 'comment' : prevTag;
|
|
nextTag = nextTag === '' ? 'comment' : nextTag;
|
|
if (options.decodeEntities && text && !specialContentTags.has(currentTag)) {
|
|
text = decodeHTML(text);
|
|
}
|
|
if (options.collapseWhitespace) {
|
|
if (!stackNoTrimWhitespace.length) {
|
|
if (prevTag === 'comment') {
|
|
const prevComment = buffer[buffer.length - 1];
|
|
if (prevComment.indexOf(uidIgnore) === -1) {
|
|
if (!prevComment) {
|
|
prevTag = charsPrevTag;
|
|
}
|
|
if (buffer.length > 1 && (!prevComment || (!options.conservativeCollapse && / $/.test(currentChars)))) {
|
|
const charsIndex = buffer.length - 2;
|
|
buffer[charsIndex] = buffer[charsIndex].replace(/\s+$/, function (trailingSpaces) {
|
|
text = trailingSpaces + text;
|
|
return '';
|
|
});
|
|
}
|
|
}
|
|
}
|
|
if (prevTag) {
|
|
if (prevTag === '/nobr' || prevTag === 'wbr') {
|
|
if (/^\s/.test(text)) {
|
|
let tagIndex = buffer.length - 1;
|
|
while (tagIndex > 0 && buffer[tagIndex].lastIndexOf('<' + prevTag) !== 0) {
|
|
tagIndex--;
|
|
}
|
|
trimTrailingWhitespace(tagIndex - 1, 'br');
|
|
}
|
|
} else if (inlineTextTags.has(prevTag.charAt(0) === '/' ? prevTag.slice(1) : prevTag)) {
|
|
text = collapseWhitespace(text, options, /(?:^|\s)$/.test(currentChars));
|
|
}
|
|
}
|
|
if (prevTag || nextTag) {
|
|
text = collapseWhitespaceSmart(text, prevTag, nextTag, options);
|
|
} else {
|
|
text = collapseWhitespace(text, options, true, true);
|
|
}
|
|
if (!text && /\s$/.test(currentChars) && prevTag && prevTag.charAt(0) === '/') {
|
|
trimTrailingWhitespace(buffer.length - 1, nextTag);
|
|
}
|
|
}
|
|
if (!stackNoCollapseWhitespace.length && nextTag !== 'html' && !(prevTag && nextTag)) {
|
|
text = collapseWhitespace(text, options, false, false, true);
|
|
}
|
|
}
|
|
if (options.processScripts && specialContentTags.has(currentTag)) {
|
|
text = await processScript(text, options, currentAttrs);
|
|
}
|
|
if (isExecutableScript(currentTag, currentAttrs)) {
|
|
text = await options.minifyJS(text);
|
|
}
|
|
if (isStyleSheet(currentTag, currentAttrs)) {
|
|
text = await options.minifyCSS(text);
|
|
}
|
|
if (options.removeOptionalTags && text) {
|
|
// <html> may be omitted if first thing inside is not comment
|
|
// <body> may be omitted if first thing inside is not space, comment, <meta>, <link>, <script>, <style> or <template>
|
|
if (optionalStartTag === 'html' || (optionalStartTag === 'body' && !/^\s/.test(text))) {
|
|
removeStartTag();
|
|
}
|
|
optionalStartTag = '';
|
|
// </html> or </body> may be omitted if not followed by comment
|
|
// </head>, </colgroup> or </caption> may be omitted if not followed by space or comment
|
|
if (compactTags.has(optionalEndTag) || (looseTags.has(optionalEndTag) && !/^\s/.test(text))) {
|
|
removeEndTag();
|
|
}
|
|
optionalEndTag = '';
|
|
}
|
|
charsPrevTag = /^\s*$/.test(text) ? prevTag : 'comment';
|
|
if (options.decodeEntities && text && !specialContentTags.has(currentTag)) {
|
|
// Escape any `&` symbols that start either:
|
|
// 1) a legacy named character reference (i.e. one that doesn't end with `;`)
|
|
// 2) or any other character reference (i.e. one that does end with `;`)
|
|
// Note that `&` can be escaped as `&`, without the semi-colon.
|
|
// https://mathiasbynens.be/notes/ambiguous-ampersands
|
|
text = text.replace(/&((?:Iacute|aacute|uacute|plusmn|Otilde|otilde|agrave|Agrave|Yacute|yacute|Oslash|oslash|atilde|Atilde|brvbar|ccedil|Ccedil|Ograve|curren|divide|eacute|Eacute|ograve|Oacute|egrave|Egrave|Ugrave|frac12|frac14|frac34|ugrave|oacute|iacute|Ntilde|ntilde|Uacute|middot|igrave|Igrave|iquest|Aacute|cedil|laquo|micro|iexcl|Icirc|icirc|acirc|Ucirc|Ecirc|ocirc|Ocirc|ecirc|ucirc|Aring|aring|AElig|aelig|acute|pound|raquo|Acirc|times|THORN|szlig|thorn|COPY|auml|ordf|ordm|Uuml|macr|uuml|Auml|ouml|Ouml|para|nbsp|euml|quot|QUOT|Euml|yuml|cent|sect|copy|sup1|sup2|sup3|iuml|Iuml|ETH|shy|reg|not|yen|amp|AMP|REG|uml|eth|deg|gt|GT|LT|lt)(?!;)|(?:#?[0-9a-zA-Z]+;))/g, '&$1').replace(/</g, '<');
|
|
}
|
|
if (uidPattern && options.collapseWhitespace && stackNoTrimWhitespace.length) {
|
|
text = text.replace(uidPattern, function (match, prefix, index) {
|
|
return ignoredCustomMarkupChunks[+index][0];
|
|
});
|
|
}
|
|
currentChars += text;
|
|
if (text) {
|
|
hasChars = true;
|
|
}
|
|
buffer.push(text);
|
|
},
|
|
comment: async function (text, nonStandard) {
|
|
const prefix = nonStandard ? '<!' : '<!--';
|
|
const suffix = nonStandard ? '>' : '-->';
|
|
if (isConditionalComment(text)) {
|
|
text = prefix + await cleanConditionalComment(text, options) + suffix;
|
|
} else if (options.removeComments) {
|
|
if (isIgnoredComment(text, options)) {
|
|
text = '<!--' + text + '-->';
|
|
} else {
|
|
text = '';
|
|
}
|
|
} else {
|
|
text = prefix + text + suffix;
|
|
}
|
|
if (options.removeOptionalTags && text) {
|
|
// preceding comments suppress tag omissions
|
|
optionalStartTag = '';
|
|
optionalEndTag = '';
|
|
}
|
|
buffer.push(text);
|
|
},
|
|
doctype: function (doctype) {
|
|
buffer.push(options.useShortDoctype
|
|
? '<!doctype' +
|
|
(options.removeTagWhitespace ? '' : ' ') + 'html>'
|
|
: collapseWhitespaceAll(doctype));
|
|
}
|
|
});
|
|
|
|
await parser.parse();
|
|
|
|
if (options.removeOptionalTags) {
|
|
// <html> may be omitted if first thing inside is not comment
|
|
// <head> or <body> may be omitted if empty
|
|
if (topLevelTags.has(optionalStartTag)) {
|
|
removeStartTag();
|
|
}
|
|
// except for </dt> or </thead>, end tags may be omitted if no more content in parent element
|
|
if (optionalEndTag && !trailingTags.has(optionalEndTag)) {
|
|
removeEndTag();
|
|
}
|
|
}
|
|
if (options.collapseWhitespace) {
|
|
squashTrailingWhitespace('br');
|
|
}
|
|
|
|
return joinResultSegments(buffer, options, uidPattern
|
|
? function (str) {
|
|
return str.replace(uidPattern, function (match, prefix, index, suffix) {
|
|
let chunk = ignoredCustomMarkupChunks[+index][0];
|
|
if (options.collapseWhitespace) {
|
|
if (prefix !== '\t') {
|
|
chunk = prefix + chunk;
|
|
}
|
|
if (suffix !== '\t') {
|
|
chunk += suffix;
|
|
}
|
|
return collapseWhitespace(chunk, {
|
|
preserveLineBreaks: options.preserveLineBreaks,
|
|
conservativeCollapse: !options.trimCustomFragments
|
|
}, /^[ \n\r\t\f]/.test(chunk), /[ \n\r\t\f]$/.test(chunk));
|
|
}
|
|
return chunk;
|
|
});
|
|
}
|
|
: identity, uidIgnore
|
|
? function (str) {
|
|
return str.replace(new RegExp('<!--' + uidIgnore + '([0-9]+)-->', 'g'), function (match, index) {
|
|
return ignoredMarkupChunks[+index];
|
|
});
|
|
}
|
|
: identity);
|
|
}
|
|
|
|
function joinResultSegments(results, options, restoreCustom, restoreIgnore) {
|
|
let str;
|
|
const maxLineLength = options.maxLineLength;
|
|
const noNewlinesBeforeTagClose = options.noNewlinesBeforeTagClose;
|
|
|
|
if (maxLineLength) {
|
|
let line = ''; const lines = [];
|
|
while (results.length) {
|
|
const len = line.length;
|
|
const end = results[0].indexOf('\n');
|
|
const isClosingTag = Boolean(results[0].match(endTag));
|
|
const shouldKeepSameLine = noNewlinesBeforeTagClose && isClosingTag;
|
|
|
|
if (end < 0) {
|
|
line += restoreIgnore(restoreCustom(results.shift()));
|
|
} else {
|
|
line += restoreIgnore(restoreCustom(results[0].slice(0, end)));
|
|
results[0] = results[0].slice(end + 1);
|
|
}
|
|
if (len > 0 && line.length > maxLineLength && !shouldKeepSameLine) {
|
|
lines.push(line.slice(0, len));
|
|
line = line.slice(len);
|
|
} else if (end >= 0) {
|
|
lines.push(line);
|
|
line = '';
|
|
}
|
|
}
|
|
if (line) {
|
|
lines.push(line);
|
|
}
|
|
str = lines.join('\n');
|
|
} else {
|
|
str = restoreIgnore(restoreCustom(results.join('')));
|
|
}
|
|
return options.collapseWhitespace ? collapseWhitespace(str, options, true, true) : str;
|
|
}
|
|
|
|
export const minify = async function (value, options) {
|
|
const start = Date.now();
|
|
options = processOptions(options || {});
|
|
const result = await minifyHTML(value, options);
|
|
options.log('minified in: ' + (Date.now() - start) + 'ms');
|
|
return result;
|
|
};
|
|
|
|
export default { minify };
|