UNPKG

17.9 kBJavaScriptView Raw
1/**
2 * @license
3 * Copyright Google LLC All Rights Reserved.
4 *
5 * Use of this source code is governed by an MIT-style license that can be
6 * found in the LICENSE file at https://angular.io/license
7 */
8import { trustedHTMLFromString } from '../util/security/trusted_types';
9/**
10 * This helper is used to get hold of an inert tree of DOM elements containing dirty HTML
11 * that needs sanitizing.
12 * Depending upon browser support we use one of two strategies for doing this.
13 * Default: DOMParser strategy
14 * Fallback: InertDocument strategy
15 */
16export function getInertBodyHelper(defaultDoc) {
17 const inertDocumentHelper = new InertDocumentHelper(defaultDoc);
18 return isDOMParserAvailable() ? new DOMParserHelper(inertDocumentHelper) : inertDocumentHelper;
19}
20/**
21 * Uses DOMParser to create and fill an inert body element.
22 * This is the default strategy used in browsers that support it.
23 */
24class DOMParserHelper {
25 constructor(inertDocumentHelper) {
26 this.inertDocumentHelper = inertDocumentHelper;
27 }
28 getInertBodyElement(html) {
29 // We add these extra elements to ensure that the rest of the content is parsed as expected
30 // e.g. leading whitespace is maintained and tags like `<meta>` do not get hoisted to the
31 // `<head>` tag. Note that the `<body>` tag is closed implicitly to prevent unclosed tags
32 // in `html` from consuming the otherwise explicit `</body>` tag.
33 html = '<body><remove></remove>' + html;
34 try {
35 const body = new window.DOMParser()
36 .parseFromString(trustedHTMLFromString(html), 'text/html')
37 .body;
38 if (body === null) {
39 // In some browsers (e.g. Mozilla/5.0 iPad AppleWebKit Mobile) the `body` property only
40 // becomes available in the following tick of the JS engine. In that case we fall back to
41 // the `inertDocumentHelper` instead.
42 return this.inertDocumentHelper.getInertBodyElement(html);
43 }
44 body.removeChild(body.firstChild);
45 return body;
46 }
47 catch {
48 return null;
49 }
50 }
51}
52/**
53 * Use an HTML5 `template` element, if supported, or an inert body element created via
54 * `createHtmlDocument` to create and fill an inert DOM element.
55 * This is the fallback strategy if the browser does not support DOMParser.
56 */
57class InertDocumentHelper {
58 constructor(defaultDoc) {
59 this.defaultDoc = defaultDoc;
60 this.inertDocument = this.defaultDoc.implementation.createHTMLDocument('sanitization-inert');
61 if (this.inertDocument.body == null) {
62 // usually there should be only one body element in the document, but IE doesn't have any, so
63 // we need to create one.
64 const inertHtml = this.inertDocument.createElement('html');
65 this.inertDocument.appendChild(inertHtml);
66 const inertBodyElement = this.inertDocument.createElement('body');
67 inertHtml.appendChild(inertBodyElement);
68 }
69 }
70 getInertBodyElement(html) {
71 // Prefer using <template> element if supported.
72 const templateEl = this.inertDocument.createElement('template');
73 if ('content' in templateEl) {
74 templateEl.innerHTML = trustedHTMLFromString(html);
75 return templateEl;
76 }
77 // Note that previously we used to do something like `this.inertDocument.body.innerHTML = html`
78 // and we returned the inert `body` node. This was changed, because IE seems to treat setting
79 // `innerHTML` on an inserted element differently, compared to one that hasn't been inserted
80 // yet. In particular, IE appears to split some of the text into multiple text nodes rather
81 // than keeping them in a single one which ends up messing with Ivy's i18n parsing further
82 // down the line. This has been worked around by creating a new inert `body` and using it as
83 // the root node in which we insert the HTML.
84 const inertBody = this.inertDocument.createElement('body');
85 inertBody.innerHTML = trustedHTMLFromString(html);
86 // Support: IE 11 only
87 // strip custom-namespaced attributes on IE<=11
88 if (this.defaultDoc.documentMode) {
89 this.stripCustomNsAttrs(inertBody);
90 }
91 return inertBody;
92 }
93 /**
94 * When IE11 comes across an unknown namespaced attribute e.g. 'xlink:foo' it adds 'xmlns:ns1'
95 * attribute to declare ns1 namespace and prefixes the attribute with 'ns1' (e.g.
96 * 'ns1:xlink:foo').
97 *
98 * This is undesirable since we don't want to allow any of these custom attributes. This method
99 * strips them all.
100 */
101 stripCustomNsAttrs(el) {
102 const elAttrs = el.attributes;
103 // loop backwards so that we can support removals.
104 for (let i = elAttrs.length - 1; 0 < i; i--) {
105 const attrib = elAttrs.item(i);
106 const attrName = attrib.name;
107 if (attrName === 'xmlns:ns1' || attrName.indexOf('ns1:') === 0) {
108 el.removeAttribute(attrName);
109 }
110 }
111 let childNode = el.firstChild;
112 while (childNode) {
113 if (childNode.nodeType === Node.ELEMENT_NODE)
114 this.stripCustomNsAttrs(childNode);
115 childNode = childNode.nextSibling;
116 }
117 }
118}
119/**
120 * We need to determine whether the DOMParser exists in the global context and
121 * supports parsing HTML; HTML parsing support is not as wide as other formats, see
122 * https://developer.mozilla.org/en-US/docs/Web/API/DOMParser#Browser_compatibility.
123 *
124 * @suppress {uselessCode}
125 */
126export function isDOMParserAvailable() {
127 try {
128 return !!new window.DOMParser().parseFromString(trustedHTMLFromString(''), 'text/html');
129 }
130 catch {
131 return false;
132 }
133}
134//# sourceMappingURL=data:application/json;base64,{"version":3,"file":"inert_body.js","sourceRoot":"","sources":["../../../../../../../packages/core/src/sanitization/inert_body.ts"],"names":[],"mappings":"AAAA;;;;;;GAMG;AAEH,OAAO,EAAC,qBAAqB,EAAC,MAAM,gCAAgC,CAAC;AAErE;;;;;;GAMG;AACH,MAAM,UAAU,kBAAkB,CAAC,UAAoB;IACrD,MAAM,mBAAmB,GAAG,IAAI,mBAAmB,CAAC,UAAU,CAAC,CAAC;IAChE,OAAO,oBAAoB,EAAE,CAAC,CAAC,CAAC,IAAI,eAAe,CAAC,mBAAmB,CAAC,CAAC,CAAC,CAAC,mBAAmB,CAAC;AACjG,CAAC;AASD;;;GAGG;AACH,MAAM,eAAe;IACnB,YAAoB,mBAAoC;QAApC,wBAAmB,GAAnB,mBAAmB,CAAiB;IAAG,CAAC;IAE5D,mBAAmB,CAAC,IAAY;QAC9B,2FAA2F;QAC3F,yFAAyF;QACzF,yFAAyF;QACzF,iEAAiE;QACjE,IAAI,GAAG,yBAAyB,GAAG,IAAI,CAAC;QACxC,IAAI;YACF,MAAM,IAAI,GAAG,IAAI,MAAM,CAAC,SAAS,EAAE;iBACjB,eAAe,CAAC,qBAAqB,CAAC,IAAI,CAAW,EAAE,WAAW,CAAC;iBACnE,IAAuB,CAAC;YAC1C,IAAI,IAAI,KAAK,IAAI,EAAE;gBACjB,uFAAuF;gBACvF,yFAAyF;gBACzF,qCAAqC;gBACrC,OAAO,IAAI,CAAC,mBAAmB,CAAC,mBAAmB,CAAC,IAAI,CAAC,CAAC;aAC3D;YACD,IAAI,CAAC,WAAW,CAAC,IAAI,CAAC,UAAW,CAAC,CAAC;YACnC,OAAO,IAAI,CAAC;SACb;QAAC,MAAM;YACN,OAAO,IAAI,CAAC;SACb;IACH,CAAC;CACF;AAED;;;;GAIG;AACH,MAAM,mBAAmB;IAGvB,YAAoB,UAAoB;QAApB,eAAU,GAAV,UAAU,CAAU;QACtC,IAAI,CAAC,aAAa,GAAG,IAAI,CAAC,UAAU,CAAC,cAAc,CAAC,kBAAkB,CAAC,oBAAoB,CAAC,CAAC;QAE7F,IAAI,IAAI,CAAC,aAAa,CAAC,IAAI,IAAI,IAAI,EAAE;YACnC,6FAA6F;YAC7F,yBAAyB;YACzB,MAAM,SAAS,GAAG,IAAI,CAAC,aAAa,CAAC,aAAa,CAAC,MAAM,CAAC,CAAC;YAC3D,IAAI,CAAC,aAAa,CAAC,WAAW,CAAC,SAAS,CAAC,CAAC;YAC1C,MAAM,gBAAgB,GAAG,IAAI,CAAC,aAAa,CAAC,aAAa,CAAC,MAAM,CAAC,CAAC;YAClE,SAAS,CAAC,WAAW,CAAC,gBAAgB,CAAC,CAAC;SACzC;IACH,CAAC;IAED,mBAAmB,CAAC,IAAY;QAC9B,gDAAgD;QAChD,MAAM,UAAU,GAAG,IAAI,CAAC,aAAa,CAAC,aAAa,CAAC,UAAU,CAAC,CAAC;QAChE,IAAI,SAAS,IAAI,UAAU,EAAE;YAC3B,UAAU,CAAC,SAAS,GAAG,qBAAqB,CAAC,IAAI,CAAW,CAAC;YAC7D,OAAO,UAAU,CAAC;SACnB;QAED,+FAA+F;QAC/F,6FAA6F;QAC7F,4FAA4F;QAC5F,2FAA2F;QAC3F,0FAA0F;QAC1F,4FAA4F;QAC5F,6CAA6C;QAC7C,MAAM,SAAS,GAAG,IAAI,CAAC,aAAa,CAAC,aAAa,CAAC,MAAM,CAAC,CAAC;QAC3D,SAAS,CAAC,SAAS,GAAG,qBAAqB,CAAC,IAAI,CAAW,CAAC;QAE5D,sBAAsB;QACtB,+CAA+C;QAC/C,IAAK,IAAI,CAAC,UAAkB,CAAC,YAAY,EAAE;YACzC,IAAI,CAAC,kBAAkB,CAAC,SAAS,CAAC,CAAC;SACpC;QAED,OAAO,SAAS,CAAC;IACnB,CAAC;IAED;;;;;;;OAOG;IACK,kBAAkB,CAAC,EAAW;QACpC,MAAM,OAAO,GAAG,EAAE,CAAC,UAAU,CAAC;QAC9B,kDAAkD;QAClD,KAAK,IAAI,CAAC,GAAG,OAAO,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC,GAAG,CAAC,EAAE,CAAC,EAAE,EAAE;YAC3C,MAAM,MAAM,GAAG,OAAO,CAAC,IAAI,CAAC,CAAC,CAAC,CAAC;YAC/B,MAAM,QAAQ,GAAG,MAAO,CAAC,IAAI,CAAC;YAC9B,IAAI,QAAQ,KAAK,WAAW,IAAI,QAAQ,CAAC,OAAO,CAAC,MAAM,CAAC,KAAK,CAAC,EAAE;gBAC9D,EAAE,CAAC,eAAe,CAAC,QAAQ,CAAC,CAAC;aAC9B;SACF;QACD,IAAI,SAAS,GAAG,EAAE,CAAC,UAAyB,CAAC;QAC7C,OAAO,SAAS,EAAE;YAChB,IAAI,SAAS,CAAC,QAAQ,KAAK,IAAI,CAAC,YAAY;gBAAE,IAAI,CAAC,kBAAkB,CAAC,SAAoB,CAAC,CAAC;YAC5F,SAAS,GAAG,SAAS,CAAC,WAAW,CAAC;SACnC;IACH,CAAC;CACF;AAED;;;;;;GAMG;AACH,MAAM,UAAU,oBAAoB;IAClC,IAAI;QACF,OAAO,CAAC,CAAC,IAAI,MAAM,CAAC,SAAS,EAAE,CAAC,eAAe,CAC3C,qBAAqB,CAAC,EAAE,CAAW,EAAE,WAAW,CAAC,CAAC;KACvD;IAAC,MAAM;QACN,OAAO,KAAK,CAAC;KACd;AACH,CAAC","sourcesContent":["/**\n * @license\n * Copyright Google LLC All Rights Reserved.\n *\n * Use of this source code is governed by an MIT-style license that can be\n * found in the LICENSE file at https://angular.io/license\n */\n\nimport {trustedHTMLFromString} from '../util/security/trusted_types';\n\n/**\n * This helper is used to get hold of an inert tree of DOM elements containing dirty HTML\n * that needs sanitizing.\n * Depending upon browser support we use one of two strategies for doing this.\n * Default: DOMParser strategy\n * Fallback: InertDocument strategy\n */\nexport function getInertBodyHelper(defaultDoc: Document): InertBodyHelper {\n  const inertDocumentHelper = new InertDocumentHelper(defaultDoc);\n  return isDOMParserAvailable() ? new DOMParserHelper(inertDocumentHelper) : inertDocumentHelper;\n}\n\nexport interface InertBodyHelper {\n  /**\n   * Get an inert DOM element containing DOM created from the dirty HTML string provided.\n   */\n  getInertBodyElement: (html: string) => HTMLElement | null;\n}\n\n/**\n * Uses DOMParser to create and fill an inert body element.\n * This is the default strategy used in browsers that support it.\n */\nclass DOMParserHelper implements InertBodyHelper {\n  constructor(private inertDocumentHelper: InertBodyHelper) {}\n\n  getInertBodyElement(html: string): HTMLElement|null {\n    // We add these extra elements to ensure that the rest of the content is parsed as expected\n    // e.g. leading whitespace is maintained and tags like `<meta>` do not get hoisted to the\n    // `<head>` tag. Note that the `<body>` tag is closed implicitly to prevent unclosed tags\n    // in `html` from consuming the otherwise explicit `</body>` tag.\n    html = '<body><remove></remove>' + html;\n    try {\n      const body = new window.DOMParser()\n                       .parseFromString(trustedHTMLFromString(html) as string, 'text/html')\n                       .body as HTMLBodyElement;\n      if (body === null) {\n        // In some browsers (e.g. Mozilla/5.0 iPad AppleWebKit Mobile) the `body` property only\n        // becomes available in the following tick of the JS engine. In that case we fall back to\n        // the `inertDocumentHelper` instead.\n        return this.inertDocumentHelper.getInertBodyElement(html);\n      }\n      body.removeChild(body.firstChild!);\n      return body;\n    } catch {\n      return null;\n    }\n  }\n}\n\n/**\n * Use an HTML5 `template` element, if supported, or an inert body element created via\n * `createHtmlDocument` to create and fill an inert DOM element.\n * This is the fallback strategy if the browser does not support DOMParser.\n */\nclass InertDocumentHelper implements InertBodyHelper {\n  private inertDocument: Document;\n\n  constructor(private defaultDoc: Document) {\n    this.inertDocument = this.defaultDoc.implementation.createHTMLDocument('sanitization-inert');\n\n    if (this.inertDocument.body == null) {\n      // usually there should be only one body element in the document, but IE doesn't have any, so\n      // we need to create one.\n      const inertHtml = this.inertDocument.createElement('html');\n      this.inertDocument.appendChild(inertHtml);\n      const inertBodyElement = this.inertDocument.createElement('body');\n      inertHtml.appendChild(inertBodyElement);\n    }\n  }\n\n  getInertBodyElement(html: string): HTMLElement|null {\n    // Prefer using <template> element if supported.\n    const templateEl = this.inertDocument.createElement('template');\n    if ('content' in templateEl) {\n      templateEl.innerHTML = trustedHTMLFromString(html) as string;\n      return templateEl;\n    }\n\n    // Note that previously we used to do something like `this.inertDocument.body.innerHTML = html`\n    // and we returned the inert `body` node. This was changed, because IE seems to treat setting\n    // `innerHTML` on an inserted element differently, compared to one that hasn't been inserted\n    // yet. In particular, IE appears to split some of the text into multiple text nodes rather\n    // than keeping them in a single one which ends up messing with Ivy's i18n parsing further\n    // down the line. This has been worked around by creating a new inert `body` and using it as\n    // the root node in which we insert the HTML.\n    const inertBody = this.inertDocument.createElement('body');\n    inertBody.innerHTML = trustedHTMLFromString(html) as string;\n\n    // Support: IE 11 only\n    // strip custom-namespaced attributes on IE<=11\n    if ((this.defaultDoc as any).documentMode) {\n      this.stripCustomNsAttrs(inertBody);\n    }\n\n    return inertBody;\n  }\n\n  /**\n   * When IE11 comes across an unknown namespaced attribute e.g. 'xlink:foo' it adds 'xmlns:ns1'\n   * attribute to declare ns1 namespace and prefixes the attribute with 'ns1' (e.g.\n   * 'ns1:xlink:foo').\n   *\n   * This is undesirable since we don't want to allow any of these custom attributes. This method\n   * strips them all.\n   */\n  private stripCustomNsAttrs(el: Element) {\n    const elAttrs = el.attributes;\n    // loop backwards so that we can support removals.\n    for (let i = elAttrs.length - 1; 0 < i; i--) {\n      const attrib = elAttrs.item(i);\n      const attrName = attrib!.name;\n      if (attrName === 'xmlns:ns1' || attrName.indexOf('ns1:') === 0) {\n        el.removeAttribute(attrName);\n      }\n    }\n    let childNode = el.firstChild as Node | null;\n    while (childNode) {\n      if (childNode.nodeType === Node.ELEMENT_NODE) this.stripCustomNsAttrs(childNode as Element);\n      childNode = childNode.nextSibling;\n    }\n  }\n}\n\n/**\n * We need to determine whether the DOMParser exists in the global context and\n * supports parsing HTML; HTML parsing support is not as wide as other formats, see\n * https://developer.mozilla.org/en-US/docs/Web/API/DOMParser#Browser_compatibility.\n *\n * @suppress {uselessCode}\n */\nexport function isDOMParserAvailable() {\n  try {\n    return !!new window.DOMParser().parseFromString(\n        trustedHTMLFromString('') as string, 'text/html');\n  } catch {\n    return false;\n  }\n}\n"]}
\No newline at end of file