Source: lib/util/xml_utils.js

  1. /*! @license
  2. * Shaka Player
  3. * Copyright 2016 Google LLC
  4. * SPDX-License-Identifier: Apache-2.0
  5. */
  6. goog.provide('shaka.util.XmlUtils');
  7. goog.require('goog.asserts');
  8. goog.require('shaka.log');
  9. goog.require('shaka.util.Lazy');
  10. goog.require('shaka.util.StringUtils');
  11. /**
  12. * @summary A set of XML utility functions.
  13. */
  14. shaka.util.XmlUtils = class {
  15. /**
  16. * Parse a string and return the resulting root element if it was valid XML.
  17. *
  18. * @param {string} xmlString
  19. * @param {string} expectedRootElemName
  20. * @return {Element}
  21. */
  22. static parseXmlString(xmlString, expectedRootElemName) {
  23. const parser = new DOMParser();
  24. const unsafeXmlString =
  25. shaka.util.XmlUtils.trustedHTMLFromString_.value()(xmlString);
  26. let unsafeXml = null;
  27. try {
  28. unsafeXml = parser.parseFromString(unsafeXmlString, 'text/xml');
  29. } catch (exception) {
  30. shaka.log.error('XML parsing exception:', exception);
  31. return null;
  32. }
  33. // According to MDN, parseFromString never returns null.
  34. goog.asserts.assert(unsafeXml, 'Parsed XML document cannot be null!');
  35. // Check for empty documents.
  36. const rootElem = unsafeXml.documentElement;
  37. if (!rootElem) {
  38. shaka.log.error('XML document was empty!');
  39. return null;
  40. }
  41. // Check for parser errors.
  42. const parserErrorElements = rootElem.getElementsByTagName('parsererror');
  43. if (parserErrorElements.length) {
  44. shaka.log.error('XML parser error found:', parserErrorElements[0]);
  45. return null;
  46. }
  47. // The top-level element in the loaded XML should have the name we expect.
  48. if (rootElem.tagName != expectedRootElemName) {
  49. shaka.log.error(
  50. `XML tag name does not match expected "${expectedRootElemName}":`,
  51. rootElem.tagName);
  52. return null;
  53. }
  54. // Cobalt browser doesn't support document.createNodeIterator.
  55. if (!('createNodeIterator' in document)) {
  56. return rootElem;
  57. }
  58. // SECURITY: Verify that the document does not contain elements from the
  59. // HTML or SVG namespaces, which could trigger script execution and XSS.
  60. const iterator = document.createNodeIterator(
  61. unsafeXml,
  62. NodeFilter.SHOW_ALL,
  63. );
  64. let currentNode;
  65. while (currentNode = iterator.nextNode()) {
  66. if (currentNode instanceof HTMLElement ||
  67. currentNode instanceof SVGElement) {
  68. shaka.log.error('XML document embeds unsafe content!');
  69. return null;
  70. }
  71. }
  72. return rootElem;
  73. }
  74. /**
  75. * Parse some data (auto-detecting the encoding) and return the resulting
  76. * root element if it was valid XML.
  77. * @param {BufferSource} data
  78. * @param {string} expectedRootElemName
  79. * @return {Element}
  80. */
  81. static parseXml(data, expectedRootElemName) {
  82. try {
  83. const string = shaka.util.StringUtils.fromBytesAutoDetect(data);
  84. return shaka.util.XmlUtils.parseXmlString(string, expectedRootElemName);
  85. } catch (exception) {
  86. shaka.log.error('parseXmlString threw!', exception);
  87. return null;
  88. }
  89. }
  90. /**
  91. * Converts a Element to BufferSource.
  92. * @param {!Element} elem
  93. * @return {!ArrayBuffer}
  94. */
  95. static toArrayBuffer(elem) {
  96. return shaka.util.StringUtils.toUTF8(elem.outerHTML);
  97. }
  98. };
  99. /**
  100. * Promote a string to TrustedHTML. This function is security-sensitive and
  101. * should only be used with security approval where the string is guaranteed not
  102. * to cause an XSS vulnerability.
  103. *
  104. * @private {!shaka.util.Lazy.<function(!string): (!TrustedHTML|!string)>}
  105. */
  106. shaka.util.XmlUtils.trustedHTMLFromString_ = new shaka.util.Lazy(() => {
  107. if (typeof trustedTypes !== 'undefined') {
  108. // Create a Trusted Types policy for promoting the string to TrustedHTML.
  109. // The Lazy wrapper ensures this policy is only created once.
  110. const policy = trustedTypes.createPolicy('shaka-player#xml', {
  111. createHTML: (s) => s,
  112. });
  113. return (s) => policy.createHTML(s);
  114. }
  115. // Fall back to strings in environments that don't support Trusted Types.
  116. return (s) => s;
  117. });