content.js 9.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235
  1. /*
  2. * Copyright 2018 Gildas Lormeau
  3. * contact : gildas.lormeau <at> gmail.com
  4. *
  5. * This file is part of SingleFile.
  6. *
  7. * SingleFile is free software: you can redistribute it and/or modify
  8. * it under the terms of the GNU Lesser General Public License as published by
  9. * the Free Software Foundation, either version 3 of the License, or
  10. * (at your option) any later version.
  11. *
  12. * SingleFile is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  15. * GNU Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public License
  18. * along with SingleFile. If not, see <http://www.gnu.org/licenses/>.
  19. */
  20. /* global browser, SingleFile, singlefile, FrameTree, document, Blob, MouseEvent, getSelection, getComputedStyle, prompt, addEventListener, Node, HTMLElement */
  21. this.singlefile.top = this.singlefile.top || (() => {
  22. let processing = false;
  23. browser.runtime.onMessage.addListener(async message => {
  24. savePage(message);
  25. return {};
  26. });
  27. addEventListener("message", event => {
  28. if (typeof event.data === "string" && event.data.startsWith("__SingleFile__::")) {
  29. const message = JSON.parse(event.data.substring("__SingleFile__".length + 2));
  30. savePage(message);
  31. }
  32. });
  33. return true;
  /**
   * Processes the current page and downloads the result when `message` is a
   * start request that targets this document.
   *
   * The request is ignored when `message.processStart` is falsy, when a save is
   * already running, or when `message.options.frameId` is set. Failures are
   * logged and reported to the extension with a `processError` message.
   *
   * @param {Object} message - request object carrying `processStart` and `options`.
   * @returns {Promise<void>}
   */
  async function savePage(message) {
    if (!message.processStart || processing || message.options.frameId) {
      return;
    }
    processing = true;
    try {
      const page = await processMessage(message);
      try {
        await downloadPage(page, message.options);
      } finally {
        // Release the blob URL even when the download fails, otherwise it leaks.
        revokeDownloadURL(page);
      }
    } catch (error) {
      console.error(error); // eslint-disable-line no-console
      browser.runtime.sendMessage({ processError: true, error });
    } finally {
      // Always allow a new save, whatever happened above.
      processing = false;
    }
  }
  /**
   * Runs the SingleFile processor on the current document and returns the
   * resulting page data, completed with a file name and a blob URL.
   *
   * Marker attributes (selected content, removed content, preserved white
   * space) are set on the live DOM before the document is serialized and are
   * taken off again afterwards.
   *
   * @param {Object} message - request object; `message.options` is completed by getOptions().
   * @returns {Promise<Object>} page data from the processor, with `filename` and `url` added.
   */
  async function processMessage(message) {
    const options = await getOptions(message.options);
    const ProcessorClass = SingleFile.getClass();
    const processor = new ProcessorClass(options);

    // Adjust and mark the live document before it is serialized.
    fixInlineScripts();
    fixHeadNoScripts();
    if (options.selected) {
      selectSelectedContent(processor.SELECTED_CONTENT_ATTRIBUTE_NAME, processor.SELECTED_CONTENT_ROOT_ATTRIBUTE_NAME);
    }
    if (!options.removeFrames) {
      hideElementFrames();
    }
    if (options.removeHiddenElements) {
      selectRemovedElements(processor.REMOVED_CONTENT_ATTRIBUTE_NAME);
    }
    if (options.compressHTML) {
      selectPreserveElements(processor.PRESERVED_SPACE_ELEMENT_ATTRIBUTE_NAME);
    }

    // Caller-supplied URL and content take precedence over the live document.
    options.url = options.url || document.location.href;
    options.content = options.content || getDoctype(document) + document.documentElement.outerHTML;
    await processor.initialize();

    // The markers are no longer needed on the live DOM once the processor is initialized.
    if (options.removeHiddenElements) {
      unselectRemovedElements(processor.REMOVED_CONTENT_ATTRIBUTE_NAME);
    }
    if (options.compressHTML) {
      unselectPreserveElements(processor.PRESERVED_SPACE_ELEMENT_ATTRIBUTE_NAME);
    }
    if (options.shadowEnabled) {
      singlefile.ui.init();
    }

    await processor.preparePageData();
    const page = processor.getPageData();
    if (options.selected) {
      unselectSelectedContent(processor.SELECTED_CONTENT_ATTRIBUTE_NAME, processor.SELECTED_CONTENT_ROOT_ATTRIBUTE_NAME);
    }

    // Optional " (YYYY-MM-DD <local time>)" suffix appended to the page title.
    const date = new Date();
    let saveDateSuffix = "";
    if (options.appendSaveDate) {
      const isoDay = date.toISOString().split("T")[0];
      saveDateSuffix = " (" + isoDay + " " + date.toLocaleTimeString() + ")";
    }
    page.filename = page.title + saveDateSuffix + ".html";

    const pageBlob = new Blob([page.content], { type: "text/html" });
    page.url = URL.createObjectURL(pageBlob);
    if (options.shadowEnabled) {
      singlefile.ui.end();
    }
    return page;
  }
  /**
   * Releases the object URL stored in `page.url`.
   *
   * @param {Object} page - page data whose `url` was created with URL.createObjectURL().
   */
  function revokeDownloadURL(page) {
    const { url: downloadURL } = page;
    URL.revokeObjectURL(downloadURL);
  }
  /**
   * Rewrites every "</script>" sequence (any letter case) found in the text of
   * the document's script elements as "<\/script>".
   */
  function fixInlineScripts() {
    const closingTagPattern = /<\/script>/gi;
    for (const scriptElement of document.querySelectorAll("script")) {
      const escapedText = scriptElement.textContent.replace(closingTagPattern, "<\\/script>");
      scriptElement.textContent = escapedText;
    }
  }
  /**
   * Sets `hidden` on every descendant of <head> that is not a meta, title,
   * link, style or script element.
   */
  function hideElementFrames() {
    const unexpectedHeadContent = "*:not(meta):not(title):not(link):not(style):not(script)";
    for (const headElement of document.head.querySelectorAll(unexpectedHeadContent)) {
      headElement.hidden = true;
    }
  }
  /**
   * Moves each <noscript> element found in <head> to the very beginning of
   * <body>. Each one is inserted before the current first child, so the moved
   * elements end up in reverse order.
   */
  function fixHeadNoScripts() {
    for (const noscriptElement of document.head.querySelectorAll("noscript")) {
      const bodyElement = document.body;
      bodyElement.insertBefore(noscriptElement, bodyElement.firstChild);
    }
  }
  /**
   * Flags every element whose computed `white-space` value starts with "pre"
   * by setting the given attribute (with an empty value) on it.
   *
   * @param {string} PRESERVED_SPACE_ELEMENT_ATTRIBUTE_NAME - name of the marker attribute.
   */
  function selectPreserveElements(PRESERVED_SPACE_ELEMENT_ATTRIBUTE_NAME) {
    for (const element of document.querySelectorAll("*")) {
      const { whiteSpace } = getComputedStyle(element);
      if (whiteSpace.startsWith("pre")) {
        element.setAttribute(PRESERVED_SPACE_ELEMENT_ATTRIBUTE_NAME, "");
      }
    }
  }
  /**
   * Removes the given marker attribute from every element that carries it.
   *
   * @param {string} PRESERVED_SPACE_ELEMENT_ATTRIBUTE_NAME - name of the marker attribute.
   */
  function unselectPreserveElements(PRESERVED_SPACE_ELEMENT_ATTRIBUTE_NAME) {
    const markedSelector = `[${PRESERVED_SPACE_ELEMENT_ATTRIBUTE_NAME}]`;
    for (const markedElement of document.querySelectorAll(markedSelector)) {
      markedElement.removeAttribute(PRESERVED_SPACE_ELEMENT_ATTRIBUTE_NAME);
    }
  }
  /**
   * Flags the hidden elements of <body> by setting the given attribute (with
   * an empty value) on them.
   *
   * An element is flagged when it is an HTMLElement that
   *  - has the `hidden` property set, or is computed as `display: none`, or
   *  - is fully transparent or `visibility: hidden` AND has neither client
   *    width nor client height,
   * and that contains no iframe, frame or HTML <object> descendant.
   * style, script, link, frame, iframe and object elements are never candidates.
   *
   * @param {string} REMOVED_CONTENT_ATTRIBUTE_NAME - name of the marker attribute.
   */
  function selectRemovedElements(REMOVED_CONTENT_ATTRIBUTE_NAME) {
    const candidatesSelector = "html > body *:not(style):not(script):not(link):not(frame):not(iframe):not(object)";
    const embeddedDocumentSelector = "iframe, frame, object[type=\"text/html\"][data]";
    document.querySelectorAll(candidatesSelector).forEach(element => {
      if (!(element instanceof HTMLElement)) {
        return;
      }
      const style = getComputedStyle(element);
      // Computed style values are strings ("0", "0.5", ...): comparing the raw
      // value with the number 0 using === never matches, so parse it first.
      const transparent = Number.parseFloat(style.opacity) === 0;
      const invisible = transparent || style.visibility === "hidden";
      const collapsed = !element.clientWidth && !element.clientHeight;
      const hidden = element.hidden || style.display === "none" || (invisible && collapsed);
      if (hidden && !element.querySelector(embeddedDocumentSelector)) {
        element.setAttribute(REMOVED_CONTENT_ATTRIBUTE_NAME, "");
      }
    });
  }
  /**
   * Removes the given marker attribute from every element that carries it.
   *
   * @param {string} REMOVED_CONTENT_ATTRIBUTE_NAME - name of the marker attribute.
   */
  function unselectRemovedElements(REMOVED_CONTENT_ATTRIBUTE_NAME) {
    const markedSelector = `[${REMOVED_CONTENT_ATTRIBUTE_NAME}]`;
    for (const markedElement of document.querySelectorAll(markedSelector)) {
      markedElement.removeAttribute(REMOVED_CONTENT_ATTRIBUTE_NAME);
    }
  }
  /**
   * Marks the content covered by the first range of the current selection.
   *
   * The element containing the whole range (the common ancestor itself when it
   * is an element, its parent element otherwise) receives the root attribute.
   * The nodes below the common ancestor are then walked in document order:
   * from the range's start container up to, but not including, its end
   * container, each element (or the parent element of each non-element node)
   * receives the content attribute.
   *
   * Nothing is marked when there is no selection range.
   *
   * @param {string} SELECTED_CONTENT_ATTRIBUTE_NAME - attribute set on the selected elements.
   * @param {string} SELECTED_CONTENT_ROOT_ATTRIBUTE_NAME - attribute set on the selection root.
   */
  function selectSelectedContent(SELECTED_CONTENT_ATTRIBUTE_NAME, SELECTED_CONTENT_ROOT_ATTRIBUTE_NAME) {
    const selection = getSelection();
    if (!selection || !selection.rangeCount) {
      // No range to read: dereferencing it would throw.
      return;
    }
    const range = selection.getRangeAt(0);
    const commonAncestor = range.commonAncestorContainer;
    // Compare the node *type* with ELEMENT_NODE: comparing the node itself with
    // the constant is always "different" and always selects the parent element.
    const ancestorElement = commonAncestor.nodeType == Node.ELEMENT_NODE ? commonAncestor : commonAncestor.parentElement;
    if (ancestorElement) {
      ancestorElement.setAttribute(SELECTED_CONTENT_ROOT_ATTRIBUTE_NAME, "");
    }
    const treeWalker = document.createTreeWalker(commonAncestor);
    let selectionFound = false;
    while (treeWalker.nextNode() && treeWalker.currentNode != range.endContainer) {
      const currentNode = treeWalker.currentNode;
      if (currentNode == range.startContainer) {
        selectionFound = true;
      }
      if (selectionFound) {
        const element = currentNode.nodeType == Node.ELEMENT_NODE ? currentNode : currentNode.parentElement;
        element.setAttribute(SELECTED_CONTENT_ATTRIBUTE_NAME, "");
      }
    }
  }
  /**
   * Removes both selection marker attributes from every element carrying
   * them: the content attribute first, then the root attribute.
   *
   * @param {string} SELECTED_CONTENT_ATTRIBUTE_NAME - attribute set on the selected elements.
   * @param {string} SELECTED_CONTENT_ROOT_ATTRIBUTE_NAME - attribute set on the selection root.
   */
  function unselectSelectedContent(SELECTED_CONTENT_ATTRIBUTE_NAME, SELECTED_CONTENT_ROOT_ATTRIBUTE_NAME) {
    const markerNames = [SELECTED_CONTENT_ATTRIBUTE_NAME, SELECTED_CONTENT_ROOT_ATTRIBUTE_NAME];
    for (const markerName of markerNames) {
      for (const markedElement of document.querySelectorAll(`[${markerName}]`)) {
        markedElement.removeAttribute(markerName);
      }
    }
  }
  /**
   * Completes the given options object in place and returns it.
   *
   * Adds the canvas snapshots, the frames data (unless `removeFrames` is set),
   * forces `jsEnabled` to true and installs an `onprogress` handler that
   * relays progress events to the extension and, when `shadowEnabled` is set,
   * to the page UI.
   *
   * @param {Object} options - options received with the save request; mutated.
   * @returns {Promise<Object>} the same `options` object.
   */
  async function getOptions(options) {
    options.canvasData = getCanvasData();
    if (!options.removeFrames) {
      options.framesData = await FrameTree.getFramesData();
    }
    options.jsEnabled = true;
    options.onprogress = async progressEvent => {
      const eventType = progressEvent.type;
      const isResourceEvent = eventType == progressEvent.RESOURCES_INITIALIZED || eventType == progressEvent.RESOURCE_LOADED;
      if (isResourceEvent) {
        try {
          await browser.runtime.sendMessage({ processProgress: true, index: progressEvent.details.index, maxIndex: progressEvent.details.max });
        } catch (error) {
          // ignored
        }
        if (options.shadowEnabled) {
          singlefile.ui.onprogress(progressEvent);
        }
        return;
      }
      if (eventType == progressEvent.PAGE_ENDED) {
        try {
          await browser.runtime.sendMessage({ processEnd: true });
        } catch (error) {
          // ignored
        }
      }
    };
    return options;
  }
  /**
   * Takes a PNG snapshot of every canvas element of the document.
   *
   * @returns {Array<?Object>} one entry per canvas, in document order:
   *   `{ dataURI, width, height }`, or `null` when reading the canvas throws.
   */
  function getCanvasData() {
    return Array.from(document.querySelectorAll("canvas"), canvasElement => {
      try {
        return {
          dataURI: canvasElement.toDataURL("image/png", ""),
          width: canvasElement.clientWidth,
          height: canvasElement.clientHeight
        };
      } catch (error) {
        return null;
      }
    });
  }
  /**
   * Serializes the doctype of a document.
   *
   * @param {Object} doc - document whose `doctype` is read.
   * @returns {string} the "<!DOCTYPE ...>" declaration followed by a newline,
   *   or an empty string when the document has no doctype.
   */
  function getDoctype(doc) {
    const docType = doc.doctype;
    if (!docType) {
      return "";
    }
    const { publicId, systemId, internalSubset } = docType;
    const parts = ["<!DOCTYPE " + docType.nodeName];
    if (publicId) {
      parts.push(` PUBLIC "${publicId}"`);
      if (systemId) {
        parts.push(` "${systemId}"`);
      }
    } else if (systemId) {
      parts.push(` SYSTEM "${systemId}"`);
    }
    if (internalSubset) {
      parts.push(` [${internalSubset}]`);
    }
    parts.push(">\n");
    return parts.join("");
  }
  /**
   * Asks the extension to download the processed page and, when the extension
   * answers that it cannot (`notSupported`), downloads it from the page itself
   * through a temporary link.
   *
   * In the fallback path the user is prompted for the file name when
   * `options.confirmFilename` is set; `page.filename` is overwritten with the
   * answer and nothing is downloaded if it ends up empty.
   *
   * @param {Object} page - page data providing `url` and `filename`.
   * @param {Object} options - save options; only `confirmFilename` is read here.
   * @returns {Promise<void>}
   */
  async function downloadPage(page, options) {
    const downloadRequest = { download: true, url: page.url, saveAs: options.confirmFilename, filename: page.filename };
    const response = await browser.runtime.sendMessage(downloadRequest);
    if (!response.notSupported) {
      return;
    }
    if (options.confirmFilename) {
      page.filename = prompt("File name", page.filename);
    }
    const hasFilename = page.filename && page.filename.length;
    if (!hasFilename) {
      return;
    }
    // Trigger the download with a synthetic click on a temporary link.
    const downloadLink = document.createElement("a");
    document.body.appendChild(downloadLink);
    downloadLink.download = page.filename;
    downloadLink.href = page.url;
    downloadLink.dispatchEvent(new MouseEvent("click"));
    downloadLink.remove();
  }
  215. })();