single-file-puppeteer.js 3.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596
  1. /*
  2. * Copyright 2010-2019 Gildas Lormeau
  3. * contact : gildas.lormeau <at> gmail.com
  4. *
  5. * This file is part of SingleFile.
  6. *
  7. * The code in this file is free software: you can redistribute it and/or
  8. * modify it under the terms of the GNU Affero General Public License
  9. * (GNU AGPL) as published by the Free Software Foundation, either version 3
  10. * of the License, or (at your option) any later version.
  11. *
  12. * The code in this file is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero
  15. * General Public License for more details.
  16. *
  17. * As additional permission under GNU AGPL version 3 section 7, you may
  18. * distribute UNMODIFIED VERSIONS OF THIS file without the copy of the GNU
  19. * AGPL normally required by section 4, provided you include this license
  20. * notice and a URL through which recipients can access the Corresponding
  21. * Source.
  22. */
  23. /* global require, exports, SingleFileBrowser, frameTree, document, window */
  24. const fs = require("fs");
  25. const puppeteer = require("puppeteer-core");
  26. const SCRIPTS = [
  27. "../lib/hooks/hooks-frame.js",
  28. "../lib/frame-tree/frame-tree.js",
  29. "../lib/single-file/util/doc-util.js",
  30. "../lib/single-file/util/doc-helper.js",
  31. "../lib/single-file/util/timeout.js",
  32. "../lib/single-file/vendor/css-tree.js",
  33. "../lib/single-file/vendor/html-srcset-parser.js",
  34. "../lib/single-file/vendor/css-minifier.js",
  35. "../lib/single-file/vendor/css-font-property-parser.js",
  36. "../lib/single-file/vendor/css-media-query-parser.js",
  37. "../lib/single-file/modules/html-minifier.js",
  38. "../lib/single-file/modules/css-fonts-minifier.js",
  39. "../lib/single-file/modules/css-fonts-alt-minifier.js",
  40. "../lib/single-file/modules/css-matched-rules.js",
  41. "../lib/single-file/modules/css-medias-alt-minifier.js",
  42. "../lib/single-file/modules/css-rules-minifier.js",
  43. "../lib/single-file/modules/html-images-alt-minifier.js",
  44. "../lib/single-file/modules/html-serializer.js",
  45. "../lib/single-file/single-file-core.js",
  46. "../lib/single-file/single-file-browser.js"
  47. ];
  48. exports.getPageData = async options => {
  49. const browserOptions = {
  50. headless: options.puppeteerHeadless === undefined ? true : options.puppeteerHeadless,
  51. "args": ["--disable-web-security"]
  52. };
  53. if (options.puppeteerExecutablePath) {
  54. browserOptions.executablePath = options.puppeteerExecutablePath;
  55. }
  56. const browser = await puppeteer.launch(browserOptions);
  57. let page;
  58. try {
  59. page = await browser.newPage();
  60. if (options.userAgent) {
  61. await page.setUserAgent(options.userAgent);
  62. }
  63. await page.setBypassCSP(true);
  64. if (options.loadDeferredImages) {
  65. SCRIPTS.unshift("../lib/lazy/web/web-lazy-loader-before");
  66. }
  67. await Promise.all(SCRIPTS.map(scriptPath => page.evaluateOnNewDocument(fs.readFileSync(require.resolve(scriptPath)).toString())));
  68. await page.goto(options.url, {
  69. waitUntil: options.puppeteerWaitUntil || "networkidle0"
  70. });
  71. const pageData = await page.evaluate(async options => {
  72. options.insertSingleFileComment = true;
  73. options.insertFaviconLink = true;
  74. if (!options.saveRawPage && !options.removeFrames) {
  75. options.framesData = await frameTree.getAsync(options);
  76. }
  77. options.doc = document;
  78. options.win = window;
  79. const SingleFile = SingleFileBrowser.getClass();
  80. const singleFile = new SingleFile(options);
  81. await singleFile.initialize();
  82. await singleFile.run();
  83. return singleFile.getPageData();
  84. }, options);
  85. return pageData;
  86. } finally {
  87. if (page) {
  88. page.close();
  89. }
  90. }
  91. };