single-file-puppeteer.js 3.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100
  1. /*
  2. * Copyright 2010-2019 Gildas Lormeau
  3. * contact : gildas.lormeau <at> gmail.com
  4. *
  5. * This file is part of SingleFile.
  6. *
  7. * The code in this file is free software: you can redistribute it and/or
  8. * modify it under the terms of the GNU Affero General Public License
  9. * (GNU AGPL) as published by the Free Software Foundation, either version 3
  10. * of the License, or (at your option) any later version.
  11. *
  12. * The code in this file is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero
  15. * General Public License for more details.
  16. *
  17. * As additional permission under GNU AGPL version 3 section 7, you may
  18. * distribute UNMODIFIED VERSIONS OF THIS file without the copy of the GNU
  19. * AGPL normally required by section 4, provided you include this license
  20. * notice and a URL through which recipients can access the Corresponding
  21. * Source.
  22. */
  23. /* global require, exports, SingleFileBrowser, frameTree, document, window */
  24. const fs = require("fs");
  25. const puppeteer = require("puppeteer-core");
  26. const SCRIPTS = [
  27. "../lib/hooks/hooks-frame.js",
  28. "../lib/frame-tree/frame-tree.js",
  29. "../lib/single-file/util/doc-util.js",
  30. "../lib/single-file/util/doc-helper.js",
  31. "../lib/single-file/util/timeout.js",
  32. "../lib/single-file/vendor/css-tree.js",
  33. "../lib/single-file/vendor/html-srcset-parser.js",
  34. "../lib/single-file/vendor/css-minifier.js",
  35. "../lib/single-file/vendor/css-font-property-parser.js",
  36. "../lib/single-file/vendor/css-media-query-parser.js",
  37. "../lib/single-file/modules/html-minifier.js",
  38. "../lib/single-file/modules/css-fonts-minifier.js",
  39. "../lib/single-file/modules/css-fonts-alt-minifier.js",
  40. "../lib/single-file/modules/css-matched-rules.js",
  41. "../lib/single-file/modules/css-medias-alt-minifier.js",
  42. "../lib/single-file/modules/css-rules-minifier.js",
  43. "../lib/single-file/modules/html-images-alt-minifier.js",
  44. "../lib/single-file/modules/html-serializer.js",
  45. "../lib/single-file/single-file-core.js",
  46. "../lib/single-file/single-file-browser.js"
  47. ];
  48. exports.getPageData = async options => {
  49. const browserOptions = {};
  50. if (options.browserHeadless !== undefined) {
  51. browserOptions.headless = options.browserHeadless;
  52. }
  53. if (options.browserDisableWebSecurity === undefined || options.browserDisableWebSecurity) {
  54. browserOptions.args = ["--disable-web-security"];
  55. }
  56. if (options.browserExecutablePath) {
  57. browserOptions.executablePath = options.browserExecutablePath;
  58. }
  59. let browser;
  60. try {
  61. browser = await puppeteer.launch(browserOptions);
  62. const page = await browser.newPage();
  63. if (options.userAgent) {
  64. await page.setUserAgent(options.userAgent);
  65. }
  66. if (options.browserBypassCSP === undefined || options.browserBypassCSP) {
  67. await page.setBypassCSP(true);
  68. }
  69. if (options.loadDeferredImages) {
  70. SCRIPTS.unshift("../lib/lazy/web/web-lazy-loader-before");
  71. }
  72. await Promise.all(SCRIPTS.map(scriptPath => page.evaluateOnNewDocument(fs.readFileSync(require.resolve(scriptPath)).toString())));
  73. await page.goto(options.url, {
  74. waitUntil: "networkidle0"
  75. });
  76. return await page.evaluate(async options => {
  77. options.insertSingleFileComment = true;
  78. options.insertFaviconLink = true;
  79. if (!options.saveRawPage && !options.removeFrames) {
  80. options.framesData = await frameTree.getAsync(options);
  81. }
  82. options.doc = document;
  83. options.win = window;
  84. const SingleFile = SingleFileBrowser.getClass();
  85. const singleFile = new SingleFile(options);
  86. await singleFile.initialize();
  87. await singleFile.run();
  88. return await singleFile.getPageData();
  89. }, options);
  90. } finally {
  91. if (browser) {
  92. await browser.close();
  93. }
  94. }
  95. };