example.js 2.5 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374
  1. /*
  2. * Copyright 2010-2019 Gildas Lormeau
  3. * contact : gildas.lormeau <at> gmail.com
  4. *
  5. * This file is part of SingleFile.
  6. *
  7. * The code in this file is free software: you can redistribute it and/or
  8. * modify it under the terms of the GNU Affero General Public License
  9. * (GNU AGPL) as published by the Free Software Foundation, either version 3
  10. * of the License, or (at your option) any later version.
  11. *
  12. * The code in this file is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero
  15. * General Public License for more details.
  16. *
  17. * As additional permission under GNU AGPL version 3 section 7, you may
  18. * distribute UNMODIFIED VERSIONS OF THIS file without the copy of the GNU
  19. * AGPL normally required by section 4, provided you include this license
  20. * notice and a URL through which recipients can access the Corresponding
  21. * Source.
  22. */
  23. /* global require */
  24. const fs = require("fs");
  25. const jsdom = require("jsdom");
  26. const request = require("request-promise-native");
  27. const SingleFileNode = require("./single-file-jsdom.js");
  28. run({
  29. url: "https://github.com/gildas-lormeau/SingleFile",
  30. userAgent: "Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:65.0) Gecko Firefox AppleWebKit (KHTML, like Gecko) Chrome Safari",
  31. removeHiddenElements: true,
  32. removeUnusedStyles: true,
  33. removeUnusedFonts: true,
  34. removeFrames: true,
  35. removeImports: true,
  36. removeScripts: true,
  37. compressHTML: true,
  38. compressCSS: true,
  39. loadDeferredImages: false,
  40. filenameTemplate: "{page-title} ({date-iso} {time-locale}).html",
  41. removeAudioSrc: true,
  42. removeVideoSrc: true,
  43. displayInfobar: true,
  44. removeAlternativeFonts: true,
  45. removeAlternativeMedias: true,
  46. removeAlternativeImages: true,
  47. groupDuplicateImages: true
  48. });
  49. async function run(options) {
  50. const pageContent = (await request({
  51. method: "GET",
  52. uri: options.url,
  53. resolveWithFullResponse: true,
  54. encoding: null,
  55. headers: {
  56. "User-Agent": options.userAgent
  57. }
  58. })).body.toString();
  59. const dom = new jsdom.JSDOM(pageContent, { url: options.url, virtualConsole: new jsdom.VirtualConsole(), userAgent: options.userAgent });
  60. options.win = dom.window;
  61. options.doc = dom.window.document;
  62. options.saveRawPage = true;
  63. const processor = new (SingleFileNode.getClass())(options);
  64. await processor.initialize();
  65. await processor.run();
  66. const page = await processor.getPageData();
  67. fs.writeFileSync(page.filename, page.content);
  68. }