Ignore SSL errors for web scraper

resolves #2114
This commit is contained in:
timothycarambat 2024-08-14 09:11:22 -07:00
parent b541623c9e
commit 619f6b3884
2 changed files with 4 additions and 3 deletions

View File

@ -57,6 +57,7 @@ async function getPageContent(link) {
const loader = new PuppeteerWebBaseLoader(link, { const loader = new PuppeteerWebBaseLoader(link, {
launchOptions: { launchOptions: {
headless: "new", headless: "new",
ignoreHTTPSErrors: true,
}, },
gotoOptions: { gotoOptions: {
waitUntil: "domcontentloaded", waitUntil: "domcontentloaded",

View File

@ -9,7 +9,7 @@
* We have gotten this report many times, marked them as duplicate or information and continue to get them. We communicate * We have gotten this report many times, marked them as duplicate or information and continue to get them. We communicate
* already that deployment (and security) of an instance is on the deployer and system admin deploying it. This would include * already that deployment (and security) of an instance is on the deployer and system admin deploying it. This would include
* isolation, firewalls, and the general security of the instance. * isolation, firewalls, and the general security of the instance.
*/ */
const VALID_PROTOCOLS = ["https:", "http:"]; const VALID_PROTOCOLS = ["https:", "http:"];
const INVALID_OCTETS = [192, 172, 10, 127]; const INVALID_OCTETS = [192, 172, 10, 127];
@ -32,7 +32,7 @@ function validURL(url) {
if (!VALID_PROTOCOLS.includes(destination.protocol)) return false; if (!VALID_PROTOCOLS.includes(destination.protocol)) return false;
if (isInvalidIp(destination)) return false; if (isInvalidIp(destination)) return false;
return true; return true;
} catch { } } catch {}
return false; return false;
} }