fix(sitemap): temporarily disable tlsclient

This commit is contained in:
Móricz Gergő 2025-01-23 06:56:15 +01:00
parent d162247703
commit 51a0e233e3

View File

@ -37,42 +37,45 @@ export async function getLinksFromSitemap(
) { ) {
content = fetchResponse.document.rawHtml!; content = fetchResponse.document.rawHtml!;
} else { } else {
logger.debug( // logger.debug(
"Failed to scrape sitemap via fetch, falling back to TLSClient...", // "Failed to scrape sitemap via fetch, falling back to TLSClient...",
{ // {
error: fetchResponse.success // error: fetchResponse.success
? fetchResponse.document // ? fetchResponse.document
: fetchResponse.error, // : fetchResponse.error,
}, // },
); // );
const tlsResponse = await scrapeURL( // const tlsResponse = await scrapeURL(
"sitemap", // "sitemap",
sitemapUrl, // sitemapUrl,
scrapeOptions.parse({ formats: ["rawHtml"] }), // scrapeOptions.parse({ formats: ["rawHtml"] }),
{ forceEngine: "fire-engine;tlsclient", v0DisableJsDom: true }, // { forceEngine: "fire-engine;tlsclient", v0DisableJsDom: true },
); // );
if ( // if (
tlsResponse.success && // tlsResponse.success &&
tlsResponse.document.metadata.statusCode >= 200 && // tlsResponse.document.metadata.statusCode >= 200 &&
tlsResponse.document.metadata.statusCode < 300 // tlsResponse.document.metadata.statusCode < 300
) { // ) {
content = tlsResponse.document.rawHtml!; // content = tlsResponse.document.rawHtml!;
} else { // } else {
logger.error( logger.error(
`Request failed for ${sitemapUrl}, ran out of engines!`, `Request failed for ${sitemapUrl}, ran out of engines!`,
{ {
method: "getLinksFromSitemap", method: "getLinksFromSitemap",
mode, mode,
sitemapUrl, sitemapUrl,
error: tlsResponse.success // error: tlsResponse.success
? tlsResponse.document // ? tlsResponse.document
: tlsResponse.error, // : tlsResponse.error,
error: fetchResponse.success
? fetchResponse.document
: fetchResponse.error,
}, },
); );
return 0; return 0;
} // }
} }
} else { } else {
const fetchResponse = await scrapeURL( const fetchResponse = await scrapeURL(