diff options
| author | Mohamed Bassem <me@mbassem.com> | 2025-06-22 21:15:42 +0000 |
|---|---|---|
| committer | Mohamed Bassem <me@mbassem.com> | 2025-06-22 21:15:42 +0000 |
| commit | b74377d232d7a329261249fb14e49e18475180b2 (patch) | |
| tree | a120c616a9c8af507bad290e13010b974fd57f62 /apps/workers | |
| parent | 7cc4b08aab654818933d655ee3cbd2db217090a2 (diff) | |
| download | karakeep-b74377d232d7a329261249fb14e49e18475180b2.tar.zst | |
fix(workers): Fix jsdom console logs leaking into worker logs
Diffstat (limited to 'apps/workers')
| -rw-r--r-- | apps/workers/workers/crawlerWorker.ts | 5 |
1 files changed, 3 insertions, 2 deletions
```diff
diff --git a/apps/workers/workers/crawlerWorker.ts b/apps/workers/workers/crawlerWorker.ts
index bf083ff6..1d45dc12 100644
--- a/apps/workers/workers/crawlerWorker.ts
+++ b/apps/workers/workers/crawlerWorker.ts
@@ -9,7 +9,7 @@ import DOMPurify from "dompurify";
 import { eq } from "drizzle-orm";
 import { execa } from "execa";
 import { isShuttingDown } from "exit";
-import { JSDOM } from "jsdom";
+import { JSDOM, VirtualConsole } from "jsdom";
 import { DequeuedJob, Runner } from "liteque";
 import metascraper from "metascraper";
 import metascraperAmazon from "metascraper-amazon";
@@ -399,7 +399,8 @@ function extractReadableContent(
   logger.info(
     `[Crawler][${jobId}] Will attempt to extract readable content ...`,
   );
-  const dom = new JSDOM(htmlContent, { url });
+  const virtualConsole = new VirtualConsole();
+  const dom = new JSDOM(htmlContent, { url, virtualConsole });
   const readableContent = new Readability(dom.window.document).parse();
   if (!readableContent || typeof readableContent.content !== "string") {
     return null;
```
