diff options
| author | Mohamed Bassem <me@mbassem.com> | 2025-12-07 11:43:14 +0000 |
|---|---|---|
| committer | Mohamed Bassem <me@mbassem.com> | 2025-12-07 11:43:14 +0000 |
| commit | e3cc54636349361a8672dc261973b19680f614e3 (patch) | |
| tree | f5ed91c426c46ef6279d18d4ecc654e9a827a252 /apps/workers | |
| parent | cf2a12c8046b29c3fcf315d3a2598555175e1aee (diff) | |
| download | karakeep-e3cc54636349361a8672dc261973b19680f614e3.tar.zst | |
fix: better extraction for youtube thumbnails. #2204
Diffstat (limited to 'apps/workers')
| -rw-r--r-- | apps/workers/package.json | 1 | ||||
| -rw-r--r-- | apps/workers/workers/crawlerWorker.ts | 13 |
2 files changed, 14 insertions, 0 deletions
diff --git a/apps/workers/package.json b/apps/workers/package.json
index 1b5b2c95..fa7ffeac 100644
--- a/apps/workers/package.json
+++ b/apps/workers/package.json
@@ -41,6 +41,7 @@
     "metascraper-title": "^5.49.5",
     "metascraper-twitter": "^5.45.6",
     "metascraper-url": "^5.49.5",
+    "metascraper-youtube": "^5.49.7",
     "node-cron": "^3.0.3",
     "node-fetch": "^3.3.2",
     "pdf2json": "^3.1.5",
diff --git a/apps/workers/workers/crawlerWorker.ts b/apps/workers/workers/crawlerWorker.ts
index 44f8f0c3..cb55523f 100644
--- a/apps/workers/workers/crawlerWorker.ts
+++ b/apps/workers/workers/crawlerWorker.ts
@@ -26,6 +26,7 @@ import metascraperPublisher from "metascraper-publisher";
 import metascraperTitle from "metascraper-title";
 import metascraperTwitter from "metascraper-twitter";
 import metascraperUrl from "metascraper-url";
+import metascraperYoutube from "metascraper-youtube";
 import { crawlerStatusCodeCounter, workerStatsCounter } from "metrics";
 import {
   fetchWithProxy,
@@ -125,6 +126,18 @@ const metascraperParser = metascraper([
     datePublished: true,
   }),
   metascraperAmazon(),
+  metascraperYoutube({
+    gotOpts: {
+      agent: {
+        http: serverConfig.proxy.httpProxy
+          ? new HttpProxyAgent(getRandomProxy(serverConfig.proxy.httpProxy))
+          : undefined,
+        https: serverConfig.proxy.httpsProxy
+          ? new HttpsProxyAgent(getRandomProxy(serverConfig.proxy.httpsProxy))
+          : undefined,
+      },
+    },
+  }),
   metascraperReddit(),
   metascraperAuthor(),
   metascraperPublisher(),
