// Copied from https://gist.github.com/devster31/4e8c6548fd16ffb75c02e6f24e27f9b9 import * as cheerio from "cheerio"; import { BookmarkTypes } from "@hoarder/shared/types/bookmarks"; import { zExportSchema } from "./exportBookmarks"; export interface ParsedBookmark { title: string; content?: | { type: BookmarkTypes.LINK; url: string } | { type: BookmarkTypes.TEXT; text: string }; tags: string[]; addDate?: number; notes?: string; } export async function parseNetscapeBookmarkFile( file: File, ): Promise { const textContent = await file.text(); if (!textContent.startsWith("")) { throw Error("The uploaded html file does not seem to be a bookmark file"); } const $ = cheerio.load(textContent); return $("a") .map(function (_index, a) { const $a = $(a); const addDate = $a.attr("add_date"); let tags: string[] = []; const tagsStr = $a.attr("tags"); try { tags = tagsStr && tagsStr.length > 0 ? tagsStr.split(",") : []; } catch (e) { /* empty */ } const url = $a.attr("href"); return { title: $a.text(), content: url ? { type: BookmarkTypes.LINK as const, url } : undefined, tags, addDate: typeof addDate === "undefined" ? undefined : parseInt(addDate), }; }) .get(); } export async function parsePocketBookmarkFile( file: File, ): Promise { const textContent = await file.text(); const $ = cheerio.load(textContent); return $("a") .map(function (_index, a) { const $a = $(a); const addDate = $a.attr("time_added"); let tags: string[] = []; const tagsStr = $a.attr("tags"); try { tags = tagsStr && tagsStr.length > 0 ? tagsStr.split(",") : []; } catch (e) { /* empty */ } const url = $a.attr("href"); return { title: $a.text(), content: url ? { type: BookmarkTypes.LINK as const, url } : undefined, tags, addDate: typeof addDate === "undefined" ? undefined : parseInt(addDate), }; }) .get(); } export async function parseHoarderBookmarkFile( file: File, ): Promise { const textContent = await file.text(); const parsed = zExportSchema.safeParse(JSON.parse(textContent)); if (!parsed.success) { throw new Error( `The uploaded JSON file contains an invalid bookmark file: ${parsed.error.toString()}`, ); } return parsed.data.bookmarks.map((bookmark) => { let content = undefined; if (bookmark.content?.type == BookmarkTypes.LINK) { content = { type: BookmarkTypes.LINK as const, url: bookmark.content.url, }; } else if (bookmark.content?.type == BookmarkTypes.TEXT) { content = { type: BookmarkTypes.TEXT as const, text: bookmark.content.text, }; } return { title: bookmark.title ?? "", content, tags: bookmark.tags, addDate: bookmark.createdAt, notes: bookmark.note ?? undefined, }; }); }