import { CheerioAPI } from 'cheerio'; import DoubanAbstractLoadHandler from "./DoubanAbstractLoadHandler"; import DoubanNoteSubject from 'douban/model/DoubanNoteSubject'; import DoubanPlugin from "main"; import { DoubanPluginSettings } from "douban/Douban"; import DoubanSubject from "douban/model/DoubanSubject"; import html2markdown from '@notable/html2markdown'; import { moment } from "obsidian"; export default class DoubanNoteLoadHandler extends DoubanAbstractLoadHandler { parseText(extract: DoubanNoteSubject, settings:DoubanPluginSettings): string { return settings.bookTemplate ? settings.noteTemplate .replaceAll("{{id}}", extract.id) .replaceAll("{{type}}", extract.type ? extract.type : "") .replaceAll("{{title}}", extract.title ? extract.title : "") .replaceAll("{{desc}}", extract.desc ? extract.desc : "") .replaceAll("{{image}}", extract.image ? extract.image : "") .replaceAll("{{timePublished}}", extract.timePublished ? moment(extract.timePublished).format(settings.dateTimeFormat) : "") .replaceAll("{{url}}", extract.url ? extract.url : "") .replaceAll("{{content}}", extract.content ? extract.content : "") .replaceAll("{{url}}", extract.url ? extract.url : "") .replaceAll("{{authorUrl}}", extract.authorUrl ? extract.authorUrl : "") .replaceAll("{{author}}", extract.author ? extract.author : "") : undefined; } support(extract: DoubanSubject): boolean { return extract && extract.type && (extract.type.contains("日记") || extract.type.contains("Note") || extract.type.contains("Article")); } constructor(doubanPlugin:DoubanPlugin) { super(doubanPlugin); } parseSubjectFromHtml(html: CheerioAPI): DoubanNoteSubject { var title = html(html("head > meta[property= 'og:title']").get(0)).attr("content"); var desc = html(html("head > meta[property= 'og:description']").get(0)).attr("content"); var url = html(html("head > meta[property= 'og:url']").get(0)).attr("content"); var image = html(html("head > meta[property= 'og:image']").get(0)).attr("content"); var type = html(html("head > meta[property= 'og:type']").get(0)).attr("content"); var authorA = html(html("a.note-author").get(0)); var timePublished = html(html(".pub-date").get(0)).text(); var content = html(html(".note").get(1)); var idPattern = /(\d){5,10}/g; var id = idPattern.exec(url); const result:DoubanNoteSubject = { image: image, timePublished: timePublished ? new Date(timePublished) : null, content: content ? html2markdown(content.toString()): "", id: id ? id[0] : "", type: "Article", title: title, desc: desc, url: url, author: authorA ? authorA.text() : null, authorUrl: authorA ? authorA.attr("href") : null, }; return result; } }