mirror of
https://github.com/laurent22/joplin.git
synced 2024-12-15 09:04:04 +02:00
64 lines
1.5 KiB
JavaScript
64 lines
1.5 KiB
JavaScript
const jsdom = require("jsdom");
|
|
const { JSDOM } = jsdom;
|
|
const urlUtils = require('lib/urlUtils.js');
|
|
|
|
function headAndBodyHtml_(doc) {
|
|
const output = [];
|
|
if (doc.head) output.push(doc.head.innerHTML);
|
|
if (doc.body) output.push(doc.body.innerHTML);
|
|
return output.join('\n');
|
|
}
|
|
|
|
const htmlUtils = {
|
|
|
|
extractImageUrls(html) {
|
|
if (!html) return [];
|
|
|
|
const dom = new JSDOM(html);
|
|
const imgs = dom.window.document.getElementsByTagName('img');
|
|
const output = [];
|
|
|
|
for (const img of imgs) {
|
|
const src = img.getAttribute('src');
|
|
if (!src) continue;
|
|
output.push(src);
|
|
}
|
|
|
|
return output;
|
|
},
|
|
|
|
replaceImageUrls(html, callback) {
|
|
if (!html) return '';
|
|
|
|
const dom = new JSDOM(html);
|
|
const doc = dom.window.document;
|
|
const imgs = doc.getElementsByTagName('img');
|
|
|
|
for (const img of imgs) {
|
|
const src = img.getAttribute('src');
|
|
const newSrc = callback(src);
|
|
img.setAttribute('src', newSrc);
|
|
}
|
|
|
|
// This function returns the head and body but without the <head> and <body>
|
|
// tag, which for our purpose are not needed and can cause issues when present.
|
|
return headAndBodyHtml_(doc);
|
|
},
|
|
|
|
prependBaseUrl(html, baseUrl) {
|
|
const dom = new JSDOM(html);
|
|
const doc = dom.window.document;
|
|
const anchors = doc.getElementsByTagName('a');
|
|
|
|
for (const anchor of anchors) {
|
|
const href = anchor.getAttribute('href');
|
|
const newHref = urlUtils.prependBaseUrl(href, baseUrl);
|
|
anchor.setAttribute('href', newHref);
|
|
}
|
|
|
|
return headAndBodyHtml_(doc);
|
|
},
|
|
|
|
};
|
|
|
|
module.exports = htmlUtils; |