2020-10-09 18:35:46 +01:00
|
|
|
import { ImportExportResult } from './types';
|
2020-11-05 16:58:23 +00:00
|
|
|
import { _ } from '../../locale';
|
2020-10-09 18:35:46 +01:00
|
|
|
|
2021-01-22 17:41:11 +00:00
|
|
|
import InteropService_Importer_Base from './InteropService_Importer_Base';
|
|
|
|
import Folder from '../../models/Folder';
|
|
|
|
import Note from '../../models/Note';
|
2021-08-22 16:35:45 -07:00
|
|
|
import { NoteEntity } from '../database/types';
|
|
|
|
import { basename, filename, rtrimSlashes, fileExtension, dirname } from '../../path-utils';
|
2021-01-22 17:41:11 +00:00
|
|
|
import shim from '../../shim';
|
|
|
|
import markdownUtils from '../../markdownUtils';
|
2021-08-22 16:35:45 -07:00
|
|
|
import htmlUtils from '../../htmlUtils';
|
2022-05-26 15:57:44 +01:00
|
|
|
import { unique } from '../../ArrayUtils';
|
2020-11-05 16:58:23 +00:00
|
|
|
const { pregQuote } = require('../../string-utils-common');
|
2021-08-22 16:35:45 -07:00
|
|
|
import { MarkupToHtml } from '@joplin/renderer';
|
2018-02-26 19:25:54 +00:00
|
|
|
|
2020-10-09 18:35:46 +01:00
|
|
|
export default class InteropService_Importer_Md extends InteropService_Importer_Base {
|
2021-08-22 16:35:45 -07:00
|
|
|
private importedNotes: Record<string, NoteEntity> = {};
|
|
|
|
|
2023-03-06 14:22:01 +00:00
|
|
|
public async exec(result: ImportExportResult) {
|
2018-02-27 20:04:38 +00:00
|
|
|
let parentFolderId = null;
|
2018-02-26 19:25:54 +00:00
|
|
|
|
2018-09-09 20:32:23 +01:00
|
|
|
const sourcePath = rtrimSlashes(this.sourcePath_);
|
2018-06-26 00:07:53 +01:00
|
|
|
|
2018-02-26 19:25:54 +00:00
|
|
|
const filePaths = [];
|
2018-09-09 20:32:23 +01:00
|
|
|
if (await shim.fsDriver().isDirectory(sourcePath)) {
|
2018-02-27 20:04:38 +00:00
|
|
|
if (!this.options_.destinationFolder) {
|
2018-09-09 20:32:23 +01:00
|
|
|
const folderTitle = await Folder.findUniqueItemTitle(basename(sourcePath));
|
2018-02-27 20:04:38 +00:00
|
|
|
const folder = await Folder.save({ title: folderTitle });
|
|
|
|
parentFolderId = folder.id;
|
|
|
|
} else {
|
|
|
|
parentFolderId = this.options_.destinationFolder.id;
|
|
|
|
}
|
2018-09-09 20:32:23 +01:00
|
|
|
|
2020-11-25 14:40:25 +00:00
|
|
|
await this.importDirectory(sourcePath, parentFolderId);
|
2018-02-26 19:25:54 +00:00
|
|
|
} else {
|
2018-02-27 20:04:38 +00:00
|
|
|
if (!this.options_.destinationFolder) throw new Error(_('Please specify the notebook where the notes should be imported to.'));
|
2019-07-29 15:43:53 +02:00
|
|
|
parentFolderId = this.options_.destinationFolder.id;
|
2018-09-09 20:32:23 +01:00
|
|
|
filePaths.push(sourcePath);
|
2018-02-26 19:25:54 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
for (let i = 0; i < filePaths.length; i++) {
|
2018-09-09 20:32:23 +01:00
|
|
|
await this.importFile(filePaths[i], parentFolderId);
|
2018-02-26 19:25:54 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
return result;
|
|
|
|
}
|
|
|
|
|
2023-03-06 14:22:01 +00:00
|
|
|
public async importDirectory(dirPath: string, parentFolderId: string) {
|
2018-09-09 20:32:23 +01:00
|
|
|
const supportedFileExtension = this.metadata().fileExtensions;
|
|
|
|
const stats = await shim.fsDriver().readDirStats(dirPath);
|
|
|
|
for (let i = 0; i < stats.length; i++) {
|
|
|
|
const stat = stats[i];
|
|
|
|
|
|
|
|
if (stat.isDirectory()) {
|
2022-03-29 00:13:13 +08:00
|
|
|
if (await this.isDirectoryEmpty(`${dirPath}/${stat.path}`)) {
|
|
|
|
continue;
|
|
|
|
}
|
2018-09-09 20:32:23 +01:00
|
|
|
const folderTitle = await Folder.findUniqueItemTitle(basename(stat.path));
|
|
|
|
const folder = await Folder.save({ title: folderTitle, parent_id: parentFolderId });
|
2020-11-25 14:40:25 +00:00
|
|
|
await this.importDirectory(`${dirPath}/${basename(stat.path)}`, folder.id);
|
2018-09-09 20:32:23 +01:00
|
|
|
} else if (supportedFileExtension.indexOf(fileExtension(stat.path).toLowerCase()) >= 0) {
|
2020-11-25 14:40:25 +00:00
|
|
|
await this.importFile(`${dirPath}/${stat.path}`, parentFolderId);
|
2018-09-09 20:32:23 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2022-03-29 00:13:13 +08:00
|
|
|
private async isDirectoryEmpty(dirPath: string) {
|
|
|
|
const supportedFileExtension = this.metadata().fileExtensions;
|
|
|
|
const innerStats = await shim.fsDriver().readDirStats(dirPath);
|
|
|
|
for (let i = 0; i < innerStats.length; i++) {
|
|
|
|
const innerStat = innerStats[i];
|
|
|
|
|
|
|
|
if (innerStat.isDirectory()) {
|
|
|
|
if (!(await this.isDirectoryEmpty(`${dirPath}/${innerStat.path}`))) {
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
} else if (supportedFileExtension.indexOf(fileExtension(innerStat.path).toLowerCase()) >= 0) {
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return true;
|
|
|
|
|
|
|
|
}
|
|
|
|
|
2021-08-22 16:35:45 -07:00
|
|
|
private trimAnchorLink(link: string) {
|
|
|
|
if (link.indexOf('#') <= 0) return link;
|
|
|
|
|
|
|
|
const splitted = link.split('#');
|
|
|
|
splitted.pop();
|
|
|
|
return splitted.join('#');
|
|
|
|
}
|
|
|
|
|
2023-06-30 09:55:56 +01:00
|
|
|
// Parse text for links, attempt to find local file, if found create Joplin resource
|
|
|
|
// and update link accordingly.
|
2023-03-06 14:22:01 +00:00
|
|
|
public async importLocalFiles(filePath: string, md: string, parentFolderId: string) {
|
Desktop: when importing MD files create resources for local linked files (#2262)
* md importer: first pass import attachment resources with markdown files
* md importer: import resources from md - no unneeded saves, check if files exist, regex name
* md importer: test import of local files as resources, separate method for importing linked files, comment regex matching md tags
* md importer: move stateful regex to method scope, remove spurius await
* md importer: lint
* md importer: respond to PR comments: remove test nesting, test sample, check if path is dir, use shim.fsDriver
* md importer: use file-path methods for getting attachment path
* md importer: use extractImageUrls helper, test for file with zero links
* md importer: try catch around importLocalImages, improve test
* md importer: importing attached images cover case where link also appears elsewhere in doc
* md importer: only create 1 resource if note contains duplicate links, test
* md importer: remove log
* md importer: remove use of lodash
2020-01-19 15:39:38 +00:00
|
|
|
let updated = md;
|
2021-08-22 16:35:45 -07:00
|
|
|
const markdownLinks = markdownUtils.extractFileUrls(md);
|
|
|
|
const htmlLinks = htmlUtils.extractFileUrls(md);
|
|
|
|
const fileLinks = unique(markdownLinks.concat(htmlLinks));
|
2021-05-19 23:22:03 +02:00
|
|
|
await Promise.all(fileLinks.map(async (encodedLink: string) => {
|
2020-03-27 12:20:38 +00:00
|
|
|
const link = decodeURI(encodedLink);
|
2021-08-22 16:35:45 -07:00
|
|
|
// Handle anchor links appropriately
|
|
|
|
const trimmedLink = this.trimAnchorLink(link);
|
|
|
|
const attachmentPath = filename(`${dirname(filePath)}/${trimmedLink}`, true);
|
|
|
|
const pathWithExtension = `${attachmentPath}.${fileExtension(trimmedLink)}`;
|
Desktop: when importing MD files create resources for local linked files (#2262)
* md importer: first pass import attachment resources with markdown files
* md importer: import resources from md - no unneeded saves, check if files exist, regex name
* md importer: test import of local files as resources, separate method for importing linked files, comment regex matching md tags
* md importer: move stateful regex to method scope, remove spurius await
* md importer: lint
* md importer: respond to PR comments: remove test nesting, test sample, check if path is dir, use shim.fsDriver
* md importer: use file-path methods for getting attachment path
* md importer: use extractImageUrls helper, test for file with zero links
* md importer: try catch around importLocalImages, improve test
* md importer: importing attached images cover case where link also appears elsewhere in doc
* md importer: only create 1 resource if note contains duplicate links, test
* md importer: remove log
* md importer: remove use of lodash
2020-01-19 15:39:38 +00:00
|
|
|
const stat = await shim.fsDriver().stat(pathWithExtension);
|
|
|
|
const isDir = stat ? stat.isDirectory() : false;
|
|
|
|
if (stat && !isDir) {
|
2021-08-22 16:35:45 -07:00
|
|
|
const supportedFileExtension = this.metadata().fileExtensions;
|
|
|
|
const resolvedPath = shim.fsDriver().resolve(pathWithExtension);
|
2023-02-05 11:32:28 +00:00
|
|
|
let id = '';
|
2021-08-22 16:35:45 -07:00
|
|
|
// If the link looks like a note, then import it
|
|
|
|
if (supportedFileExtension.indexOf(fileExtension(trimmedLink).toLowerCase()) >= 0) {
|
|
|
|
// If the note hasn't been imported yet, do so now
|
|
|
|
if (!this.importedNotes[resolvedPath]) {
|
|
|
|
await this.importFile(resolvedPath, parentFolderId);
|
|
|
|
}
|
|
|
|
|
|
|
|
id = this.importedNotes[resolvedPath].id;
|
|
|
|
} else {
|
|
|
|
const resource = await shim.createResourceFromPath(pathWithExtension);
|
|
|
|
id = resource.id;
|
|
|
|
}
|
|
|
|
|
|
|
|
// The first is a normal link, the second is supports the <link> and [](<link with spaces>) syntax
|
|
|
|
// Only opening patterns are consider in order to cover all occurances
|
|
|
|
// We need to use the encoded link as well because some links (link's with spaces)
|
|
|
|
// will appear encoded in the source. Other links (unicode chars) will not
|
|
|
|
const linksToReplace = [this.trimAnchorLink(link), this.trimAnchorLink(encodedLink)];
|
|
|
|
|
|
|
|
for (let j = 0; j < linksToReplace.length; j++) {
|
|
|
|
const linkToReplace = pregQuote(linksToReplace[j]);
|
|
|
|
|
|
|
|
// Markdown links
|
|
|
|
updated = markdownUtils.replaceResourceUrl(updated, linkToReplace, id);
|
|
|
|
|
|
|
|
// HTML links
|
|
|
|
updated = htmlUtils.replaceResourceUrl(updated, linkToReplace, id);
|
|
|
|
}
|
Desktop: when importing MD files create resources for local linked files (#2262)
* md importer: first pass import attachment resources with markdown files
* md importer: import resources from md - no unneeded saves, check if files exist, regex name
* md importer: test import of local files as resources, separate method for importing linked files, comment regex matching md tags
* md importer: move stateful regex to method scope, remove spurius await
* md importer: lint
* md importer: respond to PR comments: remove test nesting, test sample, check if path is dir, use shim.fsDriver
* md importer: use file-path methods for getting attachment path
* md importer: use extractImageUrls helper, test for file with zero links
* md importer: try catch around importLocalImages, improve test
* md importer: importing attached images cover case where link also appears elsewhere in doc
* md importer: only create 1 resource if note contains duplicate links, test
* md importer: remove log
* md importer: remove use of lodash
2020-01-19 15:39:38 +00:00
|
|
|
}
|
|
|
|
}));
|
|
|
|
return updated;
|
|
|
|
}
|
|
|
|
|
2023-03-06 14:22:01 +00:00
|
|
|
public async importFile(filePath: string, parentFolderId: string) {
|
2021-08-22 16:35:45 -07:00
|
|
|
const resolvedPath = shim.fsDriver().resolve(filePath);
|
|
|
|
if (this.importedNotes[resolvedPath]) return this.importedNotes[resolvedPath];
|
|
|
|
|
|
|
|
const stat = await shim.fsDriver().stat(resolvedPath);
|
|
|
|
if (!stat) throw new Error(`Cannot read ${resolvedPath}`);
|
|
|
|
const ext = fileExtension(resolvedPath);
|
|
|
|
const title = filename(resolvedPath);
|
|
|
|
const body = await shim.fsDriver().readFile(resolvedPath);
|
2018-09-09 20:32:23 +01:00
|
|
|
const note = {
|
|
|
|
parent_id: parentFolderId,
|
|
|
|
title: title,
|
2021-08-22 16:35:45 -07:00
|
|
|
body: body,
|
2018-09-09 20:32:23 +01:00
|
|
|
updated_time: stat.mtime.getTime(),
|
|
|
|
created_time: stat.birthtime.getTime(),
|
|
|
|
user_updated_time: stat.mtime.getTime(),
|
|
|
|
user_created_time: stat.birthtime.getTime(),
|
2021-08-22 16:35:45 -07:00
|
|
|
markup_language: ext === 'html' ? MarkupToHtml.MARKUP_LANGUAGE_HTML : MarkupToHtml.MARKUP_LANGUAGE_MARKDOWN,
|
2018-09-09 20:32:23 +01:00
|
|
|
};
|
2021-08-22 16:35:45 -07:00
|
|
|
this.importedNotes[resolvedPath] = await Note.save(note, { autoTimestamp: false });
|
|
|
|
|
|
|
|
try {
|
|
|
|
const updatedBody = await this.importLocalFiles(resolvedPath, body, parentFolderId);
|
|
|
|
const updatedNote = {
|
|
|
|
...this.importedNotes[resolvedPath],
|
|
|
|
body: updatedBody || body,
|
|
|
|
};
|
|
|
|
this.importedNotes[resolvedPath] = await Note.save(updatedNote, { isNew: false });
|
|
|
|
} catch (error) {
|
|
|
|
// console.error(`Problem importing links for file ${resolvedPath}, error:\n ${error}`);
|
|
|
|
}
|
Desktop: when importing MD files create resources for local linked files (#2262)
* md importer: first pass import attachment resources with markdown files
* md importer: import resources from md - no unneeded saves, check if files exist, regex name
* md importer: test import of local files as resources, separate method for importing linked files, comment regex matching md tags
* md importer: move stateful regex to method scope, remove spurius await
* md importer: lint
* md importer: respond to PR comments: remove test nesting, test sample, check if path is dir, use shim.fsDriver
* md importer: use file-path methods for getting attachment path
* md importer: use extractImageUrls helper, test for file with zero links
* md importer: try catch around importLocalImages, improve test
* md importer: importing attached images cover case where link also appears elsewhere in doc
* md importer: only create 1 resource if note contains duplicate links, test
* md importer: remove log
* md importer: remove use of lodash
2020-01-19 15:39:38 +00:00
|
|
|
|
2021-08-22 16:35:45 -07:00
|
|
|
return this.importedNotes[resolvedPath];
|
2018-09-09 20:32:23 +01:00
|
|
|
}
|
2018-02-26 19:25:54 +00:00
|
|
|
}
|