2020-10-09 18:35:46 +01:00
import { ModuleType , FileSystemItem , ImportModuleOutputFormat , Module , ImportOptions , ExportOptions , ImportExportResult , defaultImportExportModule } from './types' ;
import InteropService_Importer_Custom from './InteropService_Importer_Custom' ;
import InteropService_Exporter_Custom from './InteropService_Exporter_Custom' ;
2020-11-05 16:58:23 +00:00
import shim from '../../shim' ;
import { _ } from '../../locale' ;
2021-01-22 17:41:11 +00:00
import BaseItem from '../../models/BaseItem' ;
import BaseModel from '../../BaseModel' ;
import Resource from '../../models/Resource' ;
import Folder from '../../models/Folder' ;
import NoteTag from '../../models/NoteTag' ;
import Note from '../../models/Note' ;
2020-11-05 16:58:23 +00:00
const ArrayUtils = require ( '../../ArrayUtils' ) ;
2018-03-09 20:59:12 +00:00
const { sprintf } = require ( 'sprintf-js' ) ;
2020-11-05 16:58:23 +00:00
const { fileExtension } = require ( '../../path-utils' ) ;
const { toTitleCase } = require ( '../../string-utils' ) ;
2020-10-09 18:35:46 +01:00
const EventEmitter = require ( 'events' ) ;
export default class InteropService {
2020-11-12 19:13:28 +00:00
private defaultModules_ : Module [ ] ;
private userModules_ : Module [ ] = [ ] ;
private eventEmitter_ : any = null ;
private static instance_ : InteropService ;
2020-10-09 18:35:46 +01:00
2020-11-12 19:13:28 +00:00
public static instance ( ) : InteropService {
2020-10-09 18:35:46 +01:00
if ( ! this . instance_ ) this . instance_ = new InteropService ( ) ;
return this . instance_ ;
}
2018-02-25 17:01:16 +00:00
2018-02-27 20:04:38 +00:00
constructor ( ) {
2020-10-09 18:35:46 +01:00
this . eventEmitter_ = new EventEmitter ( ) ;
}
2020-11-12 19:13:28 +00:00
on ( eventName : string , callback : Function ) {
2020-10-09 18:35:46 +01:00
return this . eventEmitter_ . on ( eventName , callback ) ;
}
2020-11-12 19:13:28 +00:00
off ( eventName : string , callback : Function ) {
2020-10-09 18:35:46 +01:00
return this . eventEmitter_ . removeListener ( eventName , callback ) ;
2019-09-29 22:11:36 +00:00
}
2018-02-27 20:04:38 +00:00
modules() {
2020-10-09 18:35:46 +01:00
if ( ! this . defaultModules_ ) {
2020-11-12 19:13:28 +00:00
const importModules : Module [ ] = [
2019-07-29 15:43:53 +02:00
{
2020-10-09 18:35:46 +01:00
. . . defaultImportExportModule ( ModuleType . Importer ) ,
format : 'jex' ,
fileExtensions : [ 'jex' ] ,
sources : [ FileSystemItem . File ] ,
description : _ ( 'Joplin Export File' ) ,
2019-07-29 15:43:53 +02:00
} ,
2020-10-09 18:35:46 +01:00
{
. . . defaultImportExportModule ( ModuleType . Importer ) ,
format : 'md' ,
fileExtensions : [ 'md' , 'markdown' , 'txt' ] ,
sources : [ FileSystemItem . File , FileSystemItem . Directory ] ,
isNoteArchive : false , // Tells whether the file can contain multiple notes (eg. Enex or Jex format)
description : _ ( 'Markdown' ) ,
} ,
{
. . . defaultImportExportModule ( ModuleType . Importer ) ,
format : 'raw' ,
sources : [ FileSystemItem . Directory ] ,
description : _ ( 'Joplin Export Directory' ) ,
} ,
{
. . . defaultImportExportModule ( ModuleType . Importer ) ,
format : 'enex' ,
fileExtensions : [ 'enex' ] ,
sources : [ FileSystemItem . File ] ,
description : _ ( 'Evernote Export File (as Markdown)' ) ,
importerClass : 'InteropService_Importer_EnexToMd' ,
isDefault : true ,
} ,
{
. . . defaultImportExportModule ( ModuleType . Importer ) ,
format : 'enex' ,
fileExtensions : [ 'enex' ] ,
sources : [ FileSystemItem . File ] ,
description : _ ( 'Evernote Export File (as HTML)' ) ,
// TODO: Consider doing this the same way as the multiple `md` importers are handled
importerClass : 'InteropService_Importer_EnexToHtml' ,
outputFormat : ImportModuleOutputFormat.Html ,
} ,
] ;
2018-02-27 20:04:38 +00:00
2020-11-12 19:13:28 +00:00
const exportModules : Module [ ] = [
2020-10-09 18:35:46 +01:00
{
. . . defaultImportExportModule ( ModuleType . Exporter ) ,
format : 'jex' ,
fileExtensions : [ 'jex' ] ,
target : FileSystemItem.File ,
description : _ ( 'Joplin Export File' ) ,
} ,
{
. . . defaultImportExportModule ( ModuleType . Exporter ) ,
format : 'raw' ,
target : FileSystemItem.Directory ,
description : _ ( 'Joplin Export Directory' ) ,
} ,
{
. . . defaultImportExportModule ( ModuleType . Exporter ) ,
format : 'md' ,
target : FileSystemItem.Directory ,
description : _ ( 'Markdown' ) ,
} ,
{
. . . defaultImportExportModule ( ModuleType . Exporter ) ,
format : 'html' ,
fileExtensions : [ 'html' , 'htm' ] ,
target : FileSystemItem.File ,
isNoteArchive : false ,
description : _ ( 'HTML File' ) ,
} ,
{
. . . defaultImportExportModule ( ModuleType . Exporter ) ,
format : 'html' ,
target : FileSystemItem.Directory ,
description : _ ( 'HTML Directory' ) ,
} ,
] ;
2018-03-12 18:01:47 +00:00
2020-10-09 18:35:46 +01:00
this . defaultModules_ = importModules . concat ( exportModules ) ;
}
2018-02-27 20:04:38 +00:00
2020-10-09 18:35:46 +01:00
return this . defaultModules_ . concat ( this . userModules_ ) ;
}
2020-11-12 19:13:28 +00:00
public registerModule ( module : Module ) {
2020-10-09 18:35:46 +01:00
module = {
. . . defaultImportExportModule ( module . type ) ,
. . . module ,
} ;
this . userModules_ . push ( module ) ;
this . eventEmitter_ . emit ( 'modulesChanged' ) ;
2018-02-27 20:04:38 +00:00
}
2019-09-23 14:18:30 -07:00
// Find the module that matches the given type ("importer" or "exporter")
// and the given format. Some formats can have multiple assocated importers
// or exporters, such as ENEX. In this case, the one marked as "isDefault"
// is returned. This is useful to auto-detect the module based on the format.
// For more precise matching, newModuleFromPath_ should be used.
2020-11-12 19:13:28 +00:00
findModuleByFormat_ ( type : ModuleType , format : string , target : FileSystemItem = null , outputFormat : ImportModuleOutputFormat = null ) {
2018-02-27 20:04:38 +00:00
const modules = this . modules ( ) ;
2019-09-23 14:18:30 -07:00
const matches = [ ] ;
2018-02-27 20:04:38 +00:00
for ( let i = 0 ; i < modules . length ; i ++ ) {
const m = modules [ i ] ;
2019-12-15 18:41:13 +00:00
if ( m . format === format && m . type === type ) {
2020-06-14 16:45:17 +00:00
if ( ! target && ! outputFormat ) {
2019-12-15 18:41:13 +00:00
matches . push ( m ) ;
2020-06-14 16:45:17 +00:00
} else if ( target && target === m . target ) {
matches . push ( m ) ;
} else if ( outputFormat && outputFormat === m . outputFormat ) {
2019-12-15 18:41:13 +00:00
matches . push ( m ) ;
}
}
2018-02-26 19:16:01 +00:00
}
2019-09-23 14:18:30 -07:00
2020-05-21 09:14:33 +01:00
const output = matches . find ( m = > ! ! m . isDefault ) ;
2019-09-23 14:18:30 -07:00
if ( output ) return output ;
return matches . length ? matches [ 0 ] : null ;
2018-02-25 17:01:16 +00:00
}
2020-11-12 19:13:28 +00:00
private modulePath ( module : Module ) {
2020-10-09 18:35:46 +01:00
let className = '' ;
if ( module . type === ModuleType . Importer ) {
className = module . importerClass || ` InteropService_Importer_ ${ toTitleCase ( module . format ) } ` ;
} else {
className = ` InteropService_Exporter_ ${ toTitleCase ( module . format ) } ` ;
}
2020-11-05 16:58:23 +00:00
return ` ./ ${ className } ` ;
2020-10-09 18:35:46 +01:00
}
2020-11-12 19:13:28 +00:00
private newModuleFromCustomFactory ( module : Module ) {
2020-10-09 18:35:46 +01:00
if ( module . type === ModuleType . Importer ) {
return new InteropService_Importer_Custom ( module ) ;
} else {
return new InteropService_Exporter_Custom ( module ) ;
}
}
2019-09-23 14:18:30 -07:00
/ * *
* NOTE TO FUTURE SELF : It might make sense to simply move all the existing
* formatters to the ` newModuleFromPath_ ` approach , so that there ' s only one way
* to do this mapping . This isn ' t a priority right now ( per the convo in :
* https : //github.com/laurent22/joplin/pull/1795#discussion_r322379121) but
* we can do it if it ever becomes necessary .
* /
2020-11-12 19:13:28 +00:00
newModuleByFormat_ ( type : ModuleType , format : string , outputFormat : ImportModuleOutputFormat = ImportModuleOutputFormat . Markdown ) {
2020-06-14 16:45:17 +00:00
const moduleMetadata = this . findModuleByFormat_ ( type , format , null , outputFormat ) ;
if ( ! moduleMetadata ) throw new Error ( _ ( 'Cannot load "%s" module for format "%s" and output "%s"' , type , format , outputFormat ) ) ;
2020-10-09 18:35:46 +01:00
let output = null ;
if ( moduleMetadata . isCustom ) {
output = this . newModuleFromCustomFactory ( moduleMetadata ) ;
} else {
2021-01-27 17:42:58 +00:00
const ModuleClass = shim . requireDynamic ( this . modulePath ( moduleMetadata ) ) . default ;
2020-10-09 18:35:46 +01:00
output = new ModuleClass ( ) ;
}
2019-09-23 14:18:30 -07:00
output . setMetadata ( moduleMetadata ) ;
2020-10-09 18:35:46 +01:00
2019-09-23 14:18:30 -07:00
return output ;
}
/ * *
* The existing ` newModuleByFormat_ ` fn would load by the input format . This
* was fine when there was a 1 - 1 mapping of input formats to output formats ,
* but now that we have 2 possible outputs for an ` enex ` input , we need to be
* explicit with which importer we want to use .
*
* https : //github.com/laurent22/joplin/pull/1795#pullrequestreview-281574417
* /
2020-11-12 19:13:28 +00:00
newModuleFromPath_ ( type : ModuleType , options : any ) {
2019-12-15 18:41:13 +00:00
const moduleMetadata = this . findModuleByFormat_ ( type , options . format , options . target ) ;
2020-11-17 14:50:28 +00:00
if ( ! moduleMetadata ) throw new Error ( _ ( 'Cannot load "%s" module for format "%s" and target "%s"' , type , options . format , options . target ) ) ;
2020-10-09 18:35:46 +01:00
let output = null ;
if ( moduleMetadata . isCustom ) {
output = this . newModuleFromCustomFactory ( moduleMetadata ) ;
} else {
2020-11-17 14:50:28 +00:00
const modulePath = this . modulePath ( moduleMetadata ) ;
2021-01-27 17:42:58 +00:00
const ModuleClass = shim . requireDynamic ( modulePath ) . default ;
2020-10-09 18:35:46 +01:00
output = new ModuleClass ( ) ;
}
output . setMetadata ( { options , . . . moduleMetadata } ) ;
2018-06-26 00:07:53 +01:00
return output ;
2020-11-17 14:50:28 +00:00
// let modulePath = options && options.modulePath ? options.modulePath : '';
// if (!modulePath) {
// const moduleMetadata = this.findModuleByFormat_(type, options.format, options.target);
// if (!moduleMetadata) throw new Error(_('Cannot load "%s" module for format "%s" and target "%s"', type, options.format, options.target));
// modulePath = this.modulePath(moduleMetadata);
// }
// const moduleMetadata = this.findModuleByFormat_(type, options.format, options.target);
// let output = null;
// if (moduleMetadata.isCustom) {
// output = this.newModuleFromCustomFactory(moduleMetadata);
// } else {
2021-01-27 17:42:58 +00:00
// const ModuleClass = shim.requireDynamic(modulePath).default;
2020-11-17 14:50:28 +00:00
// output = new ModuleClass();
// }
// output.setMetadata({ options, ...moduleMetadata });
// return output;
2018-02-26 18:43:50 +00:00
}
2020-11-12 19:13:28 +00:00
moduleByFileExtension_ ( type : ModuleType , ext : string ) {
2018-02-27 20:04:38 +00:00
ext = ext . toLowerCase ( ) ;
const modules = this . modules ( ) ;
for ( let i = 0 ; i < modules . length ; i ++ ) {
const m = modules [ i ] ;
if ( type !== m . type ) continue ;
2019-07-13 17:26:47 +01:00
if ( m . fileExtensions && m . fileExtensions . indexOf ( ext ) >= 0 ) return m ;
2018-02-27 20:04:38 +00:00
}
return null ;
2018-02-26 19:16:01 +00:00
}
2020-11-12 19:13:28 +00:00
async import ( options : ImportOptions ) : Promise < ImportExportResult > {
2019-07-29 15:43:53 +02:00
if ( ! ( await shim . fsDriver ( ) . exists ( options . path ) ) ) throw new Error ( _ ( 'Cannot find "%s".' , options . path ) ) ;
2018-02-26 19:16:01 +00:00
2020-10-09 18:35:46 +01:00
options = {
format : 'auto' ,
destinationFolderId : null ,
destinationFolder : null ,
. . . options ,
} ;
2018-02-25 17:01:16 +00:00
2018-03-09 20:59:12 +00:00
if ( options . format === 'auto' ) {
2020-10-09 18:35:46 +01:00
const module = this . moduleByFileExtension_ ( ModuleType . Importer , fileExtension ( options . path ) ) ;
2018-03-09 20:59:12 +00:00
if ( ! module ) throw new Error ( _ ( 'Please specify import format for %s' , options . path ) ) ;
2019-07-30 09:35:42 +02:00
// eslint-disable-next-line require-atomic-updates
2018-02-27 20:04:38 +00:00
options . format = module . format ;
2018-02-25 17:01:16 +00:00
}
if ( options . destinationFolderId ) {
const folder = await Folder . load ( options . destinationFolderId ) ;
2018-02-27 20:04:38 +00:00
if ( ! folder ) throw new Error ( _ ( 'Cannot find "%s".' , options . destinationFolderId ) ) ;
2019-07-30 09:35:42 +02:00
// eslint-disable-next-line require-atomic-updates
2018-02-26 18:43:50 +00:00
options . destinationFolder = folder ;
2018-02-25 17:01:16 +00:00
}
2020-11-12 19:13:28 +00:00
let result : ImportExportResult = { warnings : [ ] } ;
2018-02-25 17:01:16 +00:00
2020-11-17 14:50:28 +00:00
// let importer = null;
//
2020-10-17 11:35:51 +01:00
// Not certain the "modulePath" property still has any use at this point. Modules should be looked up
// based on their format and outputFormat.
2020-11-17 14:50:28 +00:00
// if (options.modulePath) {
// importer = this.newModuleFromPath_(ModuleType.Importer, options);
// } else {
// importer = this.newModuleByFormat_(ModuleType.Importer, options.format, options.outputFormat);
// }
const importer = this . newModuleByFormat_ ( ModuleType . Importer , options . format , options . outputFormat ) ;
2019-09-23 14:18:30 -07:00
2018-02-26 18:43:50 +00:00
await importer . init ( options . path , options ) ;
result = await importer . exec ( result ) ;
2018-02-25 17:01:16 +00:00
return result ;
2018-02-23 19:32:19 +00:00
}
2020-11-12 19:13:28 +00:00
async export ( options : ExportOptions ) : Promise < ImportExportResult > {
2020-10-09 18:35:46 +01:00
options = {
format : 'jex' ,
. . . options ,
} ;
2019-12-15 18:41:13 +00:00
2018-02-23 19:32:19 +00:00
const exportPath = options . path ? options.path : null ;
2018-06-10 19:15:40 +01:00
let sourceFolderIds = options . sourceFolderIds ? options . sourceFolderIds : [ ] ;
2018-02-23 19:32:19 +00:00
const sourceNoteIds = options . sourceNoteIds ? options . sourceNoteIds : [ ] ;
2020-11-12 19:13:28 +00:00
const result : ImportExportResult = { warnings : [ ] } ;
const itemsToExport : any [ ] = [ ] ;
2018-02-23 19:32:19 +00:00
2020-11-12 19:13:28 +00:00
const queueExportItem = ( itemType : number , itemOrId : any ) = > {
2018-02-23 19:32:19 +00:00
itemsToExport . push ( {
type : itemType ,
2019-07-29 15:43:53 +02:00
itemOrId : itemOrId ,
2018-02-23 19:32:19 +00:00
} ) ;
2019-07-29 15:43:53 +02:00
} ;
2018-02-23 19:32:19 +00:00
2020-03-13 23:46:14 +00:00
const exportedNoteIds = [ ] ;
2020-11-12 19:13:28 +00:00
let resourceIds : string [ ] = [ ] ;
2020-09-07 22:12:51 +01:00
// Recursively get all the folders that have valid parents
2021-01-22 17:41:11 +00:00
const folderIds = await Folder . childrenIds ( '' ) ;
2018-02-23 19:32:19 +00:00
2020-11-17 11:50:46 +00:00
if ( options . includeConflicts ) folderIds . push ( Folder . conflictFolderId ( ) ) ;
2018-06-10 19:15:40 +01:00
let fullSourceFolderIds = sourceFolderIds . slice ( ) ;
for ( let i = 0 ; i < sourceFolderIds . length ; i ++ ) {
const id = sourceFolderIds [ i ] ;
const childrenIds = await Folder . childrenIds ( id ) ;
fullSourceFolderIds = fullSourceFolderIds . concat ( childrenIds ) ;
}
sourceFolderIds = fullSourceFolderIds ;
2018-02-23 19:32:19 +00:00
for ( let folderIndex = 0 ; folderIndex < folderIds . length ; folderIndex ++ ) {
const folderId = folderIds [ folderIndex ] ;
if ( sourceFolderIds . length && sourceFolderIds . indexOf ( folderId ) < 0 ) continue ;
if ( ! sourceNoteIds . length ) await queueExportItem ( BaseModel . TYPE_FOLDER , folderId ) ;
2020-11-17 11:50:46 +00:00
const noteIds = await Folder . noteIds ( folderId , { includeConflicts : ! ! options . includeConflicts } ) ;
2018-02-23 19:32:19 +00:00
for ( let noteIndex = 0 ; noteIndex < noteIds . length ; noteIndex ++ ) {
const noteId = noteIds [ noteIndex ] ;
if ( sourceNoteIds . length && sourceNoteIds . indexOf ( noteId ) < 0 ) continue ;
const note = await Note . load ( noteId ) ;
await queueExportItem ( BaseModel . TYPE_NOTE , note ) ;
exportedNoteIds . push ( noteId ) ;
2018-05-03 13:11:45 +01:00
const rids = await Note . linkedResourceIds ( note . body ) ;
2018-02-23 19:32:19 +00:00
resourceIds = resourceIds . concat ( rids ) ;
}
}
2018-02-26 19:25:54 +00:00
resourceIds = ArrayUtils . unique ( resourceIds ) ;
2018-02-23 19:32:19 +00:00
for ( let i = 0 ; i < resourceIds . length ; i ++ ) {
await queueExportItem ( BaseModel . TYPE_RESOURCE , resourceIds [ i ] ) ;
}
const noteTags = await NoteTag . all ( ) ;
2020-03-13 23:46:14 +00:00
const exportedTagIds = [ ] ;
2018-02-23 19:32:19 +00:00
for ( let i = 0 ; i < noteTags . length ; i ++ ) {
const noteTag = noteTags [ i ] ;
if ( exportedNoteIds . indexOf ( noteTag . note_id ) < 0 ) continue ;
await queueExportItem ( BaseModel . TYPE_NOTE_TAG , noteTag . id ) ;
exportedTagIds . push ( noteTag . tag_id ) ;
}
for ( let i = 0 ; i < exportedTagIds . length ; i ++ ) {
await queueExportItem ( BaseModel . TYPE_TAG , exportedTagIds [ i ] ) ;
}
2020-10-09 18:35:46 +01:00
const exporter = this . newModuleFromPath_ ( ModuleType . Exporter , options ) ;
2020-01-24 21:46:48 +00:00
await exporter . init ( exportPath , options ) ;
2018-02-23 19:32:19 +00:00
2018-11-21 00:36:23 +00:00
const typeOrder = [ BaseModel . TYPE_FOLDER , BaseModel . TYPE_RESOURCE , BaseModel . TYPE_NOTE , BaseModel . TYPE_TAG , BaseModel . TYPE_NOTE_TAG ] ;
2020-11-12 19:13:28 +00:00
const context : any = {
2018-11-21 00:36:23 +00:00
resourcePaths : { } ,
} ;
for ( let typeOrderIndex = 0 ; typeOrderIndex < typeOrder . length ; typeOrderIndex ++ ) {
const type = typeOrder [ typeOrderIndex ] ;
2020-01-18 14:16:14 +01:00
await exporter . prepareForProcessingItemType ( type , itemsToExport ) ;
2018-11-21 00:36:23 +00:00
for ( let i = 0 ; i < itemsToExport . length ; i ++ ) {
const itemType = itemsToExport [ i ] . type ;
if ( itemType !== type ) continue ;
const ItemClass = BaseItem . getClassByItemType ( itemType ) ;
const itemOrId = itemsToExport [ i ] . itemOrId ;
const item = typeof itemOrId === 'object' ? itemOrId : await ItemClass . load ( itemOrId ) ;
if ( ! item ) {
if ( itemType === BaseModel . TYPE_RESOURCE ) {
result . warnings . push ( sprintf ( 'A resource that does not exist is referenced in a note. The resource was skipped. Resource ID: %s' , itemOrId ) ) ;
} else {
result . warnings . push ( sprintf ( 'Cannot find item with type "%s" and ID %s. Item was skipped.' , ItemClass . tableName ( ) , JSON . stringify ( itemOrId ) ) ) ;
}
continue ;
2018-02-23 19:32:19 +00:00
}
2020-09-17 10:00:13 +01:00
if ( item . encryption_applied || item . encryption_blob_encrypted ) {
result . warnings . push ( sprintf ( 'This item is currently encrypted: %s "%s" (%s) and was not exported. You may wait for it to be decrypted and try again.' , BaseModel . modelTypeToName ( itemType ) , item . title ? item.title : item.id , item . id ) ) ;
continue ;
}
2018-02-27 20:51:07 +00:00
2018-11-21 00:36:23 +00:00
try {
if ( itemType == BaseModel . TYPE_RESOURCE ) {
const resourcePath = Resource . fullPath ( item ) ;
context . resourcePaths [ item . id ] = resourcePath ;
exporter . updateContext ( context ) ;
await exporter . processResource ( item , resourcePath ) ;
}
2018-02-23 19:32:19 +00:00
2020-10-09 18:35:46 +01:00
await exporter . processItem ( itemType , item ) ;
2018-11-21 00:36:23 +00:00
} catch ( error ) {
2019-12-15 18:41:13 +00:00
console . error ( error ) ;
2018-11-21 00:36:23 +00:00
result . warnings . push ( error . message ) ;
}
2018-02-23 19:32:19 +00:00
}
}
await exporter . close ( ) ;
return result ;
}
}