2019-07-30 09:35:42 +02:00
|
|
|
/* eslint-disable no-unused-vars */
|
|
|
|
|
2018-05-12 12:48:39 +02:00
|
|
|
|
2018-11-08 01:35:14 +02:00
|
|
|
const os = require('os');
|
2020-11-07 17:59:37 +02:00
|
|
|
const time = require('@joplin/lib/time').default;
|
|
|
|
const { filename } = require('@joplin/lib/path-utils');
|
2020-11-05 18:58:23 +02:00
|
|
|
const { asyncTest, fileContentEqual, setupDatabase, setupDatabaseAndSynchronizer, db, synchronizer, fileApi, sleep, clearDatabase, switchClient, syncTargetId, objectsEqual, checkThrowAsync } = require('./test-utils.js');
|
2020-11-07 17:59:37 +02:00
|
|
|
const Folder = require('@joplin/lib/models/Folder.js');
|
|
|
|
const Note = require('@joplin/lib/models/Note.js');
|
|
|
|
const BaseModel = require('@joplin/lib/BaseModel').default;
|
|
|
|
const shim = require('@joplin/lib/shim').default;
|
|
|
|
const HtmlToMd = require('@joplin/lib/HtmlToMd');
|
|
|
|
const { enexXmlToMd } = require('@joplin/lib/import-enex-md-gen.js');
|
2018-05-12 12:48:39 +02:00
|
|
|
|
|
|
|
// Log any promise rejection that nothing handled, so that a failure inside
// asynchronous test code is visible in the output.
//
// reason:  the value the promise was rejected with (usually an Error).
// promise: the promise that was rejected.
process.on('unhandledRejection', (reason, promise) => {
	console.log('Unhandled Rejection at: Promise', promise, 'reason:', reason);
});
|
|
|
|
|
|
|
|
// Fixture-driven tests for the HTML to Markdown converter: every `*.html`
// file found in the `html_to_md` directory is converted and compared against
// the `.md` file of the same base name.
describe('HtmlToMd', function() {

	// Run the shared test-utils setup for client 1 before each test.
	// The hook is a plain async function (no `done` callback): the test runner
	// awaits the returned promise, so a failure in setup is reported as an error
	// instead of leaving the hook to time out.
	beforeEach(async () => {
		await setupDatabaseAndSynchronizer(1);
		await switchClient(1);
	});

	it('should convert from Html to Markdown', asyncTest(async () => {
		const basePath = `${__dirname}/html_to_md`;
		const files = await shim.fsDriver().readDirStats(basePath);
		const htmlToMd = new HtmlToMd();

		for (let i = 0; i < files.length; i++) {
			const htmlFilename = files[i].path;

			// Only real HTML fixtures are inputs; the expected `.md` files and any
			// stray files (backups, etc.) in the same directory are skipped.
			if (!htmlFilename.endsWith('.html')) continue;

			// To debug a single fixture, temporarily skip all the others here, e.g.:
			//     if (htmlFilename !== 'joplin_source_2.html') continue;

			const htmlPath = `${basePath}/${htmlFilename}`;
			// The expected output sits next to the input, with `.md` appended to
			// whatever `filename()` returns for the fixture name (presumably the
			// name without its extension - see path-utils).
			const mdPath = `${basePath}/${filename(htmlFilename)}.md`;

			const htmlToMdOptions = {};

			if (htmlFilename === 'anchor_local.html') {
				// Normally the list of anchor names in the document are retrieved from the HTML code
				// This is straightforward when the document is still in DOM format, as with the clipper,
				// but otherwise it would need to be somehow parsed out from the HTML. Here we just
				// hard code the anchors that we know are in the file.
				htmlToMdOptions.anchorNames = ['first', 'second', 'fourth'];
			}

			// Fixtures whose name starts with `image_preserve_size` are converted
			// with the `preserveImageTagsWithSize` option switched on.
			if (htmlFilename.indexOf('image_preserve_size') === 0) {
				htmlToMdOptions.preserveImageTagsWithSize = true;
			}

			const html = await shim.fsDriver().readFile(htmlPath);
			let expectedMd = await shim.fsDriver().readFile(mdPath);

			let actualMd = await htmlToMd.parse(`<div>${html}</div>`, htmlToMdOptions);

			// On platforms where the native line ending is CRLF, normalise both
			// sides to LF so that the comparison only looks at the content.
			if (os.EOL === '\r\n') {
				expectedMd = expectedMd.replace(/\r\n/g, '\n');
				actualMd = actualMd.replace(/\r\n/g, '\n');
			}

			if (actualMd !== expectedMd) {
				// Dump both versions, including a line-by-line view, since
				// whitespace-only differences are hard to spot otherwise.
				console.info('');
				console.info(`Error converting file: ${htmlFilename}`);
				console.info('--------------------------------- Got:');
				console.info(actualMd);
				console.info('--------------------------------- Raw:');
				console.info(actualMd.split('\n'));
				console.info('--------------------------------- Expected:');
				console.info(expectedMd.split('\n'));
				console.info('--------------------------------------------');
				console.info('');
			}

			// Assert on the real values so that a failure report shows the actual
			// difference rather than a bare "expected false to be true".
			expect(actualMd).toBe(expectedMd);
		}
	}));

});
|