simpler ENEX parsing

This commit is contained in:
zadam 2019-11-16 17:56:49 +01:00
parent f9b5e473f2
commit 95d0ad1cad
2 changed files with 13 additions and 28 deletions

View file

@ -74,8 +74,7 @@
"turndown": "5.0.3",
"turndown-plugin-gfm": "1.0.2",
"unescape": "1.0.1",
"ws": "7.2.0",
"xml2js": "0.4.22"
"ws": "7.2.0"
},
"devDependencies": {
"electron": "6.0.12",

View file

@ -1,7 +1,6 @@
const sax = require("sax");
const fileType = require('file-type');
const stream = require('stream');
const xml2js = require('xml2js');
const log = require("../log");
const utils = require("../utils");
const noteService = require("../notes");
@ -22,8 +21,6 @@ let resource;
async function importEnex(taskContext, file, parentNote) {
const saxStream = sax.createStream(true);
const xmlBuilder = new xml2js.Builder({ headless: true });
const parser = new xml2js.Parser({ explicitArray: true });
const rootNoteTitle = file.originalname.toLowerCase().endsWith(".enex")
? file.originalname.substr(0, file.originalname.length - 5)
@ -40,28 +37,20 @@ async function importEnex(taskContext, file, parentNote) {
// when we finish parsing. We use this to be sure that all saving has been finished before returning successfully.
const saveNotePromises = [];
/**
 * Parses an XML string using the `parser` instance from the enclosing scope,
 * adapting its Node-style callback API to a promise.
 *
 * @param {string} text - XML source handed to `parser.parseString`.
 * @returns {Promise<*>} Resolves with the value the parser passes to its callback;
 *                       rejects with the error the parser reports.
 */
async function parseXml(text) {
    const parsed = new Promise((resolve, reject) => {
        parser.parseString(text, (err, result) => {
            // error-first callback: a truthy first argument means parsing failed
            if (err) {
                reject(err);
                return;
            }

            resolve(result);
        });
    });

    return parsed;
}
function extractContent(content) {
const openingNoteIndex = content.indexOf('<en-note>');
function extractContent(enNote) {
// [] thing is workaround for https://github.com/Leonidas-from-XIV/node-xml2js/issues/484
let content = xmlBuilder.buildObject([enNote]);
if (openingNoteIndex !== -1) {
content = content.substr(openingNoteIndex + 9);
}
const endOfFirstTagIndex = content.indexOf('>');
const closingNoteIndex = content.lastIndexOf('</en-note>');
// strip the <0> and </0> tags
content = content.substr(endOfFirstTagIndex + 1, content.length - endOfFirstTagIndex - 5).trim();
if (closingNoteIndex !== -1) {
content = content.substr(0, closingNoteIndex);
}
content = content.trim();
// workaround for https://github.com/ckeditor/ckeditor5-list/issues/116
content = content.replace(/<li>\s+<div>/g, "<li>");
@ -202,10 +191,7 @@ async function importEnex(taskContext, file, parentNote) {
// make a copy because stream continues with the next async call and note gets overwritten
let {title, content, attributes, resources, utcDateCreated} = note;
const xmlObject = await parseXml(content);
// following is workaround for this issue: https://github.com/Leonidas-from-XIV/node-xml2js/issues/484
content = extractContent(xmlObject['en-note']);
content = extractContent(content);
const noteEntity = (await noteService.createNote(rootNote.noteId, title, content, {
attributes,