mirror of
https://github.com/Jermolene/TiddlyWiki5
synced 2024-11-29 12:59:56 +00:00
Fix: Evernote .enex image import (#7785)
* feat: add modifier info * feat: replace image and attachment with [img[] and [[]] * feat: import as wikitext tid * fix: a few resources don't have title * fix: use hash as random name for images * fix: Firefox's DOMParser have problem in some cases * fix: bad char in title, and useless xmlns * Update sample-enex-with-image.xml.enex * Update enex-deserializer.js * Update readme.tid * fix: some dont have modified
This commit is contained in:
parent
efa4f34131
commit
d3f5695601
@ -15,6 +15,7 @@ For details see: https://blog.evernote.com/tech/2013/08/08/evernote-export-forma
|
|||||||
"use strict";
|
"use strict";
|
||||||
|
|
||||||
// DOMParser = require("$:/plugins/tiddlywiki/xmldom/dom-parser").DOMParser;
|
// DOMParser = require("$:/plugins/tiddlywiki/xmldom/dom-parser").DOMParser;
|
||||||
|
var illegalFilenameCharacters = /[\[\]<>;\:\"\/\\\|\?\*\^\?\$\(\)\s~]/g;
|
||||||
|
|
||||||
/*
|
/*
|
||||||
Parse an ENEX file into tiddlers
|
Parse an ENEX file into tiddlers
|
||||||
@ -23,10 +24,13 @@ exports["application/enex+xml"] = function(text,fields) {
|
|||||||
// Collect output tiddlers in an array
|
// Collect output tiddlers in an array
|
||||||
var results = [];
|
var results = [];
|
||||||
// Parse the XML document
|
// Parse the XML document
|
||||||
var parser = new DOMParser(),
|
var doc = new DOMParser().parseFromString(text,"application/xml");
|
||||||
doc = parser.parseFromString(text,"application/xml");
|
|
||||||
// Output a report tiddler with information about the import
|
// Output a report tiddler with information about the import
|
||||||
var enex = doc.querySelector("en-export");
|
var enex = doc.querySelector("en-export");
|
||||||
|
if(!enex) {
|
||||||
|
// Firefox's DOMParser have problem in some cases.
|
||||||
|
throw new Error('Failed to parse ENEX file, no "en-export" node found, try use Chrome/Edge to export again.');
|
||||||
|
}
|
||||||
results.push({
|
results.push({
|
||||||
title: "Evernote Import Report",
|
title: "Evernote Import Report",
|
||||||
text: "Evernote file imported on " + enex.getAttribute("export-date") + " from " + enex.getAttribute("application") + " (" + enex.getAttribute("version") + ")"
|
text: "Evernote file imported on " + enex.getAttribute("export-date") + " from " + enex.getAttribute("application") + " (" + enex.getAttribute("version") + ")"
|
||||||
@ -34,47 +38,102 @@ exports["application/enex+xml"] = function(text,fields) {
|
|||||||
// Get all the "note" nodes
|
// Get all the "note" nodes
|
||||||
var noteNodes = doc.querySelectorAll("note");
|
var noteNodes = doc.querySelectorAll("note");
|
||||||
$tw.utils.each(noteNodes,function(noteNode) {
|
$tw.utils.each(noteNodes,function(noteNode) {
|
||||||
var result = {
|
var noteTitle = getTextContent(noteNode,"title");
|
||||||
title: getTextContent(noteNode,"title"),
|
// get real note content node
|
||||||
type: "text/html",
|
var contentNode = noteNode.querySelector("content")
|
||||||
|
var contentText = (contentNode.textContent || "").replace(/ /g, ' ').trim();
|
||||||
|
if(contentText) {
|
||||||
|
// The final content will be HTML instead of xml. And we will save it as wikitext, to make wiki syntax work, and remaining HTML will also work.
|
||||||
|
try {
|
||||||
|
// may error if content is not valid XML
|
||||||
|
contentNode = new DOMParser().parseFromString(contentText,"application/xml").querySelector("en-note") || contentNode;
|
||||||
|
} catch(e) {
|
||||||
|
// ignore
|
||||||
|
}
|
||||||
|
}
|
||||||
|
// process main content and metadata, and save as wikitext tiddler.
|
||||||
|
var noteResult = {
|
||||||
|
title: noteTitle.replace(illegalFilenameCharacters,"_"),
|
||||||
tags: [],
|
tags: [],
|
||||||
text: getTextContent(noteNode,"content"),
|
modified: convertDate(getTextContent(noteNode,"updated") || getTextContent(noteNode,"created")),
|
||||||
modified: convertDate(getTextContent(noteNode,"created")),
|
modifier: getTextContent(noteNode,"author"),
|
||||||
created: convertDate(getTextContent(noteNode,"created"))
|
created: convertDate(getTextContent(noteNode,"created")),
|
||||||
|
creator: getTextContent(noteNode,"author")
|
||||||
};
|
};
|
||||||
|
// process resources (images, PDFs, etc.)
|
||||||
|
$tw.utils.each(noteNode.querySelectorAll("resource"),function(resourceNode) {
|
||||||
|
// hash generated by applying https://github.com/vzhd1701/evernote-backup/pull/54
|
||||||
|
var hash = resourceNode.querySelector("data").getAttribute("hash");
|
||||||
|
var text = getTextContent(resourceNode,"data");
|
||||||
|
var mimeType = getTextContent(resourceNode,"mime");
|
||||||
|
var contentTypeInfo = $tw.config.contentTypeInfo[mimeType] || {extension:""};
|
||||||
|
var title = getTextContent(resourceNode,"resource-attributes>file-name")
|
||||||
|
// a few resources don't have title, use hash as fallback
|
||||||
|
title = title || (hash + contentTypeInfo.extension);
|
||||||
|
// replace all system reserved characters in title
|
||||||
|
title = title.replace(illegalFilenameCharacters,"_");
|
||||||
|
// prefix image title with note title, to avoid name conflicts which is quite common in web-clipped content
|
||||||
|
title = noteResult.title + "/" + title;
|
||||||
|
results.push({
|
||||||
|
title: title,
|
||||||
|
type: mimeType,
|
||||||
|
width: getTextContent(resourceNode,"width"),
|
||||||
|
height: getTextContent(resourceNode,"height"),
|
||||||
|
text: text,
|
||||||
|
// give image same modified and modifier as the note, so they can be grouped together in the "Recent"
|
||||||
|
modified: noteResult.modified,
|
||||||
|
modifier: noteResult.modifier,
|
||||||
|
created: noteResult.created,
|
||||||
|
creator: noteResult.creator
|
||||||
|
});
|
||||||
|
if(hash) {
|
||||||
|
fixAttachmentReference(contentNode, hash, mimeType, title);
|
||||||
|
}
|
||||||
|
});
|
||||||
|
// export mixed content of wikitext and HTML
|
||||||
|
noteResult.text = contentNode.innerHTML;
|
||||||
|
// remove all ` xmlns="http://www.w3.org/1999/xhtml"` attributes to save some space
|
||||||
|
noteResult.text = noteResult.text.replace(/ xmlns="http:\/\/www.w3.org\/1999\/xhtml"/g, "");
|
||||||
$tw.utils.each(noteNode.querySelectorAll("tag"),function(tagNode) {
|
$tw.utils.each(noteNode.querySelectorAll("tag"),function(tagNode) {
|
||||||
result.tags.push(tagNode.textContent);
|
noteResult.tags.push(tagNode.textContent);
|
||||||
});
|
});
|
||||||
// If there's an update date, set modifiy date accordingly
|
// If there's an update date, set modifiy date accordingly
|
||||||
var update = getTextContent(noteNode,"updated");
|
var update = getTextContent(noteNode,"updated");
|
||||||
if(update) {
|
if(update) {
|
||||||
result.modified = convertDate(update);
|
noteResult.modified = convertDate(update);
|
||||||
}
|
}
|
||||||
$tw.utils.each(noteNode.querySelectorAll("note-attributes>*"),function(attrNode) {
|
$tw.utils.each(noteNode.querySelectorAll("note-attributes>*"),function(attrNode) {
|
||||||
result[attrNode.tagName] = attrNode.textContent;
|
noteResult[attrNode.tagName] = attrNode.textContent;
|
||||||
});
|
|
||||||
results.push(result);
|
|
||||||
$tw.utils.each(noteNode.querySelectorAll("resource"),function(resourceNode) {
|
|
||||||
results.push({
|
|
||||||
title: getTextContent(resourceNode,"resource-attributes>file-name"),
|
|
||||||
type: getTextContent(resourceNode,"mime"),
|
|
||||||
width: getTextContent(resourceNode,"width"),
|
|
||||||
height: getTextContent(resourceNode,"height"),
|
|
||||||
text: getTextContent(resourceNode,"data")
|
|
||||||
});
|
|
||||||
});
|
});
|
||||||
|
results.push(noteResult);
|
||||||
});
|
});
|
||||||
// Return the output tiddlers
|
// Return the output tiddlers
|
||||||
return results;
|
return results;
|
||||||
};
|
};
|
||||||
|
|
||||||
function getTextContent(node,selector) {
|
function getTextContent(node,selector) {
|
||||||
return (node.querySelector(selector) || {}).textContent;
|
return (node.querySelector(selector) || {}).textContent || "";
|
||||||
}
|
}
|
||||||
|
|
||||||
function convertDate(isoDate) {
|
function convertDate(isoDate) {
|
||||||
return (isoDate || "").replace("T","").replace("Z","") + "000"
|
return (isoDate || "").replace("T","").replace("Z","") + "000"
|
||||||
}
|
}
|
||||||
|
|
||||||
|
function fixAttachmentReference(contentNode, md5Hash, mimeType, name) {
|
||||||
|
if(!contentNode) return;
|
||||||
|
var mediaNode = contentNode.querySelector('en-media[hash="' + md5Hash + '"]');
|
||||||
|
if(!name) {
|
||||||
|
throw new Error("name is empty for resource hash" + md5Hash);
|
||||||
|
}
|
||||||
|
if(!mediaNode) return;
|
||||||
|
if(mimeType.indexOf("image/") === 0) {
|
||||||
|
// find en-media node, replace with image syntax
|
||||||
|
mediaNode.parentNode.replaceChild($tw.utils.domMaker("p", {text: "[img["+ name + "]]"}), mediaNode);
|
||||||
|
} else {
|
||||||
|
// For other than image attachments, we make a link to the tiddler
|
||||||
|
mediaNode.parentNode.replaceChild($tw.utils.domMaker("p", {text: "[["+ name + "]]"}), mediaNode);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
})();
|
})();
|
||||||
|
@ -5,6 +5,7 @@ This plugin contains tool to assist migration of content from Evernote ENEX file
|
|||||||
!! Instructions
|
!! Instructions
|
||||||
|
|
||||||
# Download or save your ENEX file from Evernote
|
# Download or save your ENEX file from Evernote
|
||||||
|
## Use [ext[evernote-backup|https://github.com/vzhd1701/evernote-backup]] to export ENEX file with resource hash, so images can be linked in the note
|
||||||
# Rename the file to have an `.enex` extension
|
# Rename the file to have an `.enex` extension
|
||||||
# Drag the file into the TiddlyWiki browser window
|
# Drag the file into the TiddlyWiki browser window
|
||||||
## Alternatively, click the "Import" button in the "Tools" sidebar tab
|
## Alternatively, click the "Import" button in the "Tools" sidebar tab
|
||||||
|
File diff suppressed because one or more lines are too long
Loading…
Reference in New Issue
Block a user