ThisTest/translators/Endnote XML.js

1365 lines
54 KiB
JavaScript
Raw Normal View History

2022-03-23 12:58:01 +01:00
{
"translatorID": "eb7059a4-35ec-4961-a915-3cf58eb9784b",
"label": "Endnote XML",
"creator": "Sebastian Karcher",
"target": "xml",
"minVersion": "4.0",
"maxVersion": "",
"priority": 100,
"configOptions": {
"async": true,
"getCollections": true
},
"displayOptions": {
"exportNotes": true,
"exportFileData": false
},
"inRepository": true,
"translatorType": 3,
"browserSupport": "gcv",
"lastUpdated": "2018-06-12 09:00:41"
}
function detectImport() {
var doc = Zotero.getXML().documentElement;
if (!doc) {
return false;
} else if (ZU.xpathText(doc, '//record/ref-type')) {
return true;
}
}
//list of Endnote XML fields used for export (same for title, date, periodical, and author fields below)
var fields = ["database", "source-app", "rec-number", "ref-type", "contributors",
"auth-address", "auth-affiliaton", "titles", "periodical", "pages", "volume",
"number", "issue", "secondary-volume", "secondary-issue", "num-vols", "edition",
"section", "reprint-edition", "reprint-status", "keywords", "dates", "pub-location",
"publisher", "orig-pub", "isbn", "accession-num", "call-num", "report-id", "coden",
"electronic-resource-num", "abstract", "label", "image", "caption", "notes",
"research-notes", "work-type", "reviewed-item", "availability", "remote-source",
"meeting-place", "work-location", "work-extent", "pack-method", "size", "repro-ratio",
"remote-database-name", "remote-database-provider", "language", "urls", "access-date",
"modified-date", "custom1", "custom2", "custom3", "custom4", "custom5", "custom6",
"custom7", "misc1", "misc2", "misc3"
];
var titleFields = ["title", "secondary-title", "tertiary-title", "alt-title", "short-title",
"translated-title"
];
var dateFields = ["year", "pub-dates"];
var periodicalFields = ["full-title", "abbr-1", "abbr-2", "abbr-3"];
var authorFields = ["authors", "secondary-authors", "tertiary-authors", "subsidiary-authors",
"translated-authors"
];
var attachmentFields = ["pdf-urls", "text-urls", "related-urls", "image-urls"];
var processItemType = {
Artwork: "artwork",
"Audiovisual Material": "videoRecording",
Bill: "bill",
"Book Section": "bookSection",
Book: "book",
"Case": "case",
Catalog: "book",
"Computer Program": "computerProgram",
"Conference Proceedings": "conferencePaper", //still not clear on paper vs. proceedings
"Web Page": "webpage",
"Generic": "document",
"Hearing": "hearing",
"Journal Article": "journalArticle",
"Magazine Article": "magazineArticle",
Map: "map",
"Film or Broadcast": "film",
"Newspaper Article": "newspaperArticle",
Pamphlet: "manuscript",
Patent: "patent",
"Personal Communication": "letter",
Report: "report",
"Edited Book": "book",
Statute: "statute",
Thesis: "thesis",
"Unpublished Work": "manuscript",
Manuscript: "manuscript",
Figure: "artwork", //mapping
"Chart or Table": "artwork", //mapping?
"Equation": "artwork", //mapping?
"Electronic Article": "journalArticle",
"Electronic Book": "book",
"Online Database": "webpage",
"Government Document": "bill",
"Conference Paper": "presentation",
"Online Multimedia": "webpage",
"Classical Work": "book", //mapping once we have something comparable in Zotero
"Legal Rule or Regulation": "report", //or bill? statute?
"Ancient Text": "book", //mapping
Dictionary: "dictionaryEntry",
Encyclopedia: "encyclopediaArticle",
Grant: "report",
"Aggregated Database": "webpage", //mapping?
"Blog": "blogPost",
"Serial": "book", //should map to periodical once we have that
Standard: "report", //map to standard once we have that
Dataset: "report", //map to dataset once we have that
"Electronic Book Section": "bookSection",
Music: "audioRecording"
};
var processNumberType = {
2: "artwork",
3: "videoRecording",
4: "bill",
5: "bookSection",
6: "book",
7: "case",
8: "book",
9: "computerProgram",
10: "conferencePaper",
12: "webpage",
13: "document",
14: "hearing",
17: "journalArticle",
19: "magazineArticle",
20: "map",
21: "film",
23: "newspaperArticle",
24: "manuscript",
25: "patent",
26: "letter",
27: "report",
28: "book",
31: "statute",
32: "thesis",
34: "manuscript",
36: "manuscript",
37: "artwork",
38: "artwork",
39: "artwork",
43: "journalArticle",
44: "book",
45: "wepage",
46: "bill",
47: "conferencePaper",
48: "webpage",
49: "book",
50: "report",
51: "book",
52: "dictionaryEntry",
53: "encyclopediaArticle",
54: "report",
55: "webpage",
56: "blogPost",
57: "book",
58: "report",
59: "report",
60: "bookSection",
61: "audioRecording"
};
var exportItemType = {
artwork: "Artwork",
audioRecording: "Music",
bill: "Bill",
blogPost: "Blog",
book: "Book",
bookSection: "Book Section",
"case" :"Case",
computerProgram: "Computer Program",
conferencePaper: "Conference Proceedings",
dictionaryEntry: "Dictionary",
document: "Generic",
mail: "Personal Communication",
encyclopediaArticle: "Encyclopedia",
film: "Film or Broadcast",
forumPost: "Web Page",
hearing: "Hearing",
instantMessage: "Personal Communication",
interview: "Personal Communication",
journalArticle: "Journal Article",
letter: "Personal Communication",
magazineArticle: "Magazine Article",
manuscript: "Manuscript",
map: "Map",
newspaperArticle: "Newspaper Article",
patent: "Patent",
podcast: "Film or Broadcast",
presentation: "Conference Paper",
radioBroadcast: "Film or Broadcast",
report: "Report",
statute: "Statute",
thesis: "Thesis",
tvBroadcast: "Film or Broadcast",
videoRecording: "Audiovisual Material",
webpage: "Web Page"
};
var exportRefNumber = {
artwork: "2",
videoRecording: "3",
bill: "4",
blogPost: "56",
book: "6",
bookSection: "5",
"case": "6",
computerProgram: "9",
presentation: "47",
conferencePaper: "10",
dictionaryEntry: "52",
encyclopediaArticle: "53",
film: "21",
podcast: "21",
radioBroadcast: "21",
tvBroadcast: "21",
document: "13",
hearing: "14",
journalArticle: "17",
magazineArticle: "19",
manuscript: "36",
map: "20",
audioRecording: "61",
newspaperArticle: "23",
patent: "25",
email: "26",
instantMessage: "26",
interview: "26",
letter: "26",
report: "27",
statute: "31",
thesis: "32",
forumPost: "12",
webpage: "12"
};
var fieldMap = {
//same for all itemTypes
abstract: "abstractNote",
"call-num": "callNumber",
"electronic-resource-num": "DOI",
"remote-database-name": "libraryCatalog",
"abbr-1": "journalAbbreviation",
"short-title": "shortTitle",
"full-title": "publicationTitle",
language: "language",
"access-date": "accessDate",
//These two are in the RIS - not sure what they'd be in Endnote XML
//DB:"archive",
//AN:"archiveLocation",
//type specific
//tag => field:itemTypes
//if itemType not explicitly given, __default field is used
// unless itemType is excluded in __exclude
"title": {
"__default": "title",
subject: ["email"],
caseName: ["case"],
nameOfAct: ["statute"]
},
"secondary-title": {
code: ["bill", "statute"],
bookTitle: ["bookSection"],
blogTitle: ["blogPost"],
conferenceName: ["conferencePaper"],
dictionaryTitle: ["dictionaryEntry"],
encyclopediaTitle: ["encyclopediaArticle"],
committee: ["hearing"],
forumTitle: ["forumPost"],
websiteTitle: ["webpage"],
programTitle: ["radioBroadcast", "tvBroadcast"],
meetingName: ["presentation"],
seriesTitle: ["computerProgram", "map", "report"],
series: ["book"],
reporter: ["case"],
publicationTitle: ["journalArticle", "magazineArticle", "newspaperArticle"]
},
"tertiary-title": {
legislativeBody: ["hearing", "bill"],
series: ["bookSection", "conferencePaper"],
seriesTitle: ["audioRecording"]
},
//NOT HANDLED: reviewedAuthor, scriptwriter, contributor, guest
"authors": {
"__default": "author",
"artist": ["artwork"],
"cartographer": ["map"],
"composer": ["audioRecording"],
"director": ["film", "radioBroadcast", "tvBroadcast", "videoRecording"],
"interviewee": ["interview"],
"inventor": ["patent"],
"podcaster": ["podcast"],
"programmer": ["computerProgram"]
},
"secondary-authors": {
"sponsor": ["bill"],
"performer": ["audioRecording"],
"presenter": ["presentation"],
"interviewer": ["interview"],
"editor": ["journalArticle", "bookSection", "conferencePaper", "dictionaryEntry", "document",
"encyclopediaArticle"
],
"seriesEditor": ["book", "report"],
"recipient": ["email", "instantMessage", "letter"],
issuingAuthority: ["patent"]
},
"tertiary-authors": {
"cosponsor": ["bill"],
"producer": ["film", "tvBroadcast", "videoRecording", "radioBroadcast"],
"editor": ["book"],
"seriesEditor": ["bookSection", "conferencePaper", "dictionaryEntry", "encyclopediaArticle", "map"]
},
"subsidiary-authors": {
"__default": "translator",
"counsel": ["case"],
"castMember": ["radioBroadcast", "tvBroadcast", "videoRecording"],
"contributor": ["conferencePaper", "film"] //translator does not fit these
},
"work-type": {
"manuscriptType": ["manuscript"],
"websiteType": ["webpage"],
"genre": ["film"],
"postType": ["forumPost"],
"letterType": ["letter"],
"mapType": ["map"],
"presentationType": ["presentation"],
"reportType": ["report"],
"thesisType": ["thesis"]
},
custom1: {
filingDate: ["patent"], //not in spec
scale: ["map"],
place: ["conferencePaper"]
},
custom2: {
issueDate: ["patent"]
//PMCID:["journalArticle"] //handled below since we don't actually have that variable (yet)
},
custom3: {
artworkSize: ["artwork"],
proceedingsTitle: ["conferencePaper"],
runningTime: ["videoRecording"],
country: ["patent"]
},
custom4: {
//RIS has this, but I can't find any reason for that: "creators/wordsBy":["audioRecording"],
"creators/attorneyAgent":["patent"], //we're not using this for export
genre: ["film"]
},
custom5: {
references: ["patent"],
audioRecordingFormat: ["audioRecording", "radioBroadcast"],
videoRecordingFormat: ["film", "tvBroadcast", "videoRecording"]
},
custom6: {
legalStatus: ["patent"],
},
"pub-location": {
"__default": "place",
"__exclude": ["conferencePaper"] //exported/imported as "custom1"
},
"pub-dates": { //also see year when editing
"__default": "date",
dateEnacted: ["statute"],
dateDecided: ["case"],
issueDate: ["patent"]
},
edition: {
"__default": "edition",
// "__ignore":["journalArticle"], //EPubDate.
session: ["bill", "hearing", "statute"],
version: ["computerProgram"]
},
issue: {
"__default": "issue",
numberOfVolumes: ["bookSection"]
},
misc1: {
seriesNumber: ["book"],
billNumber: ["bill"],
system: ["computerProgram"],
documentNumber: ["hearing"],
applicationNumber: ["patent"],
publicLawNumber: ["statute"],
episodeNumber: ["podcast", "radioBroadcast", "tvBroadcast"]
},
misc2: {
manuscriptType: ["manuscript"],
mapType: ["map"],
reportType: ["report"],
thesisType: ["thesis"],
websiteType: ["blogPost", "webpage"],
postType: ["forumPost"],
letterType: ["letter"],
interviewMedium: ["interview"],
presentationType: ["presentation"],
artworkMedium: ["artwork"],
audioFileType: ["podcast"]
},
"num-vols": {
"__default": "numberOfVolumes",
"__exclude": ["bookSection"] //uses "issue" instead
},
"orig-pub": {
history: ["hearing", "statute", "bill", "case"],
priorityNumbers: ["patent"]
},
publisher: {
"__default": "publisher",
label: ["audioRecording"],
court: ["case"],
distributor: ["film"],
assignee: ["patent"],
institution: ["report"],
university: ["thesis"],
company: ["computerProgram"],
studio: ["videoRecording"],
network: ["radioBroadcast", "tvBroadcast"]
},
year: { //duplicate of pud-dates, but this will only output year
"__default": "date",
dateEnacted: ["statute"],
dateDecided: ["case"],
issueDate: ["patent"]
},
section: {
"__default": "section", //though this can refer to pages, start page, etc. for some types. Zotero does not support any of those combinations, however.
"__exclude": ["case"]
},
isbn: {
"__default": "ISBN",
ISSN: ["journalArticle", "magazineArticle", "newspaperArticle"],
patentNumber: ["patent"],
reportNumber: ["report"],
},
pages: {
"__default": "pages",
codePages: ["bill"], //bill
numPages: ["book", "thesis", "manuscript"],
firstPage: ["case"],
runningTime: ["film"]
},
number: {
seriesNumber: ["bookSection", "book"],
issue: ["journalArticle", "magazineArticle"],
docketNumber: ["case"],
artworkSize: ["artwork"]
},
volume: {
"__default": "volume",
codeNumber: ["statute"],
codeVolume: ["bill"],
reporterVolume: ["case"],
"__exclude": ["patent", "webpage"]
}
};
var cache = {};
function getField(field, type) {
if (!cache[type]) cache[type] = {};
//retrieve from cache if available
//it can be false if previous search did not find a mapping
if (cache[type][field] !== undefined) {
return cache[type][field];
}
var zfield = false;
if (typeof (fieldMap[field]) == 'object') {
var def, exclude = false;
for (var f in fieldMap[field]) {
//__ignore is not handled here. It's returned as a Zotero field so it
//can be explicitly excluded from the note attachment
if (f == "__default") {
//store default mapping in case we can't find anything explicit
def = fieldMap[field][f];
continue;
}
if (f == "__exclude") {
if (fieldMap[field][f].indexOf(type) != -1) {
exclude = true; //don't break. Let explicit mapping override this
}
continue;
}
if (fieldMap[field][f].indexOf(type) != -1) {
zfield = f;
break;
}
}
//assign default value if not excluded
if (!zfield && def && !exclude) zfield = def;
} else if (typeof (fieldMap[field]) == 'string') {
zfield = fieldMap[field];
}
cache[type][field] = zfield;
return zfield;
}
function doImport() {
if (typeof Promise == 'undefined') {
startImport(
function () {},
function (e) {
throw e;
}
);
}
else {
return new Promise(function (resolve, reject) {
startImport(resolve, reject);
});
}
}
function startImport(resolve, reject) {
try {
var xml = Zotero.getXML();
var records = ZU.xpath(xml, "//record");
importNext(records, 0, resolve, reject);
}
catch (e) {
reject(e);
}
}
function importNext(records, index, resolve, reject) {
try {
//Z.debug(records.length)
for (var i = index, n = records.length; i < n; i++) {
Z.setProgress(i/n*100);
var record = records[i];
newItem = new Zotero.Item();
//we prefer the name of the ref-type as it e.g. works with Mendeley and probably other Endnote 7 exports
newItem.itemType = processItemType[ZU.xpathText(record, './/ref-type/@name')];
//fall back to ref-type number
if (!newItem.itemType) newItem.itemType = processNumberType[ZU.xpathText(record, './/ref-type')];
//fall back to journal Article if all else fails
if (!newItem.itemType) newItem.itemType = "journalArticle";
var notecache = [];
//Z.debug(newItem.itemType)
for (var j = 0; j < record.children.length; j++) {
var node = record.children[j];
var field = node.nodeName;
var zfield;
if (zfield = getField(field, newItem.itemType)) {
if (zfield.indexOf("creators") != -1) {
var authortype = zfield.replace(/creators\//, "");
newItem.creators.push(ZU.cleanAuthor(node.textContent, authortype))
} else if (ZU.fieldIsValidForType(zfield, newItem.itemType)) {
if (zfield == 'abstractNote') {
// Preserve newlines
newItem[zfield] = processField(node, true)
.replace(/\r\n?/g, '\n');
} else {
newItem[zfield] = processField(node);
}
}
else {
notecache.push(field + ": " + processField(node));
}
} else if (field == "titles" || field == "periodical" || field == "alt-periodical") {
for (var k = 0; k < node.children.length; k++) {
var subnode = node.children[k];
var subfield = subnode.nodeName;
if (zfield = getField(subfield, newItem.itemType)) {
//Z.debug(zfield)
if (ZU.fieldIsValidForType(zfield, newItem.itemType)) {
newItem[zfield] = processField(subnode);
}
else {
notecache.push(field + ": " + processField(subnode));
}
} else {
notecache.push(subfield + ": " + processField(subnode));
}
}
} else if (field == "contributors") {
for (var k = 0; k < node.children.length; k++) {
var subnode = node.children[k];
var subfield = subnode.nodeName;
var authortype;
if (authortype = getField(subfield, newItem.itemType)) {
var creators = subnode.getElementsByTagName("author");
for (var l = 0; l < creators.length; l++) {
if (authortype) {
newItem.creators.push(ZU.cleanAuthor(creators[l].textContent, authortype, true));
}
else {
notecache.push(subfield + ": " + processField(subnode));
}
}
} else {
notecache.push(subfield + ": " + processField(subnode));
}
}
} else if (field == "dates") {
var date = node.getElementsByTagName("pub-dates");
var year = node.getElementsByTagName("year");
if (date.length > 0 && year.length > 0) {
date = date[0].getElementsByTagName("date")[0].textContent.trim();
year = year[0].textContent.trim();
if (date.search(/\d{4}/) != -1) newItem.date = date;
else newItem.date = date + " " + year;
} else if (date.length > 0) {
newItem.date = date[0].firstChild.textContent;
} else if (year.length > 0) {
newItem.date = year[0].textContent;
} else if (node.textContent.trim().length > 0) {
//there is only copyright note left;
notecache.push("copyright-dates: " + node.textContent)
}
} else if (field == "notes" || field == "research-notes") {
newItem.notes.push(
'<p>' + processField(node, true, 'note')
.split(/(?:\r\n|\r(?!\n)|\n){2,}/) // Double newlines (or more) are paragraphs
.join('</p><p>')
.replace(/[\r\n]+/g, '<br/>') // Single newlines are just new lines
+ '</p>'
);
} else if (field == "keywords") {
for (var k = 0; k < node.children.length; k++) {
var subnode = node.children[k];
newItem.tags.push(subnode.textContent.trim())
}
} else if (field == "urls") {
for (var k = 0; k < node.children.length; k++) {
var subnode = node.children[k];
var attachmenttype = "";
switch (subnode.nodeName){
case "text-urls":
case "related-urls":
attachmenttype="text/html";
break;
case "web-urls":
attachmenttype="url";
break;
case "pdf-urls":
attachmenttype="application/pdf";
}
for (var l = 0; l < subnode.children.length; l++) {
if (subnode.children[l].nodeType == 3) continue;
var filepath = subnode.children[l].textContent;
if (!filepath) continue
//support for EndNote's relative paths
filepath = filepath.replace(/^internal-pdf:\/\//i, 'PDF/').trim();
var filename = filepath.replace(/.+\//, "").replace(/\.[^\.]+$/, "");
if (attachmenttype == "url") {
newItem.url = subnode.textContent;
} else {
newItem.attachments.push({
title: filename,
path: filepath,
mimeType: attachmenttype
})
}
}
}
} else if (field.search(/custom[237]/) != -1 &&
(newItem.itemType == "book" || newItem.itemType == "bookSection" || newItem.itemType == "journalArticle")) {
//it'd be nice if we could do PMIDs as well, but doesn't look like they're mapped and we can't test for them reliably
if (node.textContent.search(/PMC\d+/i) != -1) {
newItem.extra = "PMCID: " + node.textContent.match(/PMC\d+/i)[0];
}
} else if (field == "database" || field == "source-app" || field == "rec-number" || field == "ref-type"
|| field == "foreign-keys"){
//skipping these fields
} else {
notecache.push(node.nodeName + ": " + processField(node));
}
}
if (notecache.length > 0){
newItem.notes.push({note: "The following values have no corresponding Zotero field:<br/>" + notecache.join("<br/>"), tags: ['_EndnoteXML import']})
}
var maybePromise = newItem.complete();
if (maybePromise) {
maybePromise.then(function () {
importNext(records, i + 1, resolve, reject);
});
return;
}
}
}
catch (e) {
reject(e);
}
resolve();
}
function doExport() {
Zotero.setCharacterSet("utf-8");
var parser = new DOMParser();
var doc = parser.parseFromString('<xml/>', 'application/xml');
var records = doc.createElement("records");
var item;
while (item = Zotero.nextItem()) {
// Don't export notes or standalone attachments
if (item.itemType === "note" || item.itemType === "attachment") continue;
var record = doc.createElement("record");
for (var f=0; f<fields.length; f++) {
switch (fields[f]) {
case 'database':
mapProperty(record, "database", "MyLibrary", {
"name": "MyLibrary"
});
break;
case 'source-app':
mapProperty(record, "source-app", "Zotero", {
"name": "Zotero"
});
break;
case 'ref-type':
var type = exportItemType[item.itemType];
var typeNumber = exportRefNumber[item.itemType];
mapProperty(record, "ref-type", typeNumber, {
"name": type
})
break;
case 'titles':
var titles = doc.createElement("titles");
for (var i = 0; i < titleFields.length; i++) {
var titleField = titleFields[i];
var zfield = getField(titleField, item.itemType);
if (item[zfield]) mapProperty(titles, titleField, item[zfield]);
}
record.appendChild(titles);
break;
case 'contributors':
if (item.creators.length > 0) {
var contributors = doc.createElement("contributors");
for (var i = 0; i < authorFields.length; i++) {
var custom4 =[];
var creatornode = doc.createElement(authorFields[i]);
var type = getField(authorFields[i], item.itemType);
for (var j = 0; j < item.creators.length; j++) {
if (item.creators[j].creatorType == type) {
var name = item.creators[j].lastName;
if (item.creators[j].firstName) name += ", " + item.creators[j].firstName;
mapProperty(creatornode, "author", name);
}
//deal with creators that are mapped to regular fields, currently only one
else if (item.creators[j].creatorType=="attorneyAgent") {
var name = item.creators[j].lastName;
if (item.creators[j].firstName) name += ", " + item.creators[j].firstName;
custom4.push(name);
}
}
if (creatornode.hasChildNodes()) {
contributors.appendChild(creatornode);
}
}
if (custom4.length>0){
mapProperty(record, "custom4", custom4.join("; "));
}
record.appendChild(contributors);
}
break;
case 'dates':
var dates = doc.createElement("dates");
var zfield = getField("pub-dates", item.itemType);
if (item[zfield]) {
var dateobject = ZU.strToDate(item[zfield]);
if (dateobject.year) mapProperty(dates, "year", dateobject.year);
var pubdates = doc.createElement("pub-dates");
dates.appendChild(pubdates);
mapProperty(pubdates, "date", item[zfield]);
}
record.appendChild(dates);
break;
case 'periodical':
var periodical = doc.createElement("periodical");
var zfield = getField("full-title", item.itemType);
if (item[zfield]) {
mapProperty(periodical, "full-title", item[zfield]);
}
var zfield = getField("abbr-1", item.itemType);
if (item[zfield]) {
mapProperty(periodical, "abbr-1", item[zfield]);
}
if (periodical.children.length > 0) record.appendChild(periodical);
break;
case 'keywords':
if (item.tags.length > 0) {
var keywords = doc.createElement("keywords");
for (var i = 0; i < item.tags.length; i++) {
mapProperty(keywords, "keyword", item.tags[i].tag);
}
record.appendChild(keywords);
}
break;
case 'research-notes':
if (item.notes && item.notes.length && Zotero.getOption("exportNotes")) {
mapProperty(record, "research-notes",
item.notes.reduce(function(s, n) {
return s + '<p>' + n.note + '</p>'; // EndNote only supports a single note field, so concatenate all notes into one
}, '')
);
}
break;
case 'urls':
var urls = doc.createElement("urls");
if (item.url) {
var weburls = doc.createElement("web-urls");
urls.appendChild(weburls);
mapProperty(weburls, "url", item.url);
}
if (item.attachments.length) {
var pdfurls = doc.createElement("pdf-urls");
var texturls = doc.createElement("text-urls");
var exportFileData = Zotero.getOption("exportFileData");
for (var i=0; i< item.attachments.length; i++) {
var attachment = item.attachments[i];
var path;
if ( exportFileData && attachment.saveFile) {
path = attachment.defaultPath.replace(/^files\//, '');
attachment.saveFile('PDF/' + path, true);
path = 'internal-pdf://' + path;
} else {
path = attachment.localPath || attachment.url;
}
if (!path) continue;
if (attachment.mimeType == "application/pdf") {
mapProperty(pdfurls, "url", path);
} else {
mapProperty(texturls, "url", path);
}
}
if (pdfurls.children.length) urls.appendChild(pdfurls);
if (texturls.children.length) urls.appendChild(texturls);
}
if (urls.children.length) record.appendChild(urls);
break;
default:
var zfield = getField(fields[f], item.itemType);
//Z.debug(fields[f] + ": " + zfield);
if (item[zfield]) mapProperty(record, fields[f], item[zfield]);
}
}
records.appendChild(record);
}
doc.documentElement.appendChild(records);
Zotero.write('<?xml version="1.0" encoding="UTF-8"?>\n');
var serializer = new XMLSerializer();
Zotero.write(serializer.serializeToString(doc)
.replace(/\r\n?|\n/g, '&#xD;') // Follow EndNote convention for newlines (carriage return entity)
);
}
//******IMPORT Functions
/**
* Convert XML style elements to Zotero HTML mark-up
* Works with nested style nodes or with multiple styling descriptors in a single face attribute
*
* @param {node} a DOM element
*
* @return {String} String with HTML mark-up
*/
var en2zMap = {
italic: 'i',
bold: 'b',
superscript: 'sup',
subscript: 'sub'
};
var en2zNoteMap = Object.create(en2zMap);
en2zNoteMap.underline = 'u';
function htmlify(nodes, field) {
var htmlstr = "",
formatting = [],
map = field == 'note' ? en2zNoteMap : en2zMap;
if (nodes.childNodes.length == 1 && nodes.childNodes[0].nodeType == 3) {
//single text node
return nodes.textContent;
}
for (var i=0; i<nodes.children.length; i++) {
var node = nodes.children[i];
var face = node.getAttribute('face')
if (face) {
face = face.split(/\s+/)
//filter out tags we don't care about
.filter(function(f) { return !!map[f] });
} else {
face = [];
}
//see what we're closing
var closing = [];
for (var j=0; j<formatting.length; j++) {
if (face.indexOf(formatting[j]) == -1) {
closing.push(map[formatting[j]]);
formatting.splice(j,1);
j--;
}
}
if (closing.length) htmlstr += '</' + closing.reverse().join('></') + '>';
//see what we're opening
var opening = [];
for (var j=0; j<face.length; j++) {
if (!map[face[j]]) continue;
if (formatting.indexOf(face[j]) == -1) {
opening.push(map[face[j]]);
formatting.push(face[j]);
}
}
if (opening.length) htmlstr += '<' + opening.join('><') + '>';
htmlstr += node.textContent;
}
//close left-over tags
var closing = [];
for (var j=0; j<formatting.length; j++) {
closing.push(map[formatting[j]]);
}
if (closing.length) htmlstr += '</' + closing.reverse().join('></') + '>';
return htmlstr;
}
/**
* Convert Endnote XML style elements to text, if applicable including Zotero HTML mark-up
* @param {node} a DOM element
*
* @return {String} The text content
*/
function processField(node, keepNewlines, field) {
if (!node.textContent) {
return '';
} else {
var content = htmlify(node, field);
//don't remove line breaks from abstracts
if (keepNewlines) return content;
else return ZU.trimInternal(content);
}
}
//**********EXPORT Functions
/**
* If property is defined, this function adds an appropriate XML element as a child of
* parentElement. Also converts elements with html mark-up to EndnoteXML style mark-up.
* @param {Element} parentElement The parent of the new element to be created.
* @param {String} elementName The name of the new element to be created.
* @param {Any} property The property to inspect. If this property is defined and not
* null, false, or empty, a new element is created whose textContent is its value.
* @param {Object} [attributes] If defined, this object defines attributes to be added
* to the new element.
*/
function mapProperty(parentElement, elementName, property, attributes) {
if (!property && property !== 0) return null;
var doc = parentElement.ownerDocument,
newElement = doc.createElement(elementName);
if (attributes) {
for (var i in attributes) {
newElement.setAttribute(i, attributes[i]);
}
}
var nodes = convertZoteroMarkup(property);
if (nodes.length == 1 && nodes[0].getAttribute('face') == 'normal') {
//no special formatting, skip the outer style node
newElement.appendChild(nodes[0].firstChild);
} else {
for (var i=0; i<nodes.length; i++) {
newElement.appendChild(nodes[i]);
}
}
parentElement.appendChild(newElement);
return newElement;
}
/**
* Convert Zotero rich text markup to EndNote XML
*
* @param {String} str String to convert
*/
var convertZoteroMarkup = (function() {
//mapping Zotero mark-up to EndNote
var map = {
I: ['italic'],
EM: ['italic'], // TinyMCE
B: ['bold'],
STRONG: ['bold'], // TinyMCE
SUP: ['superscript'],
SUB: ['subscript'],
U: ['underline'], // Because we import it this way into notes
SC: [],
SPAN: ['span']
};
var doc = (new DOMParser()).parseFromString('<foo/>', 'application/xml');
function createFormattedNode(str, format) {
var node = doc.createElement('style');
str = str.replace(/\n{3,}/g, '\n\n'); // Possible if some tags were skipped
if (format.length) {
node.setAttribute('face', format.join(' '));
} else {
node.setAttribute('face', 'normal');
}
node.appendChild(doc.createTextNode(str));
return node;
}
var tagRe = /<(\/?)(\w+)(\s[^>]*)?>/gi;
return function(str) {
// Paragraphs and line breaks get converted to newlines
str = str.replace(/\s*<br\s*\/?>\s*/gi, '\n')
.replace(/(?:\s*<\/p>\s*)+/gi, '\n\n')
.replace(/\s*<p(?:\s.*?)?>\s*/gi, '\n\n')
.trim();
var tags = [],
formatting = [],
currentStr = '',
nextStrStart = 0,
nodes = [],
m;
while (m = tagRe.exec(str)) {
var tagName = m[2].toUpperCase(),
format = map[tagName] || [],
oldFormatting;
if (!m[1]) {
//opening tag
// If "span", need to inspect contents of style attribute
if (tagName == 'SPAN' && m[3] && /\bstyle\s*=/i.test(m[3])) {
// Currently we're only aware of "text-decoration: underline" that is used in tinyMCE
if (/text-decoration\s*:[^'";]*\bunderline\b/.test(m[3])) {
format = ['underline'];
} else {
format = []; // Just drop it
}
}
var formatDiff = ZU.arrayDiff(format, formatting); //only consider new formatting
//push tag so that we know what we're closing later
tags.push({
tagName: tagName,
format: formatDiff
});
oldFormatting = formatting;
formatting = formatting.concat(formatDiff);
} else {
//closing tag
//see if we opened this kind of tag
var j;
for (j=tags.length-1; j>=0; j--) {
if (tags[j].tagName == tagName) break;
}
if (j<0) continue; //never opened. Skip closing tag
//close up tags
var tag, formatDiff = [];
do {
tag = tags.pop();
formatDiff = formatDiff.concat(tag.format);
} while (tag.tagName != tagName);
oldFormatting = formatting;
formatting = ZU.arrayDiff(formatting, formatDiff);
}
//attach substring up to tag
if (nextStrStart < m.index) currentStr += str.substring(nextStrStart, m.index);
nextStrStart = tagRe.lastIndex; //just past the current tag
if (formatDiff.length && currentStr) {
//formatting is changing, create a node for current formatting
nodes.push(createFormattedNode(currentStr, oldFormatting));
currentStr = '';
}
}
if (nextStrStart < str.length) currentStr += str.substring(nextStrStart);
if (currentStr) nodes.push(createFormattedNode(currentStr, formatting));
return nodes;
};
})();
/** BEGIN TEST CASES **/
var testCases = [
{
"type": "import",
"input": "<?xml version=\"1.0\" encoding=\"UTF-8\"?>\n<xml>\n <records>\n <record>\n <database name=\"endnote.enl\" path=\"endnote.enl\">endnote.enl</database>\n <ref-type name=\"Report\">10</ref-type>\n <contributors>\n <authors>\n <author>Ahlquist, John S</author>\n <author>Breunig, Christian</author>\n </authors>\n </contributors>\n <titles>\n <title>Country Clustering in Comparative Political Economy</title>\n </titles>\n <periodical/>\n <pages>32</pages>\n <keywords/>\n <dates>\n <year>2009</year>\n </dates>\n <pub-location>Cologne</pub-location>\n <urls>\n <pdf-urls>\n <url>internal-pdf://Ahlquist and Breunig _ 2009 _ Country Clustering in Comparative Political Econom.pdf</url>\n </pdf-urls>\n </urls>\n </record>\n <record>\n <database name=\"endnote.enl\" path=\"endnote.enl\">endnote.enl</database>\n <ref-type name=\"Book\">1</ref-type>\n <contributors>\n <authors>\n <author>Dunnett, Nigel</author>\n <author>Kingsbury, Noël</author>\n </authors>\n </contributors>\n <titles>\n <title>Planting green roofs and living walls</title>\n </titles>\n <periodical/>\n <edition>2</edition>\n <keywords/>\n <dates>\n <year>2008</year>\n </dates>\n <pub-location>Portland, OR</pub-location>\n <publisher>Timber Press</publisher>\n <isbn>0881929115</isbn>\n <urls/>\n <abstract>The latest techniques for planting roofs and walls to enhance our buildings and benefit the environment. The green roof industry is booming and the technology changing fast as professionals respond to the unique challenges of each new planting. In this comprehensively updated, fully revised edition of their authoritative reference, Nigel Dunnett and Nol Kingsbury reveal the very latest techniques, materials, and plants, and showcase some spectacular new case studies for the non-professional. Green roofs and walls reduce pollution and runoff, help insulate and reduce the maintenance needs of buildings, contribute to biodiversity, and provide habitats for wildlife. In addition to all this, they are attractive to look at and enhance the quality of life of residents. In Planting Green Roofs and Living Walls, Revised and Updated Edition, the authors describe and illustrate the practical techniques required to design, implement, and maintain a green roof or wall to the highest standards. This informative, up-to-the-minute reference will encourage gardeners everywhere to consider the enormous benefits to be gained from planting on their roofs and walls.</abstract>\n </record>\n <record>\n <database name=\"endnote.enl\" path=\"endnote.enl\">endnote.enl</database>\n <ref-type name=\"Journal Article\">0</ref-type>\n <contributors>\n <authors>\n <author>Foderaro, Lisa W</author>\n </authors>\n </contributors>\n <titles>\n <title>Rooftop greenhouse will boost city farming</title>\n <secondary-title>New York Times</secondary-title>\n </titles>\n <periodical>\n <full-title>New York Times</full-title>\n </periodical>\n <pages>A20</pages>\n <keywords/>\n <dates>\n <year>2012</year>\n </dates>\n <pub-location>New York</pub-location>\n <urls/>\n </record>\n <record>\n <database name=\"endnote.enl\" path=\"endnote.enl\">endnote.enl</database>\n <ref-type name=\"Book\">1</ref-type>\n <contributors>\n <secondary-authors>\n <author>Hancké, Bob</author>\n <author>Rhodes, Martin</author>\n <author>Thatcher, Mark</author>\n </secondary-authors>\n </contributors>\n <titles>\n <title>Beyond varieties of capitalism : Conflict, contradiction, and complementarities in the European economy</title>\n <short-title>Beyond varieties of capitalism</short-title>\n </titles>\n <periodical/>\n <key
"items": [
{
"itemType": "report",
"title": "Country Clustering in Comparative Political Economy",
"creators": [
{
"firstName": "John S.",
"lastName": "Ahlquist",
"creatorType": "author"
},
{
"firstName": "Christian",
"lastName": "Breunig",
"creatorType": "author"
}
],
"date": "2009",
"pages": "32",
"place": "Cologne",
"attachments": [
{
"title": "Ahlquist and Breunig _ 2009 _ Country Clustering in Comparative Political Econom",
"path": "PDF/Ahlquist and Breunig _ 2009 _ Country Clustering in Comparative Political Econom.pdf",
"mimeType": "application/pdf"
}
],
"tags": [],
"notes": [],
"seeAlso": []
},
{
"itemType": "book",
"title": "Planting green roofs and living walls",
"creators": [
{
"firstName": "Nigel",
"lastName": "Dunnett",
"creatorType": "author"
},
{
"firstName": "Noël",
"lastName": "Kingsbury",
"creatorType": "author"
}
],
"date": "2008",
"ISBN": "0881929115",
"abstractNote": "The latest techniques for planting roofs and walls to enhance our buildings and benefit the environment. The green roof industry is booming and the technology changing fast as professionals respond to the unique challenges of each new planting. In this comprehensively updated, fully revised edition of their authoritative reference, Nigel Dunnett and Nol Kingsbury reveal the very latest techniques, materials, and plants, and showcase some spectacular new case studies for the non-professional. Green roofs and walls reduce pollution and runoff, help insulate and reduce the maintenance needs of buildings, contribute to biodiversity, and provide habitats for wildlife. In addition to all this, they are attractive to look at and enhance the quality of life of residents. In Planting Green Roofs and Living Walls, Revised and Updated Edition, the authors describe and illustrate the practical techniques required to design, implement, and maintain a green roof or wall to the highest standards. This informative, up-to-the-minute reference will encourage gardeners everywhere to consider the enormous benefits to be gained from planting on their roofs and walls.",
"edition": "2",
"place": "Portland, OR",
"publisher": "Timber Press",
"attachments": [],
"tags": [],
"notes": [],
"seeAlso": []
},
{
"itemType": "journalArticle",
"title": "Rooftop greenhouse will boost city farming",
"creators": [
{
"firstName": "Lisa W.",
"lastName": "Foderaro",
"creatorType": "author"
}
],
"date": "2012",
"pages": "A20",
"publicationTitle": "New York Times",
"attachments": [],
"tags": [],
"notes": [
{
"note": "The following values have no corresponding Zotero field:<br/>pub-location: New York",
"tags": [
"_EndnoteXML import"
]
}
],
"seeAlso": []
},
{
"itemType": "book",
"title": "Beyond varieties of capitalism : Conflict, contradiction, and complementarities in the European economy",
"creators": [
{
"firstName": "Bob",
"lastName": "Hancké",
"creatorType": "seriesEditor"
},
{
"firstName": "Martin",
"lastName": "Rhodes",
"creatorType": "seriesEditor"
},
{
"firstName": "Mark",
"lastName": "Thatcher",
"creatorType": "seriesEditor"
}
],
"date": "2007",
"ISBN": "9780199206483",
"place": "Oxford and New York",
"publisher": "Oxford University Press",
"shortTitle": "Beyond varieties of capitalism",
"attachments": [],
"tags": [],
"notes": [],
"seeAlso": []
},
{
"itemType": "book",
"title": "Steve Jobs",
"creators": [
{
"firstName": "Walter",
"lastName": "Isaacson",
"creatorType": "author"
}
],
"date": "2011",
"ISBN": "9781451648539",
"place": "New York, {NY}",
"publisher": "Simon & Schuster",
"attachments": [],
"tags": [],
"notes": [],
"seeAlso": []
},
{
"itemType": "bookSection",
"title": "Firms and the welfare state: When, why, and how does social policy matter to employers?",
"creators": [
{
"firstName": "Isabela",
"lastName": "Mares",
"creatorType": "author"
},
{
"firstName": "Peter A.",
"lastName": "Hall",
"creatorType": "editor"
},
{
"firstName": "David",
"lastName": "Soskice",
"creatorType": "editor"
}
],
"date": "2001",
"bookTitle": "Varieties of capitalism. The institutional foundations of comparative advantage",
"pages": "184-213",
"place": "New York",
"publisher": "Oxford University Press",
"attachments": [],
"tags": [],
"notes": [
{
"note": "The following values have no corresponding Zotero field:<br/>periodical: Varieties of capitalism. The institutional foundations of comparative advantage",
"tags": [
"_EndnoteXML import"
]
}
],
"seeAlso": []
},
{
"itemType": "book",
"title": "Shaping the body politic: Art and political formation in early america",
"creators": [
{
"firstName": "Maurie Dee",
"lastName": "McInnis",
"creatorType": "author"
},
{
"firstName": "Louis P.",
"lastName": "Nelson",
"creatorType": "author"
}
],
"date": "2011",
"ISBN": "0813931029",
"abstractNote": "Traditional narratives imply that art in early America was severely limited in scope. By contrast, these essays collectively argue that visual arts played a critical role in shaping an early American understanding of the body politic. American artists in the late colonial and early national periods enlisted the arts to explore and exploit their visions of the relationship of the American colonies to the mother country and, later, to give material shape to the ideals of modern republican nationhood. Taking a uniquely broad view of both politics and art, Shaping the Body Politic ranges in topic from national politics to the politics of national identity, and from presidential portraits to the architectures of the ordinary. The book covers subject matter from the 1760s to the 1820s, ranging from Patience Wright's embodiment of late colonial political tension to Thomas Jefferson's designs for the entry hall at Monticello as a museum. Paul Staiti, Maurie {McInnis}, and Roger Stein offer new readings of canonical presidential images and spaces: Jean-Antoine Houdon's George Washington, Gilbert Stuart's the Lansdowne portrait of Washington, and Thomas Jefferson's Monticello. In essays that engage print and painting, portraiture and landscape, Wendy Bellion, David Steinberg, and John Crowley explore the formation of national identity. The volume's concluding essays, by Susan Rather and Bernard Herman, examine the politics of the everyday. The accompanying eighty-five illustrations and color plates demonstrate the broad range of politically resonant visual material in early America. {ContributorsWendy} Bellion, University of Delaware * John E. Crowley, Dalhousie University * Bernard L. Herman, University of North Carolina, Chapel Hill * Maurie D. {McInnis}, University of Virginia * Louis P. Nelson, University of Virginia * Susan Rather, University of Texas, Austin * Paul Staiti, Mount Holyoke College * Roger B. Stein, emeritus, University of Virginia * David Steinberg, Independent Scholar Thomas Jefferson Foundation Distinguished Lecture Series",
"place": "Charlottesville, VA",
"publisher": "University of Virginia Press",
"attachments": [],
"tags": [],
"notes": [],
"seeAlso": []
},
{
"itemType": "patent",
"title": "Yo-yo having a modifiable string gap",
"creators": [
{
"firstName": "Hans",
"lastName": "Van Dan Elzen",
"creatorType": "inventor"
}
],
"issueDate": "2011",
"abstractNote": "The invention is a yo-yo that includes unique features that enable a user to adjust the yo-yo's string gap. In the preferred embodiment, at least one of the yo-yo's side assemblies includes a screw engaged to a nut that has two thru-bores located in a side-by-side relation. The screw is located to one side of the yo-yo's axis of rotation and can be rotated by a user to adjust the position of the associated side assembly on the yo-yo's axle structure. By appropriate positioning of the side assembly, a user can adjust the yo-yo's performance characteristics.",
"patentNumber": "WO2011US30214",
"attachments": [],
"tags": [],
"notes": [],
"seeAlso": []
},
{
"itemType": "webpage",
"title": "CSL search by example",
"creators": [],
"url": "http://editor.citationstyles.org/searchByExample/",
"websiteTitle": "Citation Style Editor",
"attachments": [],
"tags": [],
"notes": [
{
"note": "The following values have no corresponding Zotero field:<br/>periodical: Citation Style Editor",
"tags": [
"_EndnoteXML import"
]
}
],
"seeAlso": []
}
]
},
{
"type": "import",
"input": "<?xml version=\"1.0\" encoding=\"UTF-8\" ?><xml><records><record><database name=\"My EndNote Library.enl\" path=\"C:\\BACK_THIS_UP\\Desktop\\My EndNote Library.enl\">My EndNote Library.enl</database><source-app name=\"EndNote\" version=\"16.0\">EndNote</source-app><rec-number>1</rec-number><foreign-keys><key app=\"EN\" db-id=\"dstt999adpex2qeprz9xtt0fe2rrpwtarfwv\">1</key></foreign-keys><ref-type name=\"Journal Article\">17</ref-type><contributors></contributors><titles><title><style face=\"normal\" font=\"default\" size=\"100%\">Plain </style><style face=\"bold\" font=\"default\" size=\"100%\">Bold</style><style face=\"italic\" font=\"default\" size=\"100%\"> Italics</style><style face=\"normal\" font=\"default\" size=\"100%\"> </style><style face=\"underline\" font=\"default\" size=\"100%\">Underline</style><style face=\"normal\" font=\"default\" size=\"100%\"> </style><style face=\"superscript\" font=\"default\" size=\"100%\">Superscript</style><style face=\"normal\" font=\"default\" size=\"100%\"> </style><style face=\"subscript\" font=\"default\" size=\"100%\">Subscript</style><style face=\"normal\" font=\"default\" size=\"100%\"> </style><style face=\"normal\" font=\"Symbol\" charset=\"2\" size=\"100%\">SymbolFont</style><style face=\"normal\" font=\"default\" size=\"100%\"> </style><style face=\"normal\" font=\"Courier New\" size=\"100%\">CourierNew</style><style face=\"normal\" font=\"default\" size=\"100%\"> </style><style face=\"normal\" font=\"default\" size=\"7\">SmallerSize</style><style face=\"normal\" font=\"default\" size=\"100%\"> </style><style face=\"normal\" font=\"default\" size=\"12\">Size12 </style><style face=\"bold italic underline superscript\" font=\"Times New Roman\" size=\"100%\">TimesNewRoman-Bold-Italics-Underline-Superscript</style></title></titles><dates></dates><urls></urls></record></records></xml>",
"items": [
{
"itemType": "journalArticle",
"title": "Plain <b>Bold</b><i> Italics</i> Underline <sup>Superscript</sup> <sub>Subscript</sub> SymbolFont CourierNew SmallerSize Size12 <b><i><sup>TimesNewRoman-Bold-Italics-Underline-Superscript</sup></i></b>",
"creators": [],
"attachments": [],
"tags": [],
"notes": [],
"seeAlso": []
}
]
}
]
/** END TEST CASES **/