ThisTest/translators/DBLP Computer Science Bibli...

386 lines
11 KiB
JavaScript
Raw Normal View History

2022-03-23 12:58:01 +01:00
{
"translatorID": "625c6435-e235-4402-a48f-3095a9c1a09c",
"label": "DBLP Computer Science Bibliography",
"creator": "Sebastian Karcher, Philipp Zumstein",
"target": "^https?://(www\\.)?(dblp\\d?(\\.org|\\.uni-trier\\.de/|\\.dagstuhl\\.de/))",
"minVersion": "3.0",
"maxVersion": "",
"priority": 100,
"inRepository": true,
"translatorType": 4,
"browserSupport": "gcsibv",
"lastUpdated": "2020-05-03 20:02:38"
}
/*
***** BEGIN LICENSE BLOCK *****
Copyright © 2011-2019 Sebastian Karcher, Philipp Zumstein
This file is part of Zotero.
Zotero is free software: you can redistribute it and/or modify
it under the terms of the GNU Affero General Public License as published by
the Free Software Foundation, either version 3 of the License, or
(at your option) any later version.
Zotero is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU Affero General Public License for more details.
You should have received a copy of the GNU Affero General Public License
along with Zotero. If not, see <http://www.gnu.org/licenses/>.
***** END LICENSE BLOCK *****
*/
function detectWeb(doc, url) {
if (url.includes('rec/bibtex') || url.includes('rec/html')) {
if (url.includes('journals')) {
return "journalArticle";
}
else if (url.includes('conf')) {
return "conferencePaper";
}
else if (url.includes('series') || url.includes('reference')) {
return "bookSection";
}
else if (url.includes('books')) {
return "book";
}
else if (url.includes('phd')) {
return "thesis";
}
else { // generic fallback
return "journalArticle";
}
}
else if ((url.match(/\/db\/(journals|conf|series|reference)/) || url.match(/\/pers\/(hd|ht|hy)/)) && !url.match(/index[\w-]*\.html/) || url.includes("/search?q=")) {
return "multiple";
}
return false;
}
function scrape(doc, _url) {
var xPathAllData = doc.evaluate('//pre', doc, null, XPathResult.ANY_TYPE, null);
var firstData = xPathAllData.iterateNext(); // only if exists
var firstDataText = firstData.textContent.replace(/ ee\s*=/, " url ="); // e.g. ee = {http://dx.doi.org/10.1007/978-3-319-00035-0_37},
// conferencePapers and bookSections are linked in DBLP
// with the crossref field to the second BibTeX entry
// for the proceeding or book. In these cases the following
// lines (if-part) are handling the second entry and extracting
// relevant fields and save it (later) to the main entry.
var secondData = xPathAllData.iterateNext();
if (secondData) {
var secondDataText = secondData.textContent;
var trans = Zotero.loadTranslator('import');
trans.setTranslator('9cb70025-a888-4a29-a210-93ec52da40d4');// https://github.com/zotero/translators/blob/master/BibTeX.js
trans.setString(secondDataText);
trans.setHandler('itemDone', function (obj, item) {
scrapeMainPart(firstDataText, item);
});
trans.translate();
}
else { // if there are no secondData: scrape without additional data
scrapeMainPart(firstDataText, null);
}
}
function scrapeMainPart(firstDataText, secondDataItem) {
// scrape from the firstDataText and if secondDataItem
// is not null, add/update these information
var trans = Zotero.loadTranslator('import');
trans.setTranslator('9cb70025-a888-4a29-a210-93ec52da40d4');// https://github.com/zotero/translators/blob/master/BibTeX.js
trans.setString(firstDataText);
trans.setHandler('itemDone', function (obj, item) {
if (secondDataItem) {
if (secondDataItem.title && item.itemType == "conferencePaper") item.proceedingsTitle = secondDataItem.title;
if (secondDataItem.title && item.itemType == "bookSection") item.booktitle = secondDataItem.titel;
if (secondDataItem.creators && secondDataItem.creators.length > 0) item.creators = item.creators.concat(secondDataItem.creators);
if (secondDataItem.publisher && !item.publisher) item.publisher = secondDataItem.publisher;
if (secondDataItem.series && !item.series) item.series = secondDataItem.series;
if (secondDataItem.volume && !item.volume) item.volume = secondDataItem.volume;
if (secondDataItem.ISBN && !item.ISBN) item.ISBN = secondDataItem.ISBN;
}
// Assume that the url contains an doi. If the item does not
// yet contain a doi, then save the doi and delete the url.
// If the item contains the doi corresponding to the url
// then just delete the url and keep the doi.
if (item.url && item.url.search(/^https?:\/\/(?:dx\.)?doi\.org\/10\./i) != -1) {
var doi = ZU.cleanDOI(item.url);
if (doi && (!item.DOI || item.DOI == doi)) {
item.DOI = doi;
delete item.url;
}
}
item.complete();
});
trans.translate();
}
function doWeb(doc, url) {
if (detectWeb(doc, url) == "multiple") {
var items = {};
var articles = [];
var rows = ZU.xpath(doc, '//body/ul/li|//li[contains(@class, "entry")]');
for (let i = 0; i < rows.length; i++) {
// Careful: If you get more than one node,
// ZU.xpathText will join the textContent of each with commas.
var title = ZU.xpathText(rows[i], './/span[@class="title"]');
var link = ZU.xpathText(rows[i], './a[contains(@href, "rec/bibtex") and not(contains(@href, ".xml"))]/@href|./nav//div/a[contains(@href, "rec/bibtex") and not(contains(@href, ".xml"))]/@href');
items[link] = title;
}
Zotero.selectItems(items, function (items) {
if (!items) {
return;
}
for (let i in items) {
articles.push(i);
}
ZU.processDocuments(articles, scrape);
});
}
else if (url.includes('rec/html')) {
ZU.processDocuments([url.replace('rec/html', 'rec/bibtex')], scrape);
}
else {
scrape(doc, url);
}
}
/** BEGIN TEST CASES **/
var testCases = [
{
"type": "web",
"url": "https://dblp.org/rec/bibtex/journals/cssc/XuY12",
"items": [
{
"itemType": "journalArticle",
"title": "On the Preliminary Test Backfitting and Speckman Estimators in Partially Linear Models and Numerical Comparisons",
"creators": [
{
"firstName": "Jianwen",
"lastName": "Xu",
"creatorType": "author"
},
{
"firstName": "Hu",
"lastName": "Yang",
"creatorType": "author"
}
],
"date": "2012",
"DOI": "10.1080/03610918.2011.588356",
"issue": "3",
"itemID": "DBLP:journals/cssc/XuY12",
"libraryCatalog": "DBLP Computer Science Bibliography",
"pages": "327341",
"publicationTitle": "Communications in Statistics - Simulation and Computation",
"volume": "41",
"attachments": [],
"tags": [],
"notes": [],
"seeAlso": []
}
]
},
{
"type": "web",
"url": "https://dblp.org/rec/bibtex/conf/ats/KochteZBIWHCP10",
"items": [
{
"itemType": "conferencePaper",
"title": "Efficient Simulation of Structural Faults for the Reliability Evaluation at System-Level",
"creators": [
{
"firstName": "Michael A.",
"lastName": "Kochte",
"creatorType": "author"
},
{
"firstName": "Christian G.",
"lastName": "Zoellin",
"creatorType": "author"
},
{
"firstName": "Rafal",
"lastName": "Baranowski",
"creatorType": "author"
},
{
"firstName": "Michael E.",
"lastName": "Imhof",
"creatorType": "author"
},
{
"firstName": "Hans-Joachim",
"lastName": "Wunderlich",
"creatorType": "author"
},
{
"firstName": "Nadereh",
"lastName": "Hatami",
"creatorType": "author"
},
{
"firstName": "Stefano Di",
"lastName": "Carlo",
"creatorType": "author"
},
{
"firstName": "Paolo",
"lastName": "Prinetto",
"creatorType": "author"
}
],
"date": "2010",
"DOI": "10.1109/ATS.2010.10",
"itemID": "DBLP:conf/ats/KochteZBIWHCP10",
"libraryCatalog": "DBLP Computer Science Bibliography",
"pages": "38",
"proceedingsTitle": "Proceedings of the 19th IEEE Asian Test Symposium, ATS 2010, 1-4 December 2010, Shanghai, China",
"publisher": "IEEE Computer Society",
"attachments": [],
"tags": [],
"notes": [],
"seeAlso": []
}
]
},
{
"type": "web",
"url": "https://dblp1.uni-trier.de/db/journals/tois/tois25.html",
"items": "multiple"
},
{
"type": "web",
"url": "https://dblp.uni-trier.de/db/journals/tods/tods31.html",
"items": "multiple"
},
{
"type": "web",
"url": "https://dblp.dagstuhl.de/pers/hd/k/Knuth:Donald_E=.html",
"items": "multiple"
},
{
"type": "web",
"url": "https://dblp.uni-trier.de/rec/bibtex/conf/approx/SchederT13",
"items": [
{
"itemType": "conferencePaper",
"title": "On the Average Sensitivity and Density of k-CNF Formulas",
"creators": [
{
"firstName": "Dominik",
"lastName": "Scheder",
"creatorType": "author"
},
{
"firstName": "Li-Yang",
"lastName": "Tan",
"creatorType": "author"
},
{
"firstName": "Prasad",
"lastName": "Raghavendra",
"creatorType": "editor"
},
{
"firstName": "Sofya",
"lastName": "Raskhodnikova",
"creatorType": "editor"
},
{
"firstName": "Klaus",
"lastName": "Jansen",
"creatorType": "editor"
},
{
"firstName": "José D. P.",
"lastName": "Rolim",
"creatorType": "editor"
}
],
"date": "2013",
"DOI": "10.1007/978-3-642-40328-6_47",
"itemID": "DBLP:conf/approx/SchederT13",
"libraryCatalog": "DBLP Computer Science Bibliography",
"pages": "683698",
"proceedingsTitle": "Approximation, Randomization, and Combinatorial Optimization. Algorithms and Techniques - 16th International Workshop, APPROX 2013, and 17th International Workshop, RANDOM 2013, Berkeley, CA, USA, August 21-23, 2013. Proceedings",
"publisher": "Springer",
"series": "Lecture Notes in Computer Science",
"volume": "8096",
"attachments": [],
"tags": [],
"notes": [],
"seeAlso": []
}
]
},
{
"type": "web",
"url": "https://dblp.org/rec/html/conf/iclr/DasMYTM19",
"items": [
{
"itemType": "conferencePaper",
"title": "Building Dynamic Knowledge Graphs from Text using Machine Reading Comprehension",
"creators": [
{
"firstName": "Rajarshi",
"lastName": "Das",
"creatorType": "author"
},
{
"firstName": "Tsendsuren",
"lastName": "Munkhdalai",
"creatorType": "author"
},
{
"firstName": "Xingdi",
"lastName": "Yuan",
"creatorType": "author"
},
{
"firstName": "Adam",
"lastName": "Trischler",
"creatorType": "author"
},
{
"firstName": "Andrew",
"lastName": "McCallum",
"creatorType": "author"
}
],
"date": "2019",
"itemID": "DBLP:conf/iclr/DasMYTM19",
"libraryCatalog": "DBLP Computer Science Bibliography",
"proceedingsTitle": "7th International Conference on Learning Representations, ICLR 2019, New Orleans, LA, USA, May 6-9, 2019",
"publisher": "OpenReview.net",
"url": "https://openreview.net/forum?id=S1lhbnRqF7",
"attachments": [],
"tags": [],
"notes": [],
"seeAlso": []
}
]
},
{
"type": "web",
"url": "https://dblp.org/search?q=zotero",
"items": "multiple"
}
]
/** END TEST CASES **/