229 lines
7.2 KiB
JavaScript
229 lines
7.2 KiB
JavaScript
{
|
|
"translatorID": "88e11bcb-464d-4b6d-a446-8994e3b865c9",
|
|
"label": "Web of Science",
|
|
"creator": "Philipp Zumstein",
|
|
"target": "^https?://([^/]+\\.)?webofknowledge\\.com/",
|
|
"minVersion": "3.0",
|
|
"maxVersion": "",
|
|
"priority": 100,
|
|
"inRepository": true,
|
|
"translatorType": 4,
|
|
"browserSupport": "gcsib",
|
|
"lastUpdated": "2015-06-04 04:20:22"
|
|
}
|
|
|
|
/*
|
|
***** BEGIN LICENSE BLOCK *****
|
|
|
|
Copyright © 2015 Philipp Zumstein
|
|
|
|
This file is part of Zotero.
|
|
|
|
Zotero is free software: you can redistribute it and/or modify
|
|
it under the terms of the GNU Affero General Public License as published by
|
|
the Free Software Foundation, either version 3 of the License, or
|
|
(at your option) any later version.
|
|
|
|
Zotero is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
GNU Affero General Public License for more details.
|
|
|
|
You should have received a copy of the GNU Affero General Public License
|
|
along with Zotero. If not, see <http://www.gnu.org/licenses/>.
|
|
|
|
***** END LICENSE BLOCK *****
|
|
*/
|
|
|
|
function detectWeb(doc, url) {
|
|
if ( (url.includes("full_record.do")
|
|
|| url.includes("CitedFullRecord.do")
|
|
|| url.includes("InboundService.do") )
|
|
&& getSingleItemId(doc)
|
|
) {
|
|
return "journalArticle";
|
|
} else if (((doc.title.includes(" Results"))
|
|
|| url.includes("search_mode="))
|
|
&& getRecords(doc).length) {
|
|
return "multiple";
|
|
}
|
|
}
|
|
|
|
function getRecords(doc) {
|
|
return ZU.xpath(doc, '//span[@id="records_chunks"]//div[starts-with(@id,"RECORD_")]');
|
|
}
|
|
|
|
function getSingleItemId(doc) {
|
|
var form = doc.forms['records_form'];
|
|
if (form) return (form.elements.namedItem('marked_list_candidates') || {}).value;
|
|
|
|
return false;
|
|
}
|
|
|
|
function doWeb(doc, url) {
|
|
var ids = new Array();
|
|
if (detectWeb(doc, url) == "multiple") {
|
|
var items = new Object;
|
|
var records = getRecords(doc);
|
|
var recordID, title;
|
|
for (var i=0, n=records.length; i<n; i++) {
|
|
recordID = ZU.xpathText(records[i], './/input[@name="marked_list_candidates"]/@value');
|
|
title = ZU.xpathText(records[i], './/a[contains(@href, "/full_record.do?")]|.//a[contains(@href, "/CitedFullRecord.do?")]');
|
|
|
|
if (!title || !recordID) continue;
|
|
|
|
items[recordID] = title.trim();
|
|
}
|
|
|
|
Zotero.selectItems(items, function (items) {
|
|
if (!items) return true;
|
|
|
|
var ids = [];
|
|
for (var i in items) {
|
|
ids.push(i);
|
|
}
|
|
|
|
// Due to a long-standing bug in connectors, when no items are selected,
|
|
// an empty object is returned instead of false, so we actually do get to
|
|
// this point. Furthermore, WoS appears to export all results if no IDs
|
|
// are supplied. So this is a hack to avoid this very special case.
|
|
// See https://github.com/zotero/zotero-connectors/pull/36
|
|
if (!ids.length) return true;
|
|
|
|
fetchIds(ids, doc);
|
|
});
|
|
} else {
|
|
fetchIds([getSingleItemId(doc)], doc);
|
|
}
|
|
}
|
|
|
|
function getHiddenValues(form) {
|
|
var inputs = form.elements;
|
|
var values = {};
|
|
var node;
|
|
for (var i=0; node = inputs.item(i); i++) {
|
|
if (node.type == 'hidden') {
|
|
values[node.name] = node.value;
|
|
}
|
|
}
|
|
return values;
|
|
}
|
|
|
|
function serializePostData(data) {
|
|
var str = '';
|
|
for (var i in data) {
|
|
str += '&' + encodeURIComponent(i) + '='
|
|
+ encodeURIComponent(data[i]).replace(/%20/g, "+");
|
|
}
|
|
return str.substr(1);
|
|
}
|
|
|
|
function getOutputForm(doc) {
|
|
return doc.forms['output_form'] || doc.forms['records_form'] || doc.forms['summary_records_form'];
|
|
}
|
|
|
|
function importISIRecord(text) {
|
|
Z.debug(text);
|
|
var importer = Zotero.loadTranslator("import");
|
|
importer.setTranslator("594ebe3c-90a0-4830-83bc-9502825a6810");
|
|
importer.setString(text);
|
|
importer.setHandler('itemDone', function(obj, item) {
|
|
if (item.title.toUpperCase() == item.title) {
|
|
item.title = ZU.capitalizeTitle(item.title, true);
|
|
}
|
|
|
|
var creator;
|
|
for (var i=0, n=item.creators.length; i<n; i++) {
|
|
creator = item.creators[i];
|
|
if (creator.firstName.toUpperCase() == creator.firstName) {
|
|
creator.firstName = ZU.capitalizeTitle(creator.firstName, true);
|
|
}
|
|
if (creator.lastName.toUpperCase() == creator.lastName) {
|
|
creator.lastName = ZU.capitalizeTitle(creator.lastName, true);
|
|
}
|
|
}
|
|
item.complete();
|
|
});
|
|
importer.translate();
|
|
}
|
|
|
|
function fetchIds(ids, doc) {
|
|
var outputForm = getOutputForm(doc);
|
|
var postData = getHiddenValues(outputForm);
|
|
var filters = 'USAGEIND RESEARCHERID ACCESSION_NUM FUNDING SUBJECT_CATEGORY '
|
|
+ 'JCR_CATEGORY LANG IDS PAGEC SABBR CITREFC ISSN PUBINFO KEYWORDS '
|
|
+ 'CITTIMES ADDRS CONFERENCE_SPONSORS DOCTYPE ABSTRACT CONFERENCE_INFO '
|
|
+ 'SOURCE TITLE AUTHORS '
|
|
//additional fields from INSPEC
|
|
+ 'ADDRESS AUTHORS_EDITORS AUTHORSIDENTIFIERS CLASSIFICATION_CODES '
|
|
+ 'CONFERENCE_SPONSORS DESCRIPTORS IDENTIFYING_CODES IMAGES '
|
|
+ 'INVENTORS_ASSIGNEES IPC NUM_OF_REF PATENT_INFO SPONSORS TRANSLATORS '
|
|
+ 'TREATMENT UNCONTROLLED_TERMS';
|
|
postData['value(record_select_type)'] = 'selrecords';
|
|
postData['markFrom'] = '';
|
|
postData['markTo'] = '';
|
|
postData['fields_selection'] = filters;
|
|
postData['filters'] = filters;
|
|
postData['save_options'] = 'othersoftware';
|
|
postData['format'] = 'saveToRef';
|
|
|
|
//add selected items
|
|
var selectedIds = ids.join(';');
|
|
postData['selectedIds'] = selectedIds;
|
|
|
|
var postUrl = outputForm.action;
|
|
Z.debug("Posting to " + postUrl);
|
|
/**
|
|
* Note that when using the form on the page, the request ends up redirecting
|
|
* to ets.webofknowledge.com which makes it cross-origin. Somehow, this POST
|
|
* avoids the redirect, so things just work, but if the behavior changes in
|
|
* the future, it would break scraping on IE/bookmarklet and Safari
|
|
*/
|
|
ZU.doPost(postUrl, serializePostData(postData), function (text) {
|
|
//check if there's an intermediate page
|
|
if (text.indexOf('FN ') === 0) {
|
|
importISIRecord(text);
|
|
return;
|
|
}
|
|
|
|
//otherwise we have an intermediate page (maybe... it just kind of went away one day)
|
|
//everything it mostly the same as above except for a few fields
|
|
var postData2 = {};
|
|
postData2['locale'] = postData['locale'];
|
|
postData2['colName'] = postData['colName'];
|
|
postData2['sortBy'] = postData['sortBy'];
|
|
postData2['SID'] = postData['SID'];
|
|
postData2['filters'] = postData['filters'];
|
|
postData2['fileOpt'] = 'fieldtagged';
|
|
postData2['action'] = 'saveDataToRef';
|
|
postData2['product'] = 'UA';
|
|
postData2['numRecords'] = ids.length;
|
|
postData2['numRecsToRetrieve'] = 500;
|
|
|
|
var qid = text.match(/<input[^>]+name=(['"]?)qid\1[\s\/][^>]*/);
|
|
if (qid) qid = qid[0].match(/value=['"]?(\d+)/);
|
|
if (qid) {
|
|
qid = qid[1];
|
|
} else {
|
|
qid = postData['qid']*1+1; //this can be wrong if pages are refreshed
|
|
Z.debug("Could not find qid on page. Using 1 + previous qid: " + qid);
|
|
text = text.replace(/\s*[\r\n]\s*/g, '\n'); //trim out the extra newlines
|
|
var forms = text.match(/<form[\s\S]+?<\/form>/ig);
|
|
if (forms) {
|
|
Z.debug("Page contained the following forms:");
|
|
Z.debug(forms.join('\n==============================\n'));
|
|
} else {
|
|
Z.debug("Could not find any forms on the page. Here's the whole HTML");
|
|
Z.debug(text);
|
|
}
|
|
}
|
|
postData2['qid'] = qid;
|
|
|
|
var postUrl2 = 'http://ets.webofknowledge.com/ETS/saveDataToRef.do'; //Zotero should take care of proxies
|
|
ZU.doPost(postUrl2, serializePostData(postData2), function(text) {
|
|
importISIRecord(text);
|
|
}, { 'Referer': postUrl });
|
|
|
|
}, { 'Referer': doc.location.href });
|
|
}
|