175 lines
6.2 KiB
JavaScript
175 lines
6.2 KiB
JavaScript
{
|
|
"translatorID": "d9a16cf3-8b86-4cab-8610-dbd913ad1a44",
|
|
"label": "Archives Canada-France",
|
|
"creator": "Adam Crymble",
|
|
"target": "^https?://bd\\.archivescanadafrance\\.org",
|
|
"minVersion": "1.0.0b4.r5",
|
|
"maxVersion": "",
|
|
"priority": 100,
|
|
"browserSupport": "gcsibv",
|
|
"inRepository": true,
|
|
"translatorType": 4,
|
|
"lastUpdated": "2012-01-01 01:42:16"
|
|
}
|
|
|
|
function detectWeb(doc, url) {
|
|
|
|
if (doc.location.href.match("doc.xsp?")) {
|
|
return "book";
|
|
} else if (doc.evaluate('//li/a', doc, null, XPathResult.ANY_TYPE, null).iterateNext()) {
|
|
return "multiple";
|
|
} else if (doc.evaluate('//td[1][@class="icones"]/a', doc, null, XPathResult.ANY_TYPE, null).iterateNext()) {
|
|
return "multiple";
|
|
}
|
|
}
|
|
|
|
function associateData (newItem, dataTags, field, zoteroField) {
|
|
if (dataTags[field]) {
|
|
newItem[zoteroField] = dataTags[field];
|
|
}
|
|
}
|
|
|
|
function scrape(doc, url) {
|
|
|
|
var namespace = doc.documentElement.namespaceURI;
|
|
var nsResolver = namespace ? function(prefix) {
|
|
if (prefix == 'x') return namespace; else return null;
|
|
} : null;
|
|
|
|
var dataTags = new Object();
|
|
var tagsContent = new Array();
|
|
var fieldTitle;
|
|
|
|
var newItem = new Zotero.Item("book");
|
|
var xPathHeaders = '//td[2]/div[@class="ead-c"]/div[@class="ead-did"]/table[@class="ead-did"]/tbody/tr/td[1]';
|
|
|
|
if (doc.evaluate(xPathHeaders, doc, nsResolver, XPathResult.ANY_TYPE, null).iterateNext()) {
|
|
var headers = doc.evaluate(xPathHeaders, doc, nsResolver, XPathResult.ANY_TYPE, null);
|
|
var contents = doc.evaluate('//td[2][@class="did-content"]', doc, nsResolver, XPathResult.ANY_TYPE, null);
|
|
|
|
while (fieldTitle = headers.iterateNext()) {
|
|
fieldTitle = fieldTitle.textContent.replace(/\s+/g, '');
|
|
if (fieldTitle == "Origination" || fieldTitle == "Origine") {
|
|
fieldTitle = "Origination";
|
|
}
|
|
dataTags[fieldTitle] = Zotero.Utilities.cleanTags(contents.iterateNext().textContent.replace(/^\s*|\s*$/g, ''));
|
|
}
|
|
|
|
if (dataTags["Origination"]) {
|
|
var author = dataTags["Origination"];
|
|
if (!author.match(", ")) {
|
|
newItem.creators.push({lastName: author, creatorType: "author"});
|
|
} else {
|
|
var authors = author.split(", ");
|
|
author = authors[1] + " " + authors[0];
|
|
newItem.creators.push(Zotero.Utilities.cleanAuthor(author, "author"));
|
|
}
|
|
}
|
|
}
|
|
|
|
|
|
if (doc.evaluate('//h1[@class="doc-title"]', doc, nsResolver, XPathResult.ANY_TYPE, null).iterateNext()) {
|
|
newItem.title = doc.evaluate('//h1[@class="doc-title"]', doc, nsResolver, XPathResult.ANY_TYPE, null).iterateNext().textContent;
|
|
} else if (doc.evaluate('//td[2]/div[@class="notice"]/p', doc, nsResolver, XPathResult.ANY_TYPE, null).iterateNext()) {
|
|
newItem.title = doc.evaluate('//td[2]/div[@class="notice"]/p', doc, nsResolver, XPathResult.ANY_TYPE, null).iterateNext().textContent;
|
|
} else {
|
|
newItem.title = doc.title + " Title Not Found";
|
|
}
|
|
|
|
associateData (newItem, dataTags, "PhysicalDescription", "pages");
|
|
associateData (newItem, dataTags, "Descriptionmatérielle", "pages");
|
|
|
|
associateData (newItem, dataTags, "Repository", "repository");
|
|
associateData (newItem, dataTags, "Lieudeconservation", "repository");
|
|
|
|
associateData (newItem, dataTags, "LanguageoftheMaterial", "language");
|
|
associateData (newItem, dataTags, "Langue", "language");
|
|
|
|
associateData (newItem, dataTags, "Identifier", "callNumber");
|
|
associateData (newItem, dataTags, "Cote", "callNumber");
|
|
|
|
associateData (newItem, dataTags, "Datesextrêmes", "date");
|
|
associateData (newItem, dataTags, "Dates", "date");
|
|
|
|
newItem.url = doc.location.href;
|
|
newItem.complete();
|
|
}
|
|
|
|
function doWeb(doc, url) {
|
|
var namespace = doc.documentElement.namespaceURI;
|
|
var nsResolver = namespace ? function(prefix) {
|
|
if (prefix == 'x') return namespace; else return null;
|
|
} : null;
|
|
|
|
var articles = new Array();
|
|
|
|
if (detectWeb(doc, url) == "multiple") {
|
|
|
|
var items = new Object();
|
|
|
|
if (doc.evaluate('//td[1][@class="icones"]/a', doc, nsResolver, XPathResult.ANY_TYPE, null).iterateNext()) {
|
|
var titles = doc.evaluate('//td[2][@class="ressource"]', doc, nsResolver, XPathResult.ANY_TYPE, null);
|
|
var titlesCount = doc.evaluate('count (//td[2][@class="ressource"])', doc, nsResolver, XPathResult.ANY_TYPE, null);
|
|
var links = doc.evaluate('//td[1][@class="icones"]/a', doc, nsResolver, XPathResult.ANY_TYPE, null);
|
|
|
|
var next_link;
|
|
|
|
for (var i = 0; i < titlesCount.numberValue; i++) {
|
|
next_link = links.iterateNext().href;
|
|
if (!next_link.match("doc.xsp")) {
|
|
next_link = links.iterateNext().href;
|
|
}
|
|
items[next_link] = titles.iterateNext().textContent;
|
|
}
|
|
}
|
|
|
|
if (doc.evaluate('//li/a', doc, nsResolver, XPathResult.ANY_TYPE, null).iterateNext()) {
|
|
var titles = doc.evaluate('//li/a', doc, nsResolver, XPathResult.ANY_TYPE, null);
|
|
var next_title;
|
|
while (next_title = titles.iterateNext()) {
|
|
items[next_title.href] = next_title.textContent;
|
|
}
|
|
}
|
|
|
|
items = Zotero.selectItems(items);
|
|
for (var i in items) {
|
|
articles.push(i);
|
|
}
|
|
|
|
} else if (doc.evaluate('//div[@class="ancestor"]/a', doc, nsResolver, XPathResult.ANY_TYPE, null).iterateNext()) {
|
|
|
|
var link = doc.evaluate('//div[@class="ancestor"]/a', doc, nsResolver, XPathResult.ANY_TYPE, null).iterateNext().href;
|
|
|
|
articles = [link];
|
|
} else {
|
|
articles = [url]
|
|
}
|
|
Zotero.Utilities.processDocuments(articles, scrape, function() {Zotero.done();});
|
|
Zotero.wait();
|
|
}/** BEGIN TEST CASES **/
|
|
var testCases = [
|
|
{
|
|
"type": "web",
|
|
"url": "http://bd.archivescanadafrance.org/sdx-222-acf-pleade-2/acf/search-acf.xsp?sq1=montreal&fi1=fulltext&sq2=&fi2=fulltext&sq3=&fi3=fulltext&ed=&dbeg=&dend=&frepo=&forig=&x=0&y=0#resume",
|
|
"items": "multiple"
|
|
},
|
|
{
|
|
"type": "web",
|
|
"url": "http://bd.archivescanadafrance.org/sdx-222-acf-pleade-2/acf/doc.xsp?id=CAANQ_PISTARD_03Q808_392_CAANQ_PISTARD_03Q808_392&qid=sdx_q0&fmt=tab&base=fa&n=5&root=CAANQ_PISTARD_03Q808_392&ss=true&as=&ai=&from=",
|
|
"items": [
|
|
{
|
|
"itemType": "book",
|
|
"creators": [],
|
|
"notes": [],
|
|
"tags": [],
|
|
"seeAlso": [],
|
|
"attachments": [],
|
|
"title": "Fonds Intendants",
|
|
"url": "http://bd.archivescanadafrance.org/sdx-222-acf-pleade-2/acf/doc.xsp?id=ANQ_00001_intendants&fmt=tab&base=fa&root=CAANQ_PISTARD_03Q808_392&n=5&qid=sdx_q0&ss=true&as=&ai=",
|
|
"libraryCatalog": "Archives Canada-France",
|
|
"accessDate": "CURRENT_TIMESTAMP"
|
|
}
|
|
]
|
|
}
|
|
]
|
|
/** END TEST CASES **/ |