zotero/translators/Library Catalog (Dynix).js
2011-08-11 07:01:19 +00:00

237 lines
7.0 KiB
JavaScript

{
"translatorID": "774d7dc2-3474-2684-392c-f787789ec63d",
"label": "Library Catalog (Dynix)",
"creator": "Simon Kornblith and Sylvain Machefert",
"target": "ipac\\.jsp\\?.*(?:uri=(?:link|full)=[0-9]|menu=search|term=)",
"minVersion": "2.1",
"maxVersion": "",
"priority": 100,
"inRepository": true,
"translatorType": 4,
"lastUpdated": "2011-07-24 19:43:47"
}
function detectWeb(doc, url) {
var namespace = doc.documentElement.namespaceURI;
var nsResolver = namespace ? function(prefix) {
if (prefix == 'x') return namespace; else return null;
} : null;
// make sure there are multiple results, check to see if the search results number exists
var xpath = '/html/body/table[4]/tbody/tr[2]/td[1]/table/tbody/tr[2]/td/a/b[1]';
var detailsRe = new RegExp('ipac\.jsp\?.*uri=(?:full|link)=[0-9]');
if(detailsRe.test(doc.location.href)) {
return "book";
} else if(!doc.evaluate(xpath, doc, nsResolver, XPathResult.ANY_TYPE, null).iterateNext()) { // this hack catches search results w/ single items
return "book";
} else {
return "multiple";
}
}
function doWeb(doc, url) {
var namespace = doc.documentElement.namespaceURI;
var nsResolver = namespace ? function(prefix) {
if (prefix == 'x') return namespace; else return null;
} : null;
var uri = doc.location.href;
var detailsRe = new RegExp('ipac\.jsp\?.*uri=(?:full|link)=[0-9]');
var uris = new Array();
if(detectWeb(doc,uri) == "book") {
if (uri.indexOf("#") !== -1)
uris.push(uri.replace(/#/,'&fullmarc=true#'));
else
uris.push(uri+'&fullmarc=true');
} else {
var items = Zotero.Utilities.getItemArray(doc, doc, "ipac\.jsp\?.*uri=(?:full|link)=[0-9]|^javascript:buildNewList\\('.*uri%3Dfull%3D[0-9]", "Show details");
items = Zotero.selectItems(items);
if(!items) {
return true;
}
var buildNewList = new RegExp("^javascript:buildNewList\\('([^']+)");
var uris = new Array();
for(var i in items) {
var m = buildNewList.exec(i);
if(m) {
uris.push(unescape(m[1]+'&fullmarc=true'));
} else {
uris.push(i+'&fullmarc=true');
}
}
}
var translator = Zotero.loadTranslator("import");
translator.setTranslator("a6ee60df-1ddc-4aae-bb25-45e0537be973");
translator.getTranslatorObject(function (marc) {
Zotero.Utilities.processDocuments(uris, function (newDoc) {
scrape(newDoc, marc);
}, function() { Zotero.done() }, null);
});
Zotero.wait();
}
function scrape(newDoc, marc) {
var uri = newDoc.location.href;
var namespace = newDoc.documentElement.namespaceURI;
var nsResolver = namespace ? function(prefix) {
if (prefix == 'x') return namespace; else return null;
} : null;
var xpath = '//form/table[@class="tableBackground"]/tbody/tr/td/table[@class="tableBackground"]/tbody/tr[td[1]/a[@class="normalBlackFont1"]]';
var elmts = newDoc.evaluate(xpath, newDoc, nsResolver, XPathResult.ANY_TYPE, null);
if (!elmts.iterateNext()) {
var xpath2 = '//form/table[@class="tableBackground"]/tbody/tr/td/table[@class="tableBackground"]/tbody/tr[td[1]/a[@class="boldBlackFont1"]]';
var elmts = newDoc.evaluate(xpath2, newDoc, nsResolver, XPathResult.ANY_TYPE, null);
}
else
{
// Added to restart the evaluation. Otherwise, because of the iteratenext
// used 5 lines above to test the xpath, we miss the first line (LDR)
elmts = newDoc.evaluate(xpath, newDoc, nsResolver, XPathResult.ANY_TYPE, null);
}
var elmt;
var record = new marc.record();
while(elmt = elmts.iterateNext()) {
var field = Zotero.Utilities.superCleanString(newDoc.evaluate('./TD[1]/A[1]/text()[1]', elmt, nsResolver, XPathResult.ANY_TYPE, null).iterateNext().nodeValue);
var value = newDoc.evaluate('./TD[2]/TABLE[1]/TBODY[1]/TR[1]/TD[1]/A[1]', elmt, nsResolver, XPathResult.ANY_TYPE, null).iterateNext();
// value = null for non-marc table entries w/ that xpath
if (!value) {
value = '';
} else {
value = value.textContent;
}
// Sometimes, the field contains "LDR: ", "001: ". We can delete these extra characters
field = field.replace(/[\s:]/g, "");
if (field == "LDR"){
record.leader = value;
} else if(field != "FMT") {
// In french catalogs (in unimarc), the delimiter isn't the $ but \xA4 is used. Added there
// Also added the fact that subfield codes can be numerics
value = value.replace(/[\xA4\$]([a-z0-9]) /g, marc.subfieldDelimiter+"$1");
var code = field.substring(0, 3);
var ind = "";
if(field.length > 3) {
ind = field[3];
if(field.length > 4) {
ind += field[4];
}
}
record.addField(code, ind, value);
}
}
var newItem = new Zotero.Item();
record.translate(newItem);
var domain = uri.match(/https?:\/\/([^/]+)/);
newItem.repository = domain[1]+" Library Catalog";
// 20091210 : We try to get a permalink on the record
var perma = uri.match(/(https?:\/\/[^/]+.*ipac\.jsp\?).*(uri\=[^&]*)/);
var profile = uri.match(/(profile\=[^&]*)/);
if (perma && perma[1] && perma[2])
{
var permalink = perma[1] + perma[2];
// Sometimes, for libraries with multiple profiles, it can be useful
// to store the permalink with the profile used
if (profile)
{
permalink = permalink + "&" + profile[1];
}
newItem.attachments = [{url:permalink, title:"Original record", mimeType:"text/html", snapshot:false}];
}
else
{
Zotero.debug("Unable to create permalink on " + uri);
}
newItem.complete();
}
/** BEGIN TEST CASES **/
var testCases = [
{
"type": "web",
"url": "http://siris-libraries.si.edu/ipac20/ipac.jsp?&profile=all&source=~!silibraries&uri=full=3100001~!820431~!0#focus",
"items": [
{
"itemType": "book",
"creators": [
{
"lastName": "Pennsylvania Academy of the Fine Arts",
"fieldMode": true
},
{
"firstName": "Thomas",
"lastName": "Eakins",
"creatorType": "contributor"
},
{
"firstName": "Susan Macdowell",
"lastName": "Eakins",
"creatorType": "contributor"
},
{
"firstName": "Benjamin",
"lastName": "Eakins",
"creatorType": "contributor"
},
{
"firstName": "Charles",
"lastName": "Bregler",
"creatorType": "contributor"
},
{
"firstName": "Kathleen A",
"lastName": "Foster",
"creatorType": "contributor"
}
],
"notes": [],
"tags": [
"Eakins, Thomas",
"Eakins, Susan Macdowell",
"Eakins, Benjamin",
"Bregler, Charles",
"Bregler, Charles",
"Library",
"McDowell family",
"Manuscripts",
"Private collections",
"Pennsylvania Philadelphia"
],
"seeAlso": [],
"attachments": [
{
"url": false,
"title": "Original record",
"mimeType": "text/html",
"snapshot": false
}
],
"ISBN": "0812282248",
"title": "Charles Bregler's Thomas Eakins collection",
"place": "Philadelphia, PA",
"publisher": "University of Pennsylvania Press",
"date": "1989",
"numPages": "37",
"callNumber": "mfc 000652",
"libraryCatalog": "siris-libraries.si.edu Library Catalog"
}
]
}
]
/** END TEST CASES **/