closes #269, For some COinS pages "could not save item" error
This commit is contained in:
parent
0ab9e8b36c
commit
e5404f4938
|
@ -415,7 +415,7 @@ Scholar.OpenURL = new function() {
|
||||||
item.creators.push({firstName:value});
|
item.creators.push({firstName:value});
|
||||||
}
|
}
|
||||||
} else if(key == "rft.au") {
|
} else if(key == "rft.au") {
|
||||||
item.creators.push(Scholar.cleanAuthor(value, "author", true));
|
item.creators.push(Scholar.Utilities.prototype.cleanAuthor(value, "author", true));
|
||||||
} else if(key == "rft.aucorp") {
|
} else if(key == "rft.aucorp") {
|
||||||
item.creators.push({lastName:value, institutional:true});
|
item.creators.push({lastName:value, institutional:true});
|
||||||
} else if(key == "rft.isbn" && !item.ISBN) {
|
} else if(key == "rft.isbn" && !item.ISBN) {
|
||||||
|
|
81
scrapers.sql
81
scrapers.sql
|
@ -1,4 +1,4 @@
|
||||||
-- 73
|
-- 74
|
||||||
|
|
||||||
-- Set the following timestamp to the most recent scraper update date
|
-- Set the following timestamp to the most recent scraper update date
|
||||||
REPLACE INTO "version" VALUES ('repository', STRFTIME('%s', '2006-08-31 22:44:00'));
|
REPLACE INTO "version" VALUES ('repository', STRFTIME('%s', '2006-08-31 22:44:00'));
|
||||||
|
@ -2792,7 +2792,7 @@ REPLACE INTO "translators" VALUES ('05d07af9-105a-4572-99f6-a8e231c0daef', '2006
|
||||||
}',
|
}',
|
||||||
'// used to retrieve next COinS object when asynchronously parsing COinS objects
|
'// used to retrieve next COinS object when asynchronously parsing COinS objects
|
||||||
// on a page
|
// on a page
|
||||||
function retrieveNextCOinS(needFullItems, newItems, doc) {
|
function retrieveNextCOinS(needFullItems, newItems, couldUseFullItems, doc) {
|
||||||
if(needFullItems.length) {
|
if(needFullItems.length) {
|
||||||
var item = needFullItems.shift();
|
var item = needFullItems.shift();
|
||||||
|
|
||||||
|
@ -2802,26 +2802,26 @@ function retrieveNextCOinS(needFullItems, newItems, doc) {
|
||||||
newItems.push(item);
|
newItems.push(item);
|
||||||
});
|
});
|
||||||
search.setHandler("done", function() {
|
search.setHandler("done", function() {
|
||||||
retrieveNextCOinS(needFullItems, newItems, doc);
|
retrieveNextCOinS(needFullItems, newItems, couldUseFullItems, doc);
|
||||||
});
|
});
|
||||||
search.setSearch(item);
|
search.setSearch(item);
|
||||||
|
|
||||||
// look for translators
|
// look for translators
|
||||||
var translators = search.getTranslators();
|
var translators = search.getTranslators();
|
||||||
if(translators) {
|
if(translators.length) {
|
||||||
search.setTranslator(translators);
|
search.setTranslator(translators);
|
||||||
search.translate();
|
search.translate();
|
||||||
} else {
|
} else {
|
||||||
retrieveNextCOinS(needFullItems, newItems, doc);
|
retrieveNextCOinS(needFullItems, newItems, couldUseFullItems, doc);
|
||||||
}
|
}
|
||||||
} else {
|
} else {
|
||||||
completeCOinS(newItems, doc);
|
completeCOinS(newItems, couldUseFullItems, doc);
|
||||||
Scholar.done(true);
|
Scholar.done(true);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
// saves all COinS objects
|
// saves all COinS objects
|
||||||
function completeCOinS(newItems, doc) {
|
function completeCOinS(newItems, couldUseFullItems, doc) {
|
||||||
if(newItems.length > 1) {
|
if(newItems.length > 1) {
|
||||||
var selectArray = new Array();
|
var selectArray = new Array();
|
||||||
|
|
||||||
|
@ -2829,21 +2829,67 @@ function completeCOinS(newItems, doc) {
|
||||||
selectArray[i] = newItems[i].title;
|
selectArray[i] = newItems[i].title;
|
||||||
}
|
}
|
||||||
selectArray = Scholar.selectItems(selectArray);
|
selectArray = Scholar.selectItems(selectArray);
|
||||||
|
|
||||||
|
var useIndices = new Array();
|
||||||
for(var i in selectArray) {
|
for(var i in selectArray) {
|
||||||
|
useIndices.push(i);
|
||||||
|
}
|
||||||
|
completeItems(newItems, useIndices, couldUseFullItems);
|
||||||
|
} else if(newItems.length) {
|
||||||
|
completeItems(newItems, [0], couldUseFullItems);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
function completeItems(newItems, useIndices, couldUseFullItems, doc) {
|
||||||
|
if(!useIndices.length) {
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
var i = useIndices.shift();
|
||||||
|
|
||||||
|
// grab full item if requested
|
||||||
|
if(couldUseFullItems[i]) {
|
||||||
|
Scholar.Utilities.debug("looking up contextObject");
|
||||||
|
var search = Scholar.loadTranslator("search");
|
||||||
|
|
||||||
|
var firstItem = false;
|
||||||
|
search.setHandler("itemDone", function(obj, newItem) {
|
||||||
|
if(!firstItem) {
|
||||||
|
// add doc as attachment
|
||||||
|
newItem.attachments.push({document:doc});
|
||||||
|
newItem.complete();
|
||||||
|
firstItem = true;
|
||||||
|
}
|
||||||
|
});
|
||||||
|
search.setHandler("done", function(obj) {
|
||||||
|
// call next
|
||||||
|
completeItems(newItems, useIndices, couldUseFullItems);
|
||||||
|
});
|
||||||
|
|
||||||
|
search.setSearch(newItems[i]);
|
||||||
|
var translators = search.getTranslators();
|
||||||
|
if(translators.length) {
|
||||||
|
search.setTranslator(translators);
|
||||||
|
search.translate();
|
||||||
|
} else {
|
||||||
// add doc as attachment
|
// add doc as attachment
|
||||||
newItems[i].attachments.push({document:doc});
|
newItems[i].attachments.push({document:doc});
|
||||||
|
|
||||||
newItems[i].complete();
|
newItems[i].complete();
|
||||||
|
// call next
|
||||||
|
completeItems(newItems, useIndices, couldUseFullItems);
|
||||||
}
|
}
|
||||||
} else if(newItems.length) {
|
} else {
|
||||||
newItems[0].attachments.push({document:doc});
|
// add doc as attachment
|
||||||
newItems[0].complete();
|
newItems[i].attachments.push({document:doc});
|
||||||
|
newItems[i].complete();
|
||||||
|
// call next
|
||||||
|
completeItems(newItems, useIndices, couldUseFullItems);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
function doWeb(doc, url) {
|
function doWeb(doc, url) {
|
||||||
var newItems = new Array();
|
var newItems = new Array();
|
||||||
var needFullItems = new Array();
|
var needFullItems = new Array();
|
||||||
|
var couldUseFullItems = new Array();
|
||||||
|
|
||||||
var spanTags = doc.getElementsByTagName("span");
|
var spanTags = doc.getElementsByTagName("span");
|
||||||
|
|
||||||
|
@ -2855,7 +2901,13 @@ function doWeb(doc, url) {
|
||||||
var spanTitle = spanTags[i].getAttribute("title");
|
var spanTitle = spanTags[i].getAttribute("title");
|
||||||
var newItem = new Scholar.Item();
|
var newItem = new Scholar.Item();
|
||||||
if(Scholar.Utilities.parseContextObject(spanTitle, newItem)) {
|
if(Scholar.Utilities.parseContextObject(spanTitle, newItem)) {
|
||||||
if(newItem.title && newItem.creators.length) {
|
if(newItem.title) {
|
||||||
|
if(!newItem.creators.length) {
|
||||||
|
// if we have a title but little other identifying
|
||||||
|
// information, say we''ll get full item later
|
||||||
|
couldUseFullItems[newItems.length] = true;
|
||||||
|
}
|
||||||
|
|
||||||
// title and creators are minimum data to avoid looking up
|
// title and creators are minimum data to avoid looking up
|
||||||
newItems.push(newItem);
|
newItems.push(newItem);
|
||||||
} else {
|
} else {
|
||||||
|
@ -2868,12 +2920,13 @@ function doWeb(doc, url) {
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
Scholar.Utilities.debug(needFullItems);
|
||||||
if(needFullItems.length) {
|
if(needFullItems.length) {
|
||||||
// retrieve full items asynchronously
|
// retrieve full items asynchronously
|
||||||
Scholar.wait();
|
Scholar.wait();
|
||||||
retrieveNextCOinS(needFullItems, newItems, doc);
|
retrieveNextCOinS(needFullItems, newItems, couldUseFullItems, doc);
|
||||||
} else {
|
} else {
|
||||||
completeCOinS(newItems, doc);
|
completeCOinS(newItems, couldUseFullItems, doc);
|
||||||
}
|
}
|
||||||
}');
|
}');
|
||||||
|
|
||||||
|
|
Loading…
Reference in New Issue
Block a user