diff --git a/translators/Frontiers.js b/translators/Frontiers.js new file mode 100644 index 000000000..627af9076 --- /dev/null +++ b/translators/Frontiers.js @@ -0,0 +1,285 @@ +{ + "translatorID":"cb9e794e-7a65-47cd-90f6-58cdd191e8b0", + "label":"Frontiers", + "creator":"Jason Friedman", + "target":"^http://www.frontiersin.org.*/", + "minVersion":"1.0", + "maxVersion":"", + "priority":100, + "inRepository":"1", + "translatorType":4, + "lastUpdated":"2010-12-28 23:21:54" +} + +/* + Frontiers translator + Copyright (C) 2009-2010 Jason Friedman, write.to.jason@gmail.com + + This program is free software: you can redistribute it and/or modify + it under the terms of the GNU General Public License as published by + the Free Software Foundation, either version 3 of the License, or + (at your option) any later version. + + This program is distributed in the hope that it will be useful, + but WITHOUT ANY WARRANTY; without even the implied warranty of + MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + GNU General Public License for more details. + + You should have received a copy of the GNU General Public License + along with this program. If not, see . +*/ + +function detectWeb(doc, url) { + + if (url.indexOf("abstract") != -1) { + return "journalArticle"; + } + else if (url.indexOf("full") != -1) { + return "journalArticle"; + } + else if (url.indexOf("SearchSite") != -1) { + return "multiple"; + } + // other pages on the site may contain articles + else + return "multiple"; + + +} + +function doWeb(doc, url) { + var articles = new Array(); + + // individual article + if (url.indexOf("abstract") != -1) { + // For some strange reason, replacing /abstract with /pdf/abstract will load a document that has a link to the pdf . . . + if (!url.match(/pdf/) && url.match(/abstract$/)) { + url = url.replace('abstract','pdf/abstract'); + } + articles = [url]; + + Zotero.Utilities.processDocuments(articles, scrape, function() {Zotero.done();}); + Zotero.wait(); + } + else if(url.indexOf("full")!= -1) { + // For some strange reason, replacing /abstract with /pdf/abstract will load a document that has a link to the pdf . . . + if (!url.match(/pdf/) && url.match(/full$/)) { + url = url.replace('full','pdf/full'); + } + articles = [url]; + + Zotero.Utilities.processDocuments(articles, scrape, function() {Zotero.done();}); + Zotero.wait(); + } + // search results / other page + else { + var namespace = doc.documentElement.namespaceURI; + var nsResolver = namespace ? function(prefix) { + if (prefix == 'x') return namespace; else return null; + } : null; + + var items = new Object(); + var noitems = 1; + + var links = doc.evaluate('//div[@class="ArchiveList"]/div/p/a', doc, nsResolver, XPathResult.ANY_TYPE, null); + while (link = links.iterateNext()) { + var url = link.href; + if (url.indexOf("abstract")!= -1) { + if(url.match(/abstract$/)) + url = url.replace('abstract','pdf/abstract'); + items[url] = link.textContent; + noitems=0; + } + else if (url.indexOf("full")!= -1) { + if(url.match(/full$/)) + url = url.replace('full','pdf/full'); + items[url] = link.textContent; + noitems=0; + } + + } + + + var links = doc.evaluate('//div/div/h4/a', doc, nsResolver, XPathResult.ANY_TYPE, null); + while (link = links.iterateNext()) { + var url = link.href; + if (url.indexOf("abstract")!= -1) { + if(url.match(/abstract$/)) + url = url.replace('abstract','pdf/abstract'); + items[url] = link.textContent; + noitems=0; + } + else if (url.indexOf("full")!= -1) { + if(url.match(/full$/)) + url = url.replace('full','pdf/full'); + items[url] = link.textContent; + noitems=0; + } + } + + if (noitems) + return true; + + items = Zotero.selectItems(items); + + for (var i in items) { + articles.push(i); + } + + if (!items) + return true; + + Zotero.Utilities.processDocuments(articles, scrape, function() {Zotero.done();}); + Zotero.wait(); + } +} + +function scrape(doc,url) { + var namespace = doc.documentElement.namespaceURI; + var nsResolver = namespace ? function(prefix) { + if (prefix == 'x') return namespace; else return null; + } : null; + + var newItem = new Zotero.Item("journalArticle"); + + // save the url + newItem.url = doc.location.href; + + //title + var title1 = doc.evaluate('//div[@class="JournalAbstract"]/h1', doc, nsResolver, XPathResult.ANY_TYPE, null).iterateNext(); + + if (title1==null) + title1 = doc.evaluate('//div[@class="JournalAbstract"]/div/h1', doc, nsResolver, XPathResult.ANY_TYPE, null).iterateNext(); + + newItem.title = Zotero.Utilities.trim(title1.textContent); + + // journal name + var docTitle = doc.evaluate('//head/title', doc, nsResolver, XPathResult.ANY_TYPE, null).iterateNext().textContent; + newItem.publicationTitle = Zotero.Utilities.trimInternal(docTitle.split('|')[2]); + + //authors - can be in two ways, depending on which page + var authors = doc.evaluate('//div[@class="authors"]/a', doc, nsResolver, XPathResult.ANY_TYPE,null); + while (author = authors.iterateNext()) { + newItem.creators.push(Zotero.Utilities.cleanAuthor(Zotero.Utilities.trimInternal(author.textContent),"author")); + } + + authors = doc.evaluate('//div[@class="paperauthor"]/a',doc,nsResolver,XPathResult.ANY_TYPE,null); + + while (author = authors.iterateNext()) { + newItem.creators.push(Zotero.Utilities.cleanAuthor(Zotero.Utilities.trimInternal(author.textContent),"author")); + } + + // abstract + var abstract1; + abstract1 = doc.evaluate('//div[@class="JournalAbstract"]/p',doc,nsResolver,XPathResult.ANY_TYPE,null).iterateNext(); + + if (abstract1==null) + abstract1 = doc.evaluate('//div[@class="JournalAbstract"]/div[@class="abstracttext"]',doc,nsResolver,XPathResult.ANY_TYPE,null).iterateNext(); + + if (!(abstract1==null)) + newItem.abstractNote = Zotero.Utilities.trim(abstract1.textContent); + + // Get volume, DOI, pages and year from the citation. It can appear in various places + + var citation1 = doc.evaluate('//div[@class="AbstractSummary"]/p[2]',doc,nsResolver,XPathResult.ANY_TYPE,null).iterateNext(2); + if (citation1!=null) { + if (!citation1.textContent.match(/Citation:/)) + citation1 = null; + } + + if (citation1==null) { + citation1 = doc.evaluate('//div[@class="AbstractSummary"]/p[1]',doc,nsResolver,XPathResult.ANY_TYPE,null).iterateNext(); + if (citation1!=null) { + if (!citation1.textContent.match(/Citation:/)) + citation1 = null; + } + } + + if (citation1==null) { + citation1 = doc.evaluate('//div[@class="metacontainer"]/div[@class="metavalue"][2]',doc,nsResolver,XPathResult.ANY_TYPE,null).iterateNext(2); + if (citation1!=null) { + if (!doc.evaluate('//div[@class="metacontainer"]/div[@class="metakey"][2]',doc,nsResolver,XPathResult.ANY_TYPE,null).iterateNext(2).textContent.match(/Citation:/)) + citation1 = null; + } + } + + if (citation1==null) + citation1 = doc.evaluate('//div[@class="AbstractSummary"]/p',doc,nsResolver,XPathResult.ANY_TYPE,null).iterateNext(2); + + if (citation1.textContent.match(/Received/)) + citation1 = doc.evaluate('//div[@class="metacontainer"]/div[@class="metavalue"]',doc,nsResolver,XPathResult.ANY_TYPE,null).iterateNext(); + + var citation = citation1.textContent; + + if (!(citation==null)) { + // DOI + var doipart = citation.split('doi:')[1]; + if (doipart!=null) + newItem.DOI = Zotero.Utilities.trim(doipart); + var citation2 = citation.match(/:([0-9]*)\./); + // If it has been recently released, there may be no page number + if (citation2!=null) + newItem.pages = citation2[1]; + var citation3 = citation.match(/\((20[0-9][0-9])\)/); + if(citation3!=null) + newItem.date = citation3[1]; + } + + // Look for keywords + var keywords1 = doc.evaluate('//div[@class="AbstractSummary"]/p[1]',doc,nsResolver,XPathResult.ANY_TYPE,null).iterateNext(); + if (keywords1!=null) { + if (!(keywords1.textContent.match(/Keywords/))) + keywords1 = null; + } + var withoutKeywordsColon = 0; + + if (keywords1==null) { + // In these articles, "Keyword:" appears inside a separate div + keywords1 = doc.evaluate('//div[@class="metacontainer"]/div[@class="metavalue"][1]',doc,nsResolver,XPathResult.ANY_TYPE,null).iterateNext(); + withoutKeywordsColon = 1; + } + + if (keywords1 != null) { + + var keywords = keywords1.textContent; + + if(!(keywords == null)) { + var keywordspart = "a,b"; + if (withoutKeywordsColon) + keywordspart = keywords; + else + keywordspart = Zotero.Utilities.trim(keywords.split('Keywords:')[1]); + var keywordsall = keywordspart.split(','); + for (i=0; i