zotero/translators/JSTOR.js

216 lines
6.3 KiB
JavaScript
Raw Normal View History

{
"translatorID":"d921155f-0186-1684-615c-ca57682ced9b",
"label":"JSTOR",
"creator":"Simon Kornblith, Sean Takats, Michael Berkowitz, and Eli Osherovich",
"target":"https?://[^/]*jstor\\.org[^/]*/(action/(showArticle|doBasicSearch|doAdvancedSearch|doLocatorSearch|doAdvancedResults|doBasicResults)|stable/|pss/)",
"minVersion":"1.0.0b4.r1",
"maxVersion":"",
"priority":100,
"inRepository":"1",
"translatorType":4,
"lastUpdated":"2011-01-12 19:22:04"
}
2009-01-12 03:55:55 +00:00
function detectWeb(doc, url) {
2009-01-14 17:33:14 +00:00
var namespace = doc.documentElement.namespaceURI;
var nsResolver = namespace ? function(prefix) {
2009-01-12 03:55:55 +00:00
if (prefix == 'x') return namespace; else return null;
2009-01-14 17:33:14 +00:00
} : null;
2009-01-14 17:33:14 +00:00
// See if this is a seach results page or Issue content
if (doc.title == "JSTOR: Search Results" || url.match(/\/i\d+/) ||
(url.match(/stable|pss/) // Issues with DOIs can't be identified by URL
&& doc.evaluate('//form[@id="toc"]', doc, nsResolver,
XPathResult.FIRST_ORDERED_NODE_TYPE, null).singleNodeValue)
) {
return "multiple";
2009-01-14 17:33:14 +00:00
} else if(url.indexOf("/search/") != -1) {
return false;
2009-01-14 17:33:14 +00:00
}
2009-01-14 17:33:14 +00:00
// If this is a view page, find the link to the citation
var xpath = '//a[@id="favorites"]';
var elmt = doc.evaluate(xpath, doc, nsResolver, XPathResult.FIRST_ORDERED_NODE_TYPE, null).singleNodeValue;
if(elmt || url.match(/pss/)) {
2009-01-12 03:55:55 +00:00
return "journalArticle";
2009-01-14 17:33:14 +00:00
}
}
2009-08-19 22:10:19 +00:00
Zotero.Utilities.processAsync = function (sets, callbacks, onDone) {
var currentSet;
var index = 0;
var nextSet = function () {
if (!sets.length) {
onDone();
return;
}
index = 0;
currentSet = sets.shift();
callbacks[0](currentSet, nextCallback);
};
var nextCallback = function () {
index++;
callbacks[index](currentSet, nextCallback);
};
// Add a final callback to proceed to the next set
callbacks[callbacks.length] = function () {
nextSet();
}
nextSet();
}
function doWeb(doc, url) {
2009-01-14 17:33:14 +00:00
var namespace = doc.documentElement.namespaceURI;
var nsResolver = namespace ? function(prefix) {
2009-01-12 03:55:55 +00:00
if (prefix == 'x') return namespace; else return null;
2009-01-14 17:33:14 +00:00
} : null;
2009-01-14 17:33:14 +00:00
var host = doc.location.host;
// If this is a view page, find the link to the citation
var xpath = '//a[@id="favorites"]';
var elmt = doc.evaluate(xpath, doc, nsResolver, XPathResult.FIRST_ORDERED_NODE_TYPE, null).singleNodeValue;
var allJids = new Array();
if (elmt && /jid=10\.2307%2F(\d+)/.test(elmt.href)) {
2009-01-12 03:55:55 +00:00
allJids.push(RegExp.$1);
2009-08-19 22:10:19 +00:00
var jid = RegExp.$1;
2009-01-12 03:55:55 +00:00
Zotero.debug("JID found 1 " + jid);
2009-01-14 17:33:14 +00:00
}
// Sometimes JSTOR uses DOIs as JID; here we exclude "?" characters, since it's a URL
// And exclude TOC for journal issues that have their own DOI
else if (/(?:pss|stable)\/(10\.\d+\/.+)(?:\?.*)?/.test(url)
&& !doc.evaluate('//form[@id="toc"]', doc, nsResolver,
XPathResult.FIRST_ORDERED_NODE_TYPE, null).singleNodeValue) {
Zotero.debug("URL " + url);
jid = RegExp.$1;
allJids.push(jid);
Zotero.debug("JID found 2 " + jid);
}
else if (/(?:pss|stable)\/(\d+)/.test(url)
&& !doc.evaluate('//form[@id="toc"]', doc, nsResolver,
XPathResult.FIRST_ORDERED_NODE_TYPE, null).singleNodeValue) {
2009-01-12 03:55:55 +00:00
Zotero.debug("URL " + url);
2009-08-19 22:10:19 +00:00
jid = RegExp.$1;
allJids.push(jid);
2009-01-12 03:55:55 +00:00
Zotero.debug("JID found 2 " + jid);
2009-01-14 17:33:14 +00:00
}
else {
2009-01-12 03:55:55 +00:00
// We have multiple results
var resultsBlock = doc.evaluate('//fieldset[@id="results"]', doc, nsResolver, XPathResult.FIRST_ORDERED_NODE_TYPE, null).singleNodeValue;
if (! resultsBlock) {
2009-01-14 17:33:14 +00:00
return true;
2009-01-12 03:55:55 +00:00
}
var allTitlesElmts = doc.evaluate('//li//a[@class="title"]', resultsBlock, nsResolver, XPathResult.ANY_TYPE, null);
2009-01-12 03:55:55 +00:00
var currTitleElmt;
var availableItems = new Object();
while (currTitleElmt = allTitlesElmts.iterateNext()) {
2009-01-14 17:33:14 +00:00
var title = currTitleElmt.textContent;
// Sometimes JSTOR uses DOIs as JID; here we exclude "?" characters, since it's a URL
if (/(?:pss|stable)\/(10\.\d+\/.+)(?:\?.*)?/.test(currTitleElmt.href))
var jid = RegExp.$1;
else
var jid = currTitleElmt.href.match(/(?:stable|pss)\/([a-z]*?\d+)/)[1];
2009-01-14 17:33:14 +00:00
if (jid) {
availableItems[jid] = title;
2009-01-14 17:33:14 +00:00
}
Zotero.debug("Found title " + title+jid);
2009-01-12 03:55:55 +00:00
}
Zotero.debug("End of titles");
2009-01-12 03:55:55 +00:00
var selectedItems = Zotero.selectItems(availableItems);
if (!selectedItems) {
2009-01-14 17:33:14 +00:00
return true;
}
2009-01-12 03:55:55 +00:00
for (var j in selectedItems) {
2009-01-14 17:33:14 +00:00
Zotero.debug("Pushing " + j);
allJids.push(j);
2009-01-12 03:55:55 +00:00
}
2009-01-14 17:33:14 +00:00
}
2009-08-19 22:10:19 +00:00
var sets = [];
for each(var jid in allJids) {
sets.push({ jid: jid });
}
function first(set, next) {
var jid = set.jid;
var downloadString = "suffix=" + jid;
Zotero.Utilities.HTTP.doPost("http://"+host+"/action/downloadSingleCitation?format=refman&direct=true&singleCitation=true", downloadString, function(text) {
// load translator for RIS
var translator = Zotero.loadTranslator("import");
translator.setTranslator("32d59d2d-b65a-4da4-b0a3-bdd3cfb979e7");
translator.setString(text);
translator.setHandler("itemDone", function(obj, item) {
if(item.notes && item.notes[0]) {
// For some reason JSTOR exports abstract with 'AB' tag istead of 'N1'
item.abstractNote = item.notes[0].note;
delete item.notes;
item.notes = undefined;
}
2009-01-14 17:33:14 +00:00
2009-08-19 22:10:19 +00:00
// Don't save HTML snapshot from 'UR' tag
item.attachments = [];
2009-01-14 17:33:14 +00:00
2009-08-19 22:10:19 +00:00
set.doi = "10.2307/" + jid;
2009-08-19 22:10:19 +00:00
if (/stable\/(\d+)/.test(item.url)) {
2010-08-22 06:34:41 +00:00
var pdfurl = "http://"+ host + "/stable/pdfplus/" + jid + ".pdf?acceptTC=true";
2009-08-19 22:10:19 +00:00
item.attachments.push({url:pdfurl, title:"JSTOR Full Text PDF", mimeType:"application/pdf"});
}
set.item = item;
next();
2009-01-14 17:33:14 +00:00
});
2009-08-19 22:10:19 +00:00
translator.translate();
2009-01-14 17:33:14 +00:00
});
}
2009-08-19 22:10:19 +00:00
function second(set, next) {
var item = set.item;
if (!set.doi) {
item.complete();
next();
}
var doi = set.doi;
var crossrefURL = "http://www.crossref.org/openurl/?req_dat=zter:zter321&url_ver=Z39.88-2004&ctx_ver=Z39.88-2004&rft_id=info%3Adoi/"+doi+"&noredirect=true&format=unixref";
Zotero.Utilities.HTTP.doGet(crossrefURL, function (text) {
text = text.replace(/<\?xml[^>]*\?>/, "");
// parse XML with E4X
try {
2009-08-19 22:10:19 +00:00
var xml = new XML(text);
} catch(e) {
2009-08-19 22:10:19 +00:00
item.complete();
next();
return;
}
var doi = xml..doi.toString();
// ensure DOI is valid
if(!xml..error.length()) {
2009-08-19 22:10:19 +00:00
Zotero.debug("DOI is valid");
item.DOI = doi;
}
2009-08-19 22:10:19 +00:00
item.complete();
next();
});
}
2009-08-19 22:10:19 +00:00
var callbacks = [first, second];
Zotero.Utilities.processAsync(sets, callbacks, function () { Zotero.done(); });
Zotero.wait();
}