Initial Commit
This commit is contained in:
327
translators/Galegroup.js
Normal file
327
translators/Galegroup.js
Normal file
@@ -0,0 +1,327 @@
|
||||
{
|
||||
"translatorID": "4ea89035-3dc4-4ae3-b22d-726bc0d83a64",
|
||||
"label": "Galegroup",
|
||||
"creator": "Sebastian Karcher and Aurimas Vinckevicius",
|
||||
"target": "^https?://(find\\.galegroup\\.com/|go\\.galegroup\\.com/gdsc)",
|
||||
"minVersion": "3.0",
|
||||
"maxVersion": "",
|
||||
"priority": 100,
|
||||
"inRepository": true,
|
||||
"translatorType": 4,
|
||||
"browserSupport": "gcsibv",
|
||||
"lastUpdated": "2018-10-07 16:06:56"
|
||||
}
|
||||
|
||||
/*
|
||||
***** BEGIN LICENSE BLOCK *****
|
||||
|
||||
Galegroup Translator - Copyright © 2012-2018 Sebastian Karcher
|
||||
This file is part of Zotero.
|
||||
|
||||
Zotero is free software: you can redistribute it and/or modify
|
||||
it under the terms of the GNU Affero General Public License as published by
|
||||
the Free Software Foundation, either version 3 of the License, or
|
||||
(at your option) any later version.
|
||||
|
||||
Zotero is distributed in the hope that it will be useful,
|
||||
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||
GNU Affero General Public License for more details.
|
||||
|
||||
You should have received a copy of the GNU Affero General Public License
|
||||
along with Zotero. If not, see <http://www.gnu.org/licenses/>.
|
||||
|
||||
***** END LICENSE BLOCK *****
|
||||
*/
|
||||
|
||||
var composeAttachment = composeAttachmentDefault;
|
||||
var composeRisUrl = composeRisUrlDefault;
|
||||
|
||||
function getSearchResults(doc) {
|
||||
// Default
|
||||
var results = ZU.xpath(doc, '//*[@id="SearchResults"]//section[@class="resultsBody"]/ul/li');
|
||||
if (results.length) {
|
||||
results.linkXPath = './p[@class="subTitle"]/a';
|
||||
Z.debug("Default Layout");
|
||||
return results;
|
||||
}
|
||||
|
||||
// Ecco
|
||||
results = ZU.xpath(doc, '//div[@id="resultsBox"]//li[@class="resrow"]');
|
||||
if (results.length) {
|
||||
results.linkXPath = './/div[@class="pic_Title"]/a';
|
||||
Z.debug("Ecco, but using Default");
|
||||
return results;
|
||||
}
|
||||
|
||||
// Time Literary Supplement & Times Digital Archive
|
||||
results = ZU.xpath(doc, '//div[@id="results_list"]/ul[@class="resultsListBox"]');
|
||||
if (results.length) {
|
||||
results.linkXPath = './/p[@class="articleTitle"]//a';
|
||||
if (doc.title.includes("The Times Digital Archive")) {
|
||||
Z.debug("Times Digital Archive");
|
||||
composeRisUrl = composeRisUrlTDA;
|
||||
}
|
||||
else {
|
||||
composeRisUrl = composeRisUrlGNV;
|
||||
Z.debug("TLS, but using GNV/TDA combo");
|
||||
}
|
||||
composeAttachment = composeAttachmentTDA;
|
||||
|
||||
return results;
|
||||
}
|
||||
|
||||
|
||||
// Archives Unbound
|
||||
results = ZU.xpath(doc, '//div[@id="resultsTable"]/div');
|
||||
if (results.length) {
|
||||
results.linkXPath = './/span[@class="title"]//a';
|
||||
Z.debug("Archives Unbound, but using Default");
|
||||
return results;
|
||||
}
|
||||
|
||||
// Gale NewsVault
|
||||
results = ZU.xpath(doc, '//*[@id="results_list"]/div[contains(@class,"resultList")]');
|
||||
if (results.length) {
|
||||
results.linkXPath = './div[@class="pub_details"]//li[@class="resultInfo"]/p//a';
|
||||
Z.debug("Using GNV");
|
||||
composeAttachment = composeAttachmentGNV;
|
||||
composeRisUrl = composeRisUrlGNV;
|
||||
return results;
|
||||
}
|
||||
|
||||
// LegalTrac (not sure this still exists 2018-09-24)
|
||||
results = ZU.xpath(doc, '//*[@id="sr_ul"]/li');
|
||||
if (results.length) {
|
||||
results.linkXPath = './/span[@class="title"]/a';
|
||||
Z.debug("LegalTrac, but using Default");
|
||||
return results;
|
||||
}
|
||||
|
||||
return [];
|
||||
}
|
||||
|
||||
function detectWeb(doc, url) {
|
||||
if (url.includes('/newspaperRetrieve.do')) {
|
||||
return "newspaperArticle";
|
||||
}
|
||||
|
||||
if (url.includes('/retrieve.do') || url.includes('/i.do') || url.includes('/infomark.do')) {
|
||||
if (url.includes('/ecco/')) return "book";
|
||||
else if (url.includes('prodId=TLSH') || url.includes('prodID=TTDA') || url.includes('prodID=DVNW')) {
|
||||
return "newspaperArticle";
|
||||
}
|
||||
return "journalArticle";
|
||||
}
|
||||
|
||||
if (getSearchResults(doc).length) return "multiple";
|
||||
}
|
||||
|
||||
|
||||
|
||||
function composeRisUrlGNV(url) {
|
||||
let baseUrl = url.replace(/#.*/,'').replace(/\/[^\/?]+\?.+/, '/centralizedGenerateCitation.do?');
|
||||
let userGroupName = url.match(/userGroupName=[^&]+/)[0];
|
||||
let prodId = url.match(/prodId=[^&]+/)[0];
|
||||
let tabID = url.match(/tabID=[^&]+/)[0];
|
||||
let docId = url.match(/docId=[^&]+/);
|
||||
if (docId) {
|
||||
docId = docId[0];
|
||||
}
|
||||
else {
|
||||
docId = url.match(/relevancePageBatch=[^&]+/)[0].replace(/relevancePageBatch/, "docId");
|
||||
}
|
||||
let contentSet= url.match(/contentSet=[^&]+/)[0];
|
||||
return baseUrl + "actionString=FormatCitation&inPS=true&citationFormat=ENDNOTE" + "&" + userGroupName + "&" + contentSet +"&" + docId + "&" + prodId + "&" + tabID;
|
||||
|
||||
}
|
||||
|
||||
function composeRisUrlDefault(url) {
|
||||
return url.replace(/#.*/,'').replace(/\/[^\/?]+(?=\?|$)/, '/generateCitation.do')
|
||||
.replace(/\bactionString=[^&]*&?/g, '').replace(/\bcitationFormat=[^&]*&?/g, '')
|
||||
.replace(/\&u=/, "&userGroupName=").replace(/\&id=/, "&docId=") //for bookmarked pages
|
||||
+ '&actionString=FormatCitation&citationFormat=ENDNOTE';
|
||||
}
|
||||
|
||||
// The Times Digital Archive
|
||||
function composeRisUrlTDA(url) {
|
||||
if (url.indexOf('relevancePageBatch=') != -1) {
|
||||
url = url.replace(/\bdocId=[^&]*&?/g, "").replace(/\&relevancePageBatch=/, "&docId=");
|
||||
}
|
||||
return url.replace(/#.*/,'').replace(/\/[^\/?]+(?=\?|$)/, '/generateCitation.do')
|
||||
.replace(/\bactionString=[^&]*&?/g, '').replace(/\bcitationFormat=[^&]*&?/g, '')
|
||||
+ '&actionString=FormatCitation&citationFormat=ENDNOTE';
|
||||
}
|
||||
|
||||
|
||||
|
||||
function composeAttachmentDefault(doc, url) {
|
||||
var pdf = !!(doc.getElementById('pdfLink') || doc.getElementById('docTools-pdf'));
|
||||
var attachment = ZU.xpath(doc, '//*[@id="docTools-download"]/a[./@href]')[0];
|
||||
if (attachment && pdf ) {
|
||||
url = attachment.href;
|
||||
return {
|
||||
url: url.replace(/#.*/, '').replace(/\/[^\/?]+(?=\?|$)/, '/downloadDocument.do')
|
||||
.replace(/\b(?:actionCmd|downloadFormat)=[^&]*&?/g, '')
|
||||
+ '&actionCmd=DO_DOWNLOAD_DOCUMENT&downloadFormat=' + (pdf?'PDF':'HTML'),
|
||||
title: "Full Text " + (pdf?'PDF':'HTML'),
|
||||
mimeType: pdf?'application/pdf':'text/html'
|
||||
};
|
||||
} else {
|
||||
return {document: doc, title: "Snapshot"};
|
||||
}
|
||||
}
|
||||
|
||||
|
||||
|
||||
function composeAttachmentGNV(doc, url) {
|
||||
var lowerLimit = ZU.xpathText(doc, '//form[@id="resultsForm"]/input[@name="pdfLowerLimit"]/@value') || '1';
|
||||
var upperLimit = ZU.xpathText(doc, '//form[@id="resultsForm"]/input[@name="pdfHigherLimit"]/@value') || lowerLimit;
|
||||
var numPages = ZU.xpathText(doc, '//form[@id="resultsForm"]/input[@name="noOfPages"]/@value') || (upperLimit - lowerLimit + 1);
|
||||
var pdfUrl = url.replace(/#.*/,'').replace(/\/[^\/?]+(?=\?|$)/, '/downloadDocument.do')
|
||||
.replace(/\b(?:scale|orientation|docType|pageIndex|relatedDocId|isIllustration|imageId|aCmnd|recNum|pageRange|noOfPages)=[^&]*&?/g, '')
|
||||
+ '&scale=&orientation=&docType=&pageIndex=1&relatedDocId=&isIllustration=false'
|
||||
+ '&imageId=&aCmnd=PDFFormat&recNum=&' + 'noOfPages=' + numPages + '&pageRange=' + lowerLimit + '-' + upperLimit;
|
||||
|
||||
Z.debug(pdfUrl);
|
||||
return {
|
||||
url: pdfUrl,
|
||||
title: 'Full Text PDF',
|
||||
mimeType: 'application/pdf'
|
||||
};
|
||||
}
|
||||
|
||||
function composeAttachmentTDA(doc, url) {
|
||||
if (url.indexOf('relevancePageBatch=') != -1) {
|
||||
url = url.replace(/\bdocId=[^&]*&?/g, "").replace(/\&relevancePageBatch=/, "&docId=");
|
||||
}
|
||||
return composeAttachmentGNV(doc, url);
|
||||
}
|
||||
|
||||
function parseRis(text, attachment) {
|
||||
text = text.trim();
|
||||
// gale puts issue numbers in M1
|
||||
text = text.replace(/M1\s*\-/g, "IS -");
|
||||
// L2 is probably meant to be UR, but we can ignore it altogether
|
||||
text = text.replace(/^L2\s+-.+\n/gm, '');
|
||||
// we can map copyright notes via CR
|
||||
text = text.replace(/^N1(?=\s+-\s+copyright)/igm, 'CR');
|
||||
// Z.debug(text);
|
||||
|
||||
var translator = Zotero.loadTranslator("import");
|
||||
translator.setTranslator("32d59d2d-b65a-4da4-b0a3-bdd3cfb979e7");
|
||||
translator.setString(text);
|
||||
translator.setHandler("itemDone", function (obj, item) {
|
||||
if (attachment) item.attachments.push(attachment);
|
||||
if (item.ISSN) {
|
||||
item.ISSN = ZU.cleanISSN(item.ISSN);
|
||||
}
|
||||
if (item.pages && item.pages.endsWith("+")) {
|
||||
item.pages = item.pages.replace(/\+/, "-");
|
||||
}
|
||||
item.complete();
|
||||
});
|
||||
translator.translate();
|
||||
}
|
||||
|
||||
function processArticles(articles) {
|
||||
var article;
|
||||
while (article = articles.shift()) {
|
||||
ZU.processDocuments(article, function(doc, url) {
|
||||
processPage(doc, url);
|
||||
processArticles(articles);
|
||||
});
|
||||
}
|
||||
}
|
||||
|
||||
function processPage(doc, url) {
|
||||
var attachment = composeAttachment(doc, url);
|
||||
Z.debug(composeRisUrl(url))
|
||||
ZU.doGet(composeRisUrl(url), function(text) {
|
||||
parseRis(text, attachment);
|
||||
});
|
||||
}
|
||||
|
||||
function doWeb(doc, url) {
|
||||
if (detectWeb(doc, url) == "multiple") {
|
||||
var results = getSearchResults(doc);
|
||||
var items = {};
|
||||
for (var i=0, n=results.length; i<n; i++) {
|
||||
var link = ZU.xpath(results[i], results.linkXPath)[0];
|
||||
if (!link) continue;
|
||||
|
||||
items[link.href] = ZU.trimInternal(link.textContent);
|
||||
}
|
||||
|
||||
Zotero.selectItems(items, function (items) {
|
||||
if (!items) return true;
|
||||
|
||||
var articles = [];
|
||||
for (var i in items) {
|
||||
articles.push(i);
|
||||
}
|
||||
processArticles(articles);
|
||||
});
|
||||
} else {
|
||||
if (doc.title.includes('NewsVault')) {
|
||||
Z.debug("Using GNV");
|
||||
composeAttachment = composeAttachmentGNV;
|
||||
composeRisUrl = composeRisUrlGNV;
|
||||
} else if (doc.title.includes('Times Literary Supplement')) {
|
||||
Z.debug("Times Literary Supplment Using GNV/TDA");
|
||||
composeAttachment = composeAttachmentTDA;
|
||||
composeRisUrl = composeRisUrlGNV;
|
||||
|
||||
} else if (doc.title.includes('The Times Digital Archive')) {
|
||||
Z.debug("Using TDA");
|
||||
composeAttachment = composeAttachmentTDA;
|
||||
composeRisUrl = composeRisUrlTDA;
|
||||
} else if (doc.title.includes('Eighteenth Century Collections Online')) {
|
||||
Z.debug("Using Ecco (Default)");
|
||||
// keeping this separate as there is a different attachment logic
|
||||
// we might want to use that in the future.
|
||||
} else {
|
||||
Z.debug("Using Default");
|
||||
}
|
||||
|
||||
processPage(doc, url);
|
||||
}
|
||||
}
|
||||
|
||||
/** BEGIN TEST CASES **/
|
||||
var testCases = [
|
||||
{
|
||||
"type": "web",
|
||||
"url": "http://find.galegroup.com/tlsh/infomark.do?&source=gale&prodId=TLSH&userGroupName=nysl_ce_syr&tabID=T003&docPage=article&searchType=&docId=EX1200180081&type=multipage&contentSet=LTO&version=1.0",
|
||||
"items": [
|
||||
{
|
||||
"itemType": "newspaperArticle",
|
||||
"title": "Science in 1901",
|
||||
"creators": [
|
||||
{
|
||||
"lastName": "Ross",
|
||||
"firstName": "Hugh Munro",
|
||||
"creatorType": "author"
|
||||
}
|
||||
],
|
||||
"date": "January 17, 1902",
|
||||
"archive": "Times Literary Supplement Historical Archive",
|
||||
"libraryCatalog": "Gale",
|
||||
"pages": "5+",
|
||||
"place": "London, England",
|
||||
"publicationTitle": "The Times Literary Supplement",
|
||||
"url": "http://find.galegroup.com/tlsh/infomark.do?&source=gale&prodId=TLSH&userGroupName=nysl_ce_syr&tabID=T003&docPage=article&searchType=&docId=EX1200180081&type=multipage&contentSet=LTO&version=1.0",
|
||||
"attachments": [
|
||||
{
|
||||
"title": "Full Text PDF",
|
||||
"mimeType": "application/pdf"
|
||||
}
|
||||
],
|
||||
"tags": [],
|
||||
"notes": [],
|
||||
"seeAlso": []
|
||||
}
|
||||
]
|
||||
}
|
||||
]
|
||||
/** END TEST CASES **/
|
||||
Reference in New Issue
Block a user