Permalink
Join GitHub today
GitHub is home to over 31 million developers working together to host and review code, manage projects, and build software together.
Sign up
translators/JISC Historical Texts.js
Find file
Copy path
Fetching contributors…
Cannot retrieve contributors at this time
{ | |
"translatorID": "327cacea-9603-4554-91a8-ed0587e0d83a", | |
"label": "JISC Historical Texts", | |
"creator": "Sebastian Karcher", | |
"target": "^https?://(data.)?[^/]*historicaltexts\\.jisc\\.ac\\.uk/(view|results)\\?", | |
"minVersion": "4.0", | |
"maxVersion": "", | |
"priority": 100, | |
"inRepository": true, | |
"translatorType": 4, | |
"browserSupport": "gcsibv", | |
"lastUpdated": "2018-10-12 02:32:08" | |
} | |
/* | |
***** BEGIN LICENSE BLOCK ***** | |
Copyright © 2018 Sebastian Karcher | |
This file is part of Zotero. | |
Zotero is free software: you can redistribute it and/or modify | |
it under the terms of the GNU Affero General Public License as published by | |
the Free Software Foundation, either version 3 of the License, or | |
(at your option) any later version. | |
Zotero is distributed in the hope that it will be useful, | |
but WITHOUT ANY WARRANTY; without even the implied warranty of | |
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
GNU Affero General Public License for more details. | |
You should have received a copy of the GNU Affero General Public License | |
along with Zotero. If not, see <http://www.gnu.org/licenses/>. | |
***** END LICENSE BLOCK ***** | |
*/ | |
// attr()/text() v2 | |
function attr(docOrElem,selector,attr,index){var elem=index?docOrElem.querySelectorAll(selector).item(index):docOrElem.querySelector(selector);return elem?elem.getAttribute(attr):null;}function text(docOrElem,selector,index){var elem=index?docOrElem.querySelectorAll(selector).item(index):docOrElem.querySelector(selector);return elem?elem.textContent:null;} | |
function detectWeb(doc, url) { | |
if (url.includes('/view?')) { | |
return "book"; | |
} else if (url.includes("/results?terms")) { | |
// we don't use getSearchResults so we don't need the DOM object which loads after page load finishes | |
return "multiple"; | |
} | |
} | |
function getSearchResults(doc, checkOnly) { | |
var items = {}; | |
var found = false; | |
var rows = doc.querySelectorAll('a[class*="book-title"]'); | |
for (let i=0; i<rows.length; i++) { | |
let href = rows[i].href; | |
let title = ZU.trimInternal(rows[i].textContent); | |
if (!href || !title) continue; | |
if (checkOnly) return true; | |
found = true; | |
items[href] = title; | |
} | |
return found ? items : false; | |
} | |
function doWeb(doc, url) { | |
if (detectWeb(doc, url) == "multiple") { | |
Zotero.selectItems(getSearchResults(doc, false), function (items) { | |
if (!items) { | |
return true; | |
} | |
var articles = []; | |
for (var i in items) { | |
articles.push(i); | |
} | |
for (let article of articles) { | |
scrape(article); | |
} | |
}); | |
} else { | |
scrape(url); | |
} | |
} | |
function generateJSONUrl(url) { | |
let pubId = url.match(/pubId=([^&]+)/); | |
if (!pubId) return false; | |
else if (pubId[1].startsWith("ukmhl")) { | |
return "https://data.ukmhl.historicaltexts.jisc.ac.uk/elasticsearch/ukmhl/publication/" + pubId[1]; | |
} | |
else if (pubId[1].startsWith("bl-")) { | |
return "https://data.historicaltexts.jisc.ac.uk/elasticsearch/es1/ht/bl/publication/" + pubId[1]; | |
} | |
else if (pubId[1].startsWith("ecco-")) { | |
return "https://data.historicaltexts.jisc.ac.uk/elasticsearch/es1/ht/ecco/publication/" + pubId[1]; | |
} | |
else if (pubId[1].startsWith("eebo-")) { | |
return "https://data.historicaltexts.jisc.ac.uk/elasticsearch/es1/ht/eebo/publication/" + pubId[1]; | |
} | |
else return false; | |
} | |
function scrape(url) { | |
var JSONurl = generateJSONUrl(url); | |
if (!JSONurl) { | |
throw("Can't generate JSON ID"); | |
} | |
ZU.doGet(JSONurl, function(text){ | |
//Z.debug(text); | |
var data = JSON.parse(text); | |
if (data.hits && data.hits.hits.length) { | |
data = data.hits.hits[0]; | |
} | |
var creation = data._source.lifecycle.creation; | |
var publication = data._source.lifecycle.publication[0]; | |
var media = data._source.media[0]; | |
var item = new Zotero.Item("book"); | |
if (creation) { | |
var author = creation[0].author; | |
//Z.debug(author); | |
if (author) { | |
item.creators.push(ZU.cleanAuthor(author[0].name[0].value, "author", true)); | |
} | |
} | |
if (publication) { | |
if (publication.publisher) { | |
item.publisher = publication.publisher[0].name[0].value; | |
} | |
if (publication.place) { | |
item.place = publication.place[0].name[0].value; | |
} | |
if (publication.date) { | |
item.date = publication.date[0].value; | |
} | |
} | |
item.title= data._source.summary_title; | |
item.numPages = media.page_count; | |
if (data._source.edition) { | |
item.edition = data._source.edition[0].statement; | |
} | |
if (data._source.series) { | |
item.volume = data._source.series[0].volume; | |
} | |
var topics = data._source.subjects.topic; | |
if (topics) { | |
for (let topic of topics) { | |
item.tags.push(topic.name[0].value); | |
} | |
} | |
item.url = url.replace(/&.+/, ""); | |
var formats = media.format; | |
var pdfUrl; | |
for (let format of formats) { | |
if (format.type == "pdf") { | |
pdfUrl = "/media/pdf/" + format.location; | |
//Z.debug(pdfUrl); | |
break; | |
} | |
} | |
if (pdfUrl) { | |
item.attachments.push({url: pdfUrl, title: "Historical Text PDF", mimeType: "application/pdf"}); | |
} | |
item.complete(); | |
}); | |
} | |
/** BEGIN TEST CASES **/ | |
var testCases = [ | |
{ | |
"type": "web", | |
"url": "https://data.ukmhl.historicaltexts.jisc.ac.uk/view?pubId=ukmhl-b20392497&pageId=ukmhl-b20392497-1", | |
"items": [ | |
{ | |
"itemType": "book", | |
"title": "Test types for determining the acuteness of vision", | |
"creators": [ | |
{ | |
"firstName": "George", | |
"lastName": "Cowell", | |
"creatorType": "author" | |
} | |
], | |
"date": "189-?", | |
"libraryCatalog": "JISC Historical Texts", | |
"numPages": 4, | |
"place": "London", | |
"publisher": "Printed And Sold By Harrison And Sons", | |
"url": "https://data.ukmhl.historicaltexts.jisc.ac.uk/view?pubId=ukmhl-b20392497", | |
"attachments": [ | |
{ | |
"title": "Historical Text PDF", | |
"mimeType": "application/pdf" | |
} | |
], | |
"tags": [ | |
{ | |
"tag": "Vision Tests" | |
} | |
], | |
"notes": [], | |
"seeAlso": [] | |
} | |
] | |
}, | |
{ | |
"type": "web", | |
"url": "https://data.ukmhl.historicaltexts.jisc.ac.uk/view?pubId=ukmhl-b21304439_0003&pageId=ukmhl-b21304439_0003-1", | |
"items": [ | |
{ | |
"itemType": "book", | |
"title": "A compendium of the anatomy of the human body", | |
"creators": [ | |
{ | |
"firstName": "Andrew", | |
"lastName": "Fyfe", | |
"creatorType": "author" | |
} | |
], | |
"date": "1812-18", | |
"edition": "Fifth edition, enlarged and improved. To which is now added, a fourth volume, containing Outlines of comparative anatomy.", | |
"libraryCatalog": "JISC Historical Texts", | |
"numPages": 350, | |
"place": "Edinburgh", | |
"publisher": "Printed By J. Pillans & Sons For Adam Black ... Etc", | |
"url": "https://data.ukmhl.historicaltexts.jisc.ac.uk/view?pubId=ukmhl-b21304439_0003", | |
"volume": "3", | |
"attachments": [ | |
{ | |
"title": "Historical Text PDF", | |
"mimeType": "application/pdf" | |
} | |
], | |
"tags": [ | |
{ | |
"tag": "Anatomy" | |
}, | |
{ | |
"tag": "Anatomy, Comparative" | |
}, | |
{ | |
"tag": "Bones" | |
}, | |
{ | |
"tag": "Human anatomy" | |
}, | |
{ | |
"tag": "Ligaments" | |
}, | |
{ | |
"tag": "Muscles" | |
} | |
], | |
"notes": [], | |
"seeAlso": [] | |
} | |
] | |
} | |
] | |
/** END TEST CASES **/ |