Permalink
Join GitHub today
GitHub is home to over 36 million developers working together to host and review code, manage projects, and build software together.
Sign up
Fetching contributors…
Cannot retrieve contributors at this time
{ | |
"translatorID": "327cacea-9603-4554-91a8-ed0587e0d83a", | |
"label": "JISC Historical Texts", | |
"creator": "Sebastian Karcher", | |
"target": "^https?://(data.)?[^/]*historicaltexts\\.jisc\\.ac\\.uk/(view|results)\\?", | |
"minVersion": "4.0", | |
"maxVersion": "", | |
"priority": 100, | |
"inRepository": true, | |
"translatorType": 4, | |
"browserSupport": "gcsibv", | |
"lastUpdated": "2018-10-12 02:32:08" | |
} | |
/* | |
***** BEGIN LICENSE BLOCK ***** | |
Copyright © 2018 Sebastian Karcher | |
This file is part of Zotero. | |
Zotero is free software: you can redistribute it and/or modify | |
it under the terms of the GNU Affero General Public License as published by | |
the Free Software Foundation, either version 3 of the License, or | |
(at your option) any later version. | |
Zotero is distributed in the hope that it will be useful, | |
but WITHOUT ANY WARRANTY; without even the implied warranty of | |
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
GNU Affero General Public License for more details. | |
You should have received a copy of the GNU Affero General Public License | |
along with Zotero. If not, see <http://www.gnu.org/licenses/>. | |
***** END LICENSE BLOCK ***** | |
*/ | |
// attr()/text() v2 | |
function attr(docOrElem,selector,attr,index){var elem=index?docOrElem.querySelectorAll(selector).item(index):docOrElem.querySelector(selector);return elem?elem.getAttribute(attr):null;}function text(docOrElem,selector,index){var elem=index?docOrElem.querySelectorAll(selector).item(index):docOrElem.querySelector(selector);return elem?elem.textContent:null;} | |
function detectWeb(doc, url) { | |
if (url.includes('/view?')) { | |
return "book"; | |
} else if (url.includes("/results?terms")) { | |
// we don't use getSearchResults so we don't need the DOM object which loads after page load finishes | |
return "multiple"; | |
} | |
} | |
function getSearchResults(doc, checkOnly) { | |
var items = {}; | |
var found = false; | |
var rows = doc.querySelectorAll('a[class*="book-title"]'); | |
for (let i=0; i<rows.length; i++) { | |
let href = rows[i].href; | |
let title = ZU.trimInternal(rows[i].textContent); | |
if (!href || !title) continue; | |
if (checkOnly) return true; | |
found = true; | |
items[href] = title; | |
} | |
return found ? items : false; | |
} | |
function doWeb(doc, url) { | |
if (detectWeb(doc, url) == "multiple") { | |
Zotero.selectItems(getSearchResults(doc, false), function (items) { | |
if (!items) { | |
return true; | |
} | |
var articles = []; | |
for (var i in items) { | |
articles.push(i); | |
} | |
for (let article of articles) { | |
scrape(article); | |
} | |
}); | |
} else { | |
scrape(url); | |
} | |
} | |
function generateJSONUrl(url) { | |
let pubId = url.match(/pubId=([^&]+)/); | |
if (!pubId) return false; | |
else if (pubId[1].startsWith("ukmhl")) { | |
return "https://data.ukmhl.historicaltexts.jisc.ac.uk/elasticsearch/ukmhl/publication/" + pubId[1]; | |
} | |
else if (pubId[1].startsWith("bl-")) { | |
return "https://data.historicaltexts.jisc.ac.uk/elasticsearch/es1/ht/bl/publication/" + pubId[1]; | |
} | |
else if (pubId[1].startsWith("ecco-")) { | |
return "https://data.historicaltexts.jisc.ac.uk/elasticsearch/es1/ht/ecco/publication/" + pubId[1]; | |
} | |
else if (pubId[1].startsWith("eebo-")) { | |
return "https://data.historicaltexts.jisc.ac.uk/elasticsearch/es1/ht/eebo/publication/" + pubId[1]; | |
} | |
else return false; | |
} | |
function scrape(url) { | |
var JSONurl = generateJSONUrl(url); | |
if (!JSONurl) { | |
throw("Can't generate JSON ID"); | |
} | |
ZU.doGet(JSONurl, function(text){ | |
//Z.debug(text); | |
var data = JSON.parse(text); | |
if (data.hits && data.hits.hits.length) { | |
data = data.hits.hits[0]; | |
} | |
var creation = data._source.lifecycle.creation; | |
var publication = data._source.lifecycle.publication[0]; | |
var media = data._source.media[0]; | |
var item = new Zotero.Item("book"); | |
if (creation) { | |
var author = creation[0].author; | |
//Z.debug(author); | |
if (author) { | |
item.creators.push(ZU.cleanAuthor(author[0].name[0].value, "author", true)); | |
} | |
} | |
if (publication) { | |
if (publication.publisher) { | |
item.publisher = publication.publisher[0].name[0].value; | |
} | |
if (publication.place) { | |
item.place = publication.place[0].name[0].value; | |
} | |
if (publication.date) { | |
item.date = publication.date[0].value; | |
} | |
} | |
item.title= data._source.summary_title; | |
item.numPages = media.page_count; | |
if (data._source.edition) { | |
item.edition = data._source.edition[0].statement; | |
} | |
if (data._source.series) { | |
item.volume = data._source.series[0].volume; | |
} | |
var topics = data._source.subjects.topic; | |
if (topics) { | |
for (let topic of topics) { | |
item.tags.push(topic.name[0].value); | |
} | |
} | |
item.url = url.replace(/&.+/, ""); | |
var formats = media.format; | |
var pdfUrl; | |
for (let format of formats) { | |
if (format.type == "pdf") { | |
pdfUrl = "/media/pdf/" + format.location; | |
//Z.debug(pdfUrl); | |
break; | |
} | |
} | |
if (pdfUrl) { | |
item.attachments.push({url: pdfUrl, title: "Historical Text PDF", mimeType: "application/pdf"}); | |
} | |
item.complete(); | |
}); | |
} | |
/** BEGIN TEST CASES **/ | |
var testCases = [ | |
{ | |
"type": "web", | |
"url": "https://data.ukmhl.historicaltexts.jisc.ac.uk/view?pubId=ukmhl-b20392497&pageId=ukmhl-b20392497-1", | |
"items": [ | |
{ | |
"itemType": "book", | |
"title": "Test types for determining the acuteness of vision", | |
"creators": [ | |
{ | |
"firstName": "George", | |
"lastName": "Cowell", | |
"creatorType": "author" | |
} | |
], | |
"date": "189-?", | |
"libraryCatalog": "JISC Historical Texts", | |
"numPages": 4, | |
"place": "London", | |
"publisher": "Printed And Sold By Harrison And Sons", | |
"url": "https://data.ukmhl.historicaltexts.jisc.ac.uk/view?pubId=ukmhl-b20392497", | |
"attachments": [ | |
{ | |
"title": "Historical Text PDF", | |
"mimeType": "application/pdf" | |
} | |
], | |
"tags": [ | |
{ | |
"tag": "Vision Tests" | |
} | |
], | |
"notes": [], | |
"seeAlso": [] | |
} | |
] | |
}, | |
{ | |
"type": "web", | |
"url": "https://data.ukmhl.historicaltexts.jisc.ac.uk/view?pubId=ukmhl-b21304439_0003&pageId=ukmhl-b21304439_0003-1", | |
"items": [ | |
{ | |
"itemType": "book", | |
"title": "A compendium of the anatomy of the human body", | |
"creators": [ | |
{ | |
"firstName": "Andrew", | |
"lastName": "Fyfe", | |
"creatorType": "author" | |
} | |
], | |
"date": "1812-18", | |
"edition": "Fifth edition, enlarged and improved. To which is now added, a fourth volume, containing Outlines of comparative anatomy.", | |
"libraryCatalog": "JISC Historical Texts", | |
"numPages": 350, | |
"place": "Edinburgh", | |
"publisher": "Printed By J. Pillans & Sons For Adam Black ... Etc", | |
"url": "https://data.ukmhl.historicaltexts.jisc.ac.uk/view?pubId=ukmhl-b21304439_0003", | |
"volume": "3", | |
"attachments": [ | |
{ | |
"title": "Historical Text PDF", | |
"mimeType": "application/pdf" | |
} | |
], | |
"tags": [ | |
{ | |
"tag": "Anatomy" | |
}, | |
{ | |
"tag": "Anatomy, Comparative" | |
}, | |
{ | |
"tag": "Bones" | |
}, | |
{ | |
"tag": "Human anatomy" | |
}, | |
{ | |
"tag": "Ligaments" | |
}, | |
{ | |
"tag": "Muscles" | |
} | |
], | |
"notes": [], | |
"seeAlso": [] | |
} | |
] | |
} | |
] | |
/** END TEST CASES **/ |