Permalink
Join GitHub today
GitHub is home to over 36 million developers working together to host and review code, manage projects, and build software together.
Sign up
Fetching contributors…
Cannot retrieve contributors at this time
{ | |
"translatorID": "e4fe1596-a8c4-4d09-945f-120c4d83e580", | |
"label": "LA Times", | |
"creator": "Sebastian Karcher", | |
"target": "^https?://(www\\.|travel\\.|articles\\.|latimesblogs\\.)?latimes\\.com", | |
"minVersion": "2.1.9", | |
"maxVersion": "", | |
"priority": 100, | |
"inRepository": true, | |
"translatorType": 4, | |
"browserSupport": "gcsibv", | |
"lastUpdated": "2016-11-07 04:08:21" | |
} | |
/* FW LINE 59:b820c6d */ function flatten(t){var e=new Array;for(var i in t){var r=t[i];r instanceof Array?e=e.concat(flatten(r)):e.push(r)}return e}var FW={_scrapers:new Array};FW._Base=function(){this.callHook=function(t,e,i,r){if("object"==typeof this.hooks){var n=this.hooks[t];"function"==typeof n&&n(e,i,r)}},this.evaluateThing=function(t,e,i){var r=typeof t;if("object"===r){if(t instanceof Array){var n=this.evaluateThing,a=t.map(function(t){return n(t,e,i)});return flatten(a)}return t.evaluate(e,i)}return"function"===r?t(e,i):t},this.makeItems=function(t,e,i,r,n){n()}},FW.Scraper=function(t){FW._scrapers.push(new FW._Scraper(t))},FW._Scraper=function(t){for(x in t)this[x]=t[x];this._singleFieldNames=["abstractNote","applicationNumber","archive","archiveLocation","artworkMedium","artworkSize","assignee","audioFileType","audioRecordingType","billNumber","blogTitle","bookTitle","callNumber","caseName","code","codeNumber","codePages","codeVolume","committee","company","conferenceName","country","court","date","dateDecided","dateEnacted","dictionaryTitle","distributor","docketNumber","documentNumber","DOI","edition","encyclopediaTitle","episodeNumber","extra","filingDate","firstPage","forumTitle","genre","history","institution","interviewMedium","ISBN","ISSN","issue","issueDate","issuingAuthority","journalAbbreviation","label","language","legalStatus","legislativeBody","letterType","libraryCatalog","manuscriptType","mapType","medium","meetingName","nameOfAct","network","number","numberOfVolumes","numPages","pages","patentNumber","place","postType","presentationType","priorityNumbers","proceedingsTitle","programTitle","programmingLanguage","publicLawNumber","publicationTitle","publisher","references","reportNumber","reportType","reporter","reporterVolume","rights","runningTime","scale","section","series","seriesNumber","seriesText","seriesTitle","session","shortTitle","studio","subject","system","thesisType","title","type","university","url","version","videoRecordingType","volume","websiteTitle","websiteType"],this._makeAttachments=function(t,e,i,r){if(i instanceof Array)i.forEach(function(i){this._makeAttachments(t,e,i,r)},this);else if("object"==typeof i){var n=i.urls||i.url,a=i.types||i.type,s=i.titles||i.title,o=i.snapshots||i.snapshot,u=this.evaluateThing(n,t,e),l=this.evaluateThing(s,t,e),c=this.evaluateThing(a,t,e),h=this.evaluateThing(o,t,e);u instanceof Array||(u=[u]);for(var f in u){var p,m,v,d=u[f];p=c instanceof Array?c[f]:c,m=l instanceof Array?l[f]:l,v=h instanceof Array?h[f]:h,r.attachments.push({url:d,title:m,mimeType:p,snapshot:v})}}},this.makeItems=function(t,e,i,r,n){var a=new Zotero.Item(this.itemType);a.url=e;for(var s in this._singleFieldNames){var o=this._singleFieldNames[s];if(this[o]){var u=this.evaluateThing(this[o],t,e);u instanceof Array?a[o]=u[0]:a[o]=u}}var l=["creators","tags"];for(var c in l){var h=l[c],f=this.evaluateThing(this[h],t,e);if(f)for(var p in f)a[h].push(f[p])}this._makeAttachments(t,e,this.attachments,a),r(a,this,t,e),n()}},FW._Scraper.prototype=new FW._Base,FW.MultiScraper=function(t){FW._scrapers.push(new FW._MultiScraper(t))},FW._MultiScraper=function(t){for(x in t)this[x]=t[x];this._mkSelectItems=function(t,e){var i=new Object;for(var r in t)i[e[r]]=t[r];return i},this._selectItems=function(t,e,i){var r=new Array;Zotero.selectItems(this._mkSelectItems(t,e),function(t){for(var e in t)r.push(e);i(r)})},this._mkAttachments=function(t,e,i){var r=this.evaluateThing(this.attachments,t,e),n=new Object;if(r)for(var a in i)n[i[a]]=r[a];return n},this._makeChoices=function(t,e,i,r,n){if(t instanceof Array)t.forEach(function(t){this._makeTitlesUrls(t,e,i,r,n)},this);else if("object"==typeof t){var a=t.urls||t.url,s=t.titles||t.title,o=this.evaluateThing(a,e,i),u=this.evaluateThing(s,e,i),l=u instanceof Array;o instanceof Array||(o=[o]);for(var c in o){var h,f=o[c];h=l?u[c]:u,n.push(f),r.push(h)}}},this.makeItems=function(t,e,i,r,n){if(this.beforeFilter){var a=this.beforeFilter(t,e);if(a!=e)return void this.makeItems(t,a,i,r,n)}var s=[],o=[];this._makeChoices(this.choices,t,e,s,o);var u=this._mkAttachments(t,e,o),l=this.itemTrans;this._selectItems(s,o,function(t){if(t){var e=function(t){var e=t.documentURI,i=l;void 0===i&&(i=FW.getScraper(t,e)),void 0===i||i.makeItems(t,e,u[e],r,function(){})};Zotero.Utilities.processDocuments(t,e,n)}else n()})}},FW._MultiScraper.prototype=new FW._Base,FW.WebDelegateTranslator=function(t){return new FW._WebDelegateTranslator(t)},FW._WebDelegateTranslator=function(t){for(x in t)this[x]=t[x];this.makeItems=function(t,e,i,r,n){var a=this,s=Zotero.loadTranslator("web");s.setHandler("itemDone",function(i,n){r(n,a,t,e)}),s.setDocument(t),this.translatorId?(s.setTranslator(this.translatorId),s.translate()):(s.setHandler("translators",function(t,e){e.length&&(s.setTranslator(e[0]),s.translate())}),s.getTranslators()),n()}},FW._WebDelegateTranslator.prototype=new FW._Base,FW._StringMagic=function(){this._filters=new Array,this.addFilter=function(t){return this._filters.push(t),this},this.split=function(t){return this.addFilter(function(e){return e.split(t).filter(function(t){return""!=t})})},this.replace=function(t,e,i){return this.addFilter(function(r){return r.match(t)?r.replace(t,e,i):r})},this.prepend=function(t){return this.replace(/^/,t)},this.append=function(t){return this.replace(/$/,t)},this.remove=function(t,e){return this.replace(t,"",e)},this.trim=function(){return this.addFilter(function(t){return Zotero.Utilities.trim(t)})},this.trimInternal=function(){return this.addFilter(function(t){return Zotero.Utilities.trimInternal(t)})},this.match=function(t,e){return e||(e=0),this.addFilter(function(i){var r=i.match(t);return void 0===r||null===r?void 0:r[e]})},this.cleanAuthor=function(t,e){return this.addFilter(function(i){return Zotero.Utilities.cleanAuthor(i,t,e)})},this.key=function(t){return this.addFilter(function(e){return e[t]})},this.capitalizeTitle=function(){return this.addFilter(function(t){return Zotero.Utilities.capitalizeTitle(t)})},this.unescapeHTML=function(){return this.addFilter(function(t){return Zotero.Utilities.unescapeHTML(t)})},this.unescape=function(){return this.addFilter(function(t){return unescape(t)})},this._applyFilters=function(t,e){for(i in this._filters){t=flatten(t),t=t.filter(function(t){return void 0!==t&&null!==t});for(var r=0;r<t.length;r++)try{if(void 0===t[r]||null===t[r])continue;t[r]=this._filters[i](t[r],e)}catch(n){t[r]=void 0,Zotero.debug("Caught exception "+n+"on filter: "+this._filters[i])}t=t.filter(function(t){return void 0!==t&&null!==t})}return flatten(t)}},FW.PageText=function(){return new FW._PageText},FW._PageText=function(){this._filters=new Array,this.evaluate=function(t){var e=[t.documentElement.innerHTML];return e=this._applyFilters(e,t),0==e.length?!1:e}},FW._PageText.prototype=new FW._StringMagic,FW.Url=function(){return new FW._Url},FW._Url=function(){this._filters=new Array,this.evaluate=function(t,e){var i=[e];return i=this._applyFilters(i,t),0==i.length?!1:i}},FW._Url.prototype=new FW._StringMagic,FW.Xpath=function(t){return new FW._Xpath(t)},FW._Xpath=function(t){this._xpath=t,this._filters=new Array,this.text=function(){var t=function(t){return"object"==typeof t&&t.textContent?t.textContent:t};return this.addFilter(t),this},this.sub=function(t){var e=function(e,i){var r=i.evaluate(t,e,null,XPathResult.ANY_TYPE,null);return r?r.iterateNext():void 0};return this.addFilter(e),this},this.evaluate=function(t){var e=t.evaluate(this._xpath,t,null,XPathResult.ANY_TYPE,null),i=e.resultType,r=new Array;if(i==XPathResult.STRING_TYPE)r.push(e.stringValue);else if(i==XPathResult.BOOLEAN_TYPE)r.push(e.booleanValue);else if(i==XPathResult.NUMBER_TYPE)r.push(e.numberValue);else if(i==XPathResult.ORDERED_NODE_ITERATOR_TYPE||i==XPathResult.UNORDERED_NODE_ITERATOR_TYPE)for(var n;n=e.iterateNext();)r.push(n);return r=this._applyFilters(r,t),0==r.length?!1:r}},FW._Xpath.prototype=new FW._StringMagic,FW.detectWeb=function(t,e){for(var i in FW._scrapers){var r=FW._scrapers[i],n=r.evaluateThing(r.itemType,t,e),a=r.evaluateThing(r.detect,t,e);if(a.length>0&&a[0])return n}},FW.getScraper=function(t,e){var i=FW.detectWeb(t,e);return FW._scrapers.filter(function(r){return r.evaluateThing(r.itemType,t,e)==i&&r.evaluateThing(r.detect,t,e)})[0]},FW.doWeb=function(t,e){var i=FW.getScraper(t,e);i.makeItems(t,e,[],function(t,e,i,r){e.callHook("scraperDone",t,i,r),t.title||(t.title=""),t.complete()},function(){Zotero.done()}),Zotero.wait()}; | |
function detectWeb(doc, url) { return FW.detectWeb(doc, url); } | |
function doWeb(doc, url) { return FW.doWeb(doc, url); } | |
/* LA Times Translator | |
Copyright (C) 2012 Sebastian Karcher | |
This program is free software: you can redistribute it and/or modify | |
it under the terms of the GNU Affero General Public License as published by | |
the Free Software Foundation, either version 3 of the License, or | |
(at your option) any later version. | |
This program is distributed in the hope that it will be useful, | |
but WITHOUT ANY WARRANTY; without even the implied warranty of | |
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
GNU Affero General Public License for more details. | |
You should have received a copy of the GNU Affero General Public License | |
along with this program. If not, see <http://www.gnu.org/licenses/>. | |
*/ | |
/** Articles is this still used?*/ | |
FW.Scraper({ | |
itemType : 'newspaperArticle', | |
detect : FW.Xpath('//div[@class="story"]/h1'), | |
title : FW.Xpath('//div[@class="story"]/h1').text().trim(), | |
attachments : [{ url: FW.Url(), | |
title: "LA Times Snapshot", | |
type: "text/html" }], | |
creators : FW.Xpath('//span[@class="byline"]').text().replace(/By|,.+/g, "").split(/\s+and\s+/).cleanAuthor("author"), | |
date : FW.Xpath('//meta[@name="date"]/@content').text(), | |
abstractNote : FW.Xpath('//div[@class="story"]/h2').text().trim(), | |
language : FW.Xpath('//meta[@http-equiv="Content-Language"]/@content').text(), | |
ISSN : "0458-3035", | |
publicationTitle : "Los Angeles Times" | |
}); | |
/** Blog Posts */ | |
FW.Scraper({ | |
itemType : 'blogPost', | |
detect : FW.Url().match(/latimesblogs\..+\.html/), | |
title : FW.Xpath('//div[@class="entry"]/h1').text().trim(), | |
attachments : [{ url: FW.Url(), | |
title: "LA Times Snapshot", | |
type: "text/html" }], | |
creators : FW.Xpath('//span[@class="byline"]').text().replace(/By|,.+/g, "").split(/\s+and\s+/).cleanAuthor("author"), | |
date : FW.Xpath('//div[@class="time"]/text()').text().remove(/\|/).trim(), | |
language : "en-US", | |
publicationTitle : FW.Xpath('//div[@id="blog-header"]/h1').text().prepend("LA Times Blogs - ") | |
}); | |
/** Articles Format for articles.latimes.com*/ | |
FW.Scraper({ | |
itemType : 'newspaperArticle', | |
detect : FW.Xpath('//div[contains(@id, "article") or contains(@class, "article")]/h1'), | |
title : FW.Xpath('//div[contains(@id, "article") or contains(@class, "article")]/h1').text().trim(), | |
attachments : [{ url: FW.Url(), | |
title: "LA Times Snapshot", | |
type: "text/html" }], | |
creators : FW.Xpath('//div[contains(@id, "byline")]/span[3]|//div[contains(@class, "byline")]//span[@itemprop="author"]').text().replace(/By|,.+/g, "").split(/\s+and\s+/).cleanAuthor("author"), | |
date : FW.Xpath('//span[@class="pubdate"]/a|//div[@itemprop="datePublished"]/time/@datetime').text(), | |
abstractNote : FW.Xpath('//div[contains(@id, "subtitle")]/h2').text().trim(), | |
language : "en-US", | |
ISSN : "0458-3035", | |
publicationTitle : "Los Angeles Times" | |
}); | |
/**Article format using schema.org*/ | |
FW.Scraper({ | |
itemType : 'newspaperArticle', | |
detect : FW.Xpath('//article[@itemtype="http://schema.org/Article"]//h1[@itemprop="headline"]'), | |
title : FW.Xpath('//h1[@itemprop="headline"]').text().trim(), | |
attachments : [{ url: FW.Url(), | |
title: "LA Times Snapshot", | |
type: "text/html" }], | |
creators : FW.Xpath('//a[@itemprop="author"]').text().replace(/By|,.+/g, "").split(/\s+and\s+/).cleanAuthor("author"), | |
date : FW.Xpath('//time[@itemprop="datePublished"]/@datetime').text(), | |
abstractNote : FW.Xpath('//div[contains(@id, "subtitle")]/h2').text().trim(), | |
language : "en-US", | |
ISSN : "0458-3035", | |
publicationTitle : "Los Angeles Times" | |
}); | |
FW.MultiScraper({ | |
itemType : 'multiple', | |
detect : FW.Url().match(/\/search\//), | |
choices : { | |
titles : FW.Xpath('//div/a[@class="trb_search_result_title"]').text().trim(), | |
urls : FW.Xpath('//div/a[@class="trb_search_result_title"]').key("href") | |
} | |
}); | |
/** BEGIN TEST CASES **/ | |
var testCases = [ | |
{ | |
"type": "web", | |
"url": "http://articles.latimes.com/2012/apr/23/world/la-fg-argentina-oil-nationalize-20120424", | |
"items": [ | |
{ | |
"itemType": "newspaperArticle", | |
"title": "Argentina lawmakers expected to approve oil firm takeover", | |
"creators": [ | |
{ | |
"firstName": "Chris", | |
"lastName": "Kraul", | |
"creatorType": "author" | |
}, | |
{ | |
"firstName": "Andres", | |
"lastName": "d'Alessandro", | |
"creatorType": "author" | |
} | |
], | |
"date": "April 23, 2012", | |
"ISSN": "0458-3035", | |
"abstractNote": "Two polls show strong support for President Cristina Fernandez de Kirchner's proposal for the government to take a majority interest in YPF.", | |
"language": "en-US", | |
"libraryCatalog": "LA Times", | |
"publicationTitle": "Los Angeles Times", | |
"url": "http://articles.latimes.com/2012/apr/23/world/la-fg-argentina-oil-nationalize-20120424", | |
"attachments": [ | |
{ | |
"title": "LA Times Snapshot", | |
"mimeType": "text/html" | |
} | |
], | |
"tags": [], | |
"notes": [], | |
"seeAlso": [] | |
} | |
] | |
}, | |
{ | |
"type": "web", | |
"url": "http://latimesblogs.latimes.com/varsitytimesinsider/2013/06/football-edison-tournament-pairings-create-big-time-matchups.html", | |
"items": [ | |
{ | |
"itemType": "blogPost", | |
"title": "Football: Edison tournament pairings create big-time matchups", | |
"creators": [], | |
"date": "June 25, 2013", | |
"blogTitle": "LA Times Blogs - Varsity Times Insider", | |
"language": "en-US", | |
"shortTitle": "Football", | |
"url": "http://latimesblogs.latimes.com/varsitytimesinsider/2013/06/football-edison-tournament-pairings-create-big-time-matchups.html", | |
"attachments": [ | |
{ | |
"title": "LA Times Snapshot", | |
"mimeType": "text/html" | |
} | |
], | |
"tags": [], | |
"notes": [], | |
"seeAlso": [] | |
} | |
] | |
}, | |
{ | |
"type": "web", | |
"url": "http://www.latimes.com/sports/soccer/la-sp-us-world-cup-mls-20140601-story.html", | |
"items": [ | |
{ | |
"itemType": "newspaperArticle", | |
"title": "World Cup in 1994 gave U.S. soccer the kick in the pants it needed", | |
"creators": [ | |
{ | |
"firstName": "Kevin", | |
"lastName": "Baxter", | |
"creatorType": "author" | |
}, | |
{ | |
"firstName": "Lance", | |
"lastName": "Pugmire", | |
"creatorType": "author" | |
}, | |
{ | |
"firstName": "Sam", | |
"lastName": "Farmer", | |
"creatorType": "author" | |
}, | |
{ | |
"firstName": "John", | |
"lastName": "Cherwa", | |
"creatorType": "author" | |
}, | |
{ | |
"firstName": "Mike", | |
"lastName": "DiGiovanna", | |
"creatorType": "author" | |
}, | |
{ | |
"firstName": "Kevin", | |
"lastName": "Baxter", | |
"creatorType": "author" | |
} | |
], | |
"date": "2014-05-31T16:05:00PDT", | |
"ISSN": "0458-3035", | |
"language": "en-US", | |
"libraryCatalog": "LA Times", | |
"publicationTitle": "Los Angeles Times", | |
"url": "http://www.latimes.com/sports/soccer/la-sp-us-world-cup-mls-20140601-story.html", | |
"attachments": [ | |
{ | |
"title": "LA Times Snapshot", | |
"mimeType": "text/html" | |
} | |
], | |
"tags": [], | |
"notes": [], | |
"seeAlso": [] | |
} | |
] | |
}, | |
{ | |
"type": "web", | |
"url": "http://www.latimes.com/search/dispatcher.front?Query=argentina&target=all&isSearch=true&spell=on", | |
"items": "multiple" | |
} | |
] | |
/** END TEST CASES **/ |