275 lines
7.8 KiB
JavaScript
275 lines
7.8 KiB
JavaScript
|
{
|
|||
|
"translatorID": "82b534ea-abf0-4527-9d5d-48cd98a89ba5",
|
|||
|
"label": "Sacramento Bee",
|
|||
|
"creator": "czar",
|
|||
|
"target": "^https?://(www\\.)?sacbee\\.com",
|
|||
|
"minVersion": "3.0",
|
|||
|
"maxVersion": "",
|
|||
|
"priority": 100,
|
|||
|
"inRepository": true,
|
|||
|
"translatorType": 4,
|
|||
|
"browserSupport": "gcsibv",
|
|||
|
"lastUpdated": "2017-07-09 05:05:18"
|
|||
|
}
|
|||
|
|
|||
|
/*
|
|||
|
***** BEGIN LICENSE BLOCK *****
|
|||
|
|
|||
|
Copyright © 2017 czar
|
|||
|
http://en.wikipedia.org/wiki/User_talk:Czar
|
|||
|
|
|||
|
This file is part of Zotero.
|
|||
|
|
|||
|
Zotero is free software: you can redistribute it and/or modify
|
|||
|
it under the terms of the GNU Affero General Public License as published by
|
|||
|
the Free Software Foundation, either version 3 of the License, or
|
|||
|
(at your option) any later version.
|
|||
|
|
|||
|
Zotero is distributed in the hope that it will be useful,
|
|||
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|||
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|||
|
GNU Affero General Public License for more details.
|
|||
|
|
|||
|
You should have received a copy of the GNU Affero General Public License
|
|||
|
along with Zotero. If not, see <http://www.gnu.org/licenses/>.
|
|||
|
|
|||
|
***** END LICENSE BLOCK *****
|
|||
|
*/
|
|||
|
|
|||
|
// attr()/text()
|
|||
|
function attr(doc,selector,attr,index){if(index>0){var elem=doc.querySelectorAll(selector).item(index);return elem?elem.getAttribute(attr):null}var elem=doc.querySelector(selector);return elem?elem.getAttribute(attr):null}function text(doc,selector,index){if(index>0){var elem=doc.querySelectorAll(selector).item(index);return elem?elem.textContent:null}var elem=doc.querySelector(selector);return elem?elem.textContent:null}
|
|||
|
|
|||
|
function detectWeb(doc, url) {
|
|||
|
if (/article\d+/.test(url)) {
|
|||
|
return "newspaperArticle";
|
|||
|
} else if (/(\/((news|sports|entertainment)\/)|(search\/\?q=))|sacbee\.com\/?$/.test(url) && getSearchResults(doc, true) ) {
|
|||
|
return "multiple";
|
|||
|
}
|
|||
|
}
|
|||
|
|
|||
|
function scrape(doc, url) {
|
|||
|
var item = new Zotero.Item("newspaperArticle");
|
|||
|
item.publicationTitle = "The Sacramento Bee";
|
|||
|
item.language = "en-US";
|
|||
|
item.ISSN = "0890-5738";
|
|||
|
item.url = url;
|
|||
|
item.title = attr(doc,'[property="og:title"]','content');
|
|||
|
item.date = text(doc,'.published-date');
|
|||
|
if (item.date) { // don't perform on empty string
|
|||
|
item.date = ZU.strToISO(item.date);
|
|||
|
}
|
|||
|
item.abstractNote = text(doc,'#content-body- p');
|
|||
|
var keywords = attr(doc,'meta[name="keywords"]','content');
|
|||
|
if (keywords) { // so as not to perform a split when keyword string is null
|
|||
|
item.tags = keywords.split(", ");
|
|||
|
}
|
|||
|
item.attachments.push({
|
|||
|
title: "The Sacramento Bee Snapshot",
|
|||
|
mimeType: "text/html",
|
|||
|
document: doc
|
|||
|
});
|
|||
|
|
|||
|
// Authors
|
|||
|
var authorMetadata = doc.querySelectorAll('.ng_byline_name');
|
|||
|
if (authorMetadata.length) { // querySelectorAll always retuns a NodeList, so test against length instead
|
|||
|
// when authors are split between multiple selectors, combine them
|
|||
|
var authorString = '';
|
|||
|
for (i=0; i < authorMetadata.length; i++) {
|
|||
|
authorString = authorString.concat(' '+authorMetadata[i].textContent);
|
|||
|
}
|
|||
|
authorString = authorString.replace('By ','').split(" and ");
|
|||
|
do {
|
|||
|
item.creators.push(ZU.cleanAuthor(authorString[0], "author"));
|
|||
|
authorString.shift();
|
|||
|
}
|
|||
|
while (authorString.length);
|
|||
|
}
|
|||
|
|
|||
|
item.complete();
|
|||
|
}
|
|||
|
|
|||
|
function getSearchResults(doc, checkOnly) {
|
|||
|
var items = {};
|
|||
|
var found = false;
|
|||
|
var rows = doc.querySelectorAll('#site-search-results .title a, .media-body .title a, #story-list .title a, .col-sm-7 .title a');
|
|||
|
for (var i=0; i<rows.length; i++) {
|
|||
|
var href = rows[i].href;
|
|||
|
var title = ZU.trimInternal(rows[i].textContent);
|
|||
|
if (!href || !title) continue;
|
|||
|
if (checkOnly) return true;
|
|||
|
found = true;
|
|||
|
items[href] = title;
|
|||
|
}
|
|||
|
return found ? items : false;
|
|||
|
}
|
|||
|
|
|||
|
function doWeb(doc, url) {
|
|||
|
if (detectWeb(doc, url) == "multiple") {
|
|||
|
Zotero.selectItems(getSearchResults(doc, false), function (items) {
|
|||
|
if (!items) {
|
|||
|
return true;
|
|||
|
}
|
|||
|
var articles = [];
|
|||
|
for (var i in items) {
|
|||
|
articles.push(i);
|
|||
|
}
|
|||
|
ZU.processDocuments(articles, scrape);
|
|||
|
});
|
|||
|
} else scrape(doc, url);
|
|||
|
}/** BEGIN TEST CASES **/
|
|||
|
var testCases = [
|
|||
|
{
|
|||
|
"type": "web",
|
|||
|
"url": "http://www.sacbee.com/news/local/crime/article5641188.html",
|
|||
|
"items": [
|
|||
|
{
|
|||
|
"itemType": "newspaperArticle",
|
|||
|
"title": "Convicted ‘eco-terrorist’ freed amid claims FBI hid evidence",
|
|||
|
"creators": [
|
|||
|
{
|
|||
|
"firstName": "Denny",
|
|||
|
"lastName": "Walsh",
|
|||
|
"creatorType": "author"
|
|||
|
},
|
|||
|
{
|
|||
|
"firstName": "Sam",
|
|||
|
"lastName": "Stanton",
|
|||
|
"creatorType": "author"
|
|||
|
}
|
|||
|
],
|
|||
|
"date": "2015-01-08",
|
|||
|
"ISSN": "0890-5738",
|
|||
|
"abstractNote": "Until this week, the federal government officially considered Eric Taylor McDavid a threat to the nation, a radical eco-terrorist who plotted to bomb or torch the Nimbus Dam, a U.S. Forest Service lab and cellphone towers in the Sacramento region.",
|
|||
|
"language": "en-US",
|
|||
|
"libraryCatalog": "Sacramento Bee",
|
|||
|
"publicationTitle": "The Sacramento Bee",
|
|||
|
"url": "http://www.sacbee.com/news/local/crime/article5641188.html",
|
|||
|
"attachments": [
|
|||
|
{
|
|||
|
"title": "The Sacramento Bee Snapshot",
|
|||
|
"mimeType": "text/html"
|
|||
|
}
|
|||
|
],
|
|||
|
"tags": [
|
|||
|
"Eric McDavid",
|
|||
|
"FBI",
|
|||
|
"eco-terrorism",
|
|||
|
"entrapment",
|
|||
|
"federal courthouse",
|
|||
|
"nimbus dam",
|
|||
|
"prison",
|
|||
|
"release",
|
|||
|
"sacramento"
|
|||
|
],
|
|||
|
"notes": [],
|
|||
|
"seeAlso": []
|
|||
|
}
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"type": "web",
|
|||
|
"url": "http://www.sacbee.com/news/local/article7251650.html",
|
|||
|
"items": [
|
|||
|
{
|
|||
|
"itemType": "newspaperArticle",
|
|||
|
"title": "After nine years in prison, accused eco-terrorist adjusts to sudden release",
|
|||
|
"creators": [
|
|||
|
{
|
|||
|
"firstName": "Denny",
|
|||
|
"lastName": "Walsh",
|
|||
|
"creatorType": "author"
|
|||
|
},
|
|||
|
{
|
|||
|
"firstName": "Sam",
|
|||
|
"lastName": "Stanton",
|
|||
|
"creatorType": "author"
|
|||
|
}
|
|||
|
],
|
|||
|
"date": "2015-01-17",
|
|||
|
"ISSN": "0890-5738",
|
|||
|
"abstractNote": "Eric McDavid was running late for his interview Wednesday, unavoidably delayed when a detective asked to chat with him after he stopped at the Placer County Sheriff’s Office to register as an arsonist.",
|
|||
|
"language": "en-US",
|
|||
|
"libraryCatalog": "Sacramento Bee",
|
|||
|
"publicationTitle": "The Sacramento Bee",
|
|||
|
"url": "http://www.sacbee.com/news/local/article7251650.html",
|
|||
|
"attachments": [
|
|||
|
{
|
|||
|
"title": "The Sacramento Bee Snapshot",
|
|||
|
"mimeType": "text/html"
|
|||
|
}
|
|||
|
],
|
|||
|
"tags": [
|
|||
|
"Benjamin Wagner",
|
|||
|
"Eric McDavid",
|
|||
|
"Lauren Weiner",
|
|||
|
"McGregor Scott",
|
|||
|
"Zachary Johnson",
|
|||
|
"conspiracy",
|
|||
|
"eco-terrorism",
|
|||
|
"eco-terrorist"
|
|||
|
],
|
|||
|
"notes": [],
|
|||
|
"seeAlso": []
|
|||
|
}
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"type": "web",
|
|||
|
"url": "http://www.sacbee.com/entertainment/living/home-garden/article159629689.html",
|
|||
|
"items": [
|
|||
|
{
|
|||
|
"itemType": "newspaperArticle",
|
|||
|
"title": "Want a giant pumpkin? Plant seed now",
|
|||
|
"creators": [
|
|||
|
{
|
|||
|
"firstName": "Debbie",
|
|||
|
"lastName": "Arrington",
|
|||
|
"creatorType": "author"
|
|||
|
}
|
|||
|
],
|
|||
|
"date": "2017-07-07",
|
|||
|
"ISSN": "0890-5738",
|
|||
|
"abstractNote": "Shortly after Independence Day fireworks, it’s time to start thinking about another holiday – Halloween.",
|
|||
|
"language": "en-US",
|
|||
|
"libraryCatalog": "Sacramento Bee",
|
|||
|
"publicationTitle": "The Sacramento Bee",
|
|||
|
"shortTitle": "Want a giant pumpkin?",
|
|||
|
"url": "http://www.sacbee.com/entertainment/living/home-garden/article159629689.html",
|
|||
|
"attachments": [
|
|||
|
{
|
|||
|
"title": "The Sacramento Bee Snapshot",
|
|||
|
"mimeType": "text/html"
|
|||
|
}
|
|||
|
],
|
|||
|
"tags": [
|
|||
|
"dill's atlantic giant",
|
|||
|
"garden",
|
|||
|
"halloween",
|
|||
|
"july",
|
|||
|
"pumpkins",
|
|||
|
"what to plant",
|
|||
|
"world record pumpkin"
|
|||
|
],
|
|||
|
"notes": [],
|
|||
|
"seeAlso": []
|
|||
|
}
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"type": "web",
|
|||
|
"url": "http://www.sacbee.com/search/?q=mcdavid",
|
|||
|
"items": "multiple"
|
|||
|
},
|
|||
|
{
|
|||
|
"type": "web",
|
|||
|
"url": "http://www.sacbee.com/sports/",
|
|||
|
"items": "multiple"
|
|||
|
},
|
|||
|
{
|
|||
|
"type": "web",
|
|||
|
"url": "http://www.sacbee.com/sports/nfl/san-francisco-49ers/",
|
|||
|
"items": "multiple"
|
|||
|
}
|
|||
|
]
|
|||
|
/** END TEST CASES **/
|