zotero/translators/UNZ Print Archive.js

277 lines
6.6 KiB
JavaScript

{
"translatorID": "0754db60-3ad1-49e0-8e3f-f4e1210c756c",
"label": "UNZ Print Archive",
"creator": "czar",
"target": "^https?://(www\\.)?unz\\.com/print",
"minVersion": "3.0",
"maxVersion": "",
"priority": 100,
"inRepository": true,
"translatorType": 4,
"browserSupport": "gcsibv",
"lastUpdated": "2021-07-23 03:39:49"
}
/*
***** BEGIN LICENSE BLOCK *****
Copyright © 2018 czar
http://en.wikipedia.org/wiki/User_talk:Czar
This file is part of Zotero.
Zotero is free software: you can redistribute it and/or modify
it under the terms of the GNU Affero General Public License as published by
the Free Software Foundation, either version 3 of the License, or
(at your option) any later version.
Zotero is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU Affero General Public License for more details.
You should have received a copy of the GNU Affero General Public License
along with Zotero. If not, see <http://www.gnu.org/licenses/>.
***** END LICENSE BLOCK *****
*/
function detectWeb(doc, url) {
if (/\/print\/.*-\d{5}/.test(url)) {
return "magazineArticle";
} else if (getSearchResults(doc, true, url)) {
return "multiple";
}
}
function scrape(doc, url) {
var item = new Zotero.Item("magazineArticle");
item.libraryCatalog = "UNZ";
item.title = text('.block .head');
var authorMetadata = doc.querySelectorAll('#pub-heading .byline a');
for (let author of authorMetadata) {
item.creators.push(ZU.cleanAuthor(author.textContent, "author"));
}
var subhead = text('#pub-heading .subhead');
if (subhead) {
var reviewedAuthor = subhead.replace(/.*\sby\s(.*)/,'$1');
item.creators.push(Zotero.Utilities.cleanAuthor(reviewedAuthor, "reviewedAuthor"));
}
var sourceline = text('#pub-heading .sourceline');
if (sourceline) {
item.publicationTitle = doc.querySelector('.sourceline i').textContent;
item.date = ZU.strToISO(doc.querySelector('.sourceline a').textContent);
item.pages = sourceline.replace(/.*p+\.\s(\d+(-\d+)?).*/,'$1'); // http://regexr.com/3du86
}
item.language = "en";
item.url = url.replace(/[?#].*/, '');
var pdfURL = doc.querySelector('iframe#insert-pdf');
if (pdfURL) {
pdfURL = pdfURL.getAttribute('src');
item.attachments.push({ // no need for snapshots, but download PDF if available
url: pdfURL,
title: item.title,
mimeType:"application/pdf"
});
}
item.complete();
}
function getSearchResults(doc, checkOnly, url) {
var items = {};
var found = false;
var rows;
if (url.includes('/Contents/')) {
rows = doc.querySelectorAll('.show .pub-text a.head');
} else {
rows = doc.querySelectorAll('.pub-text a.head');
}
for (let i=0; i<rows.length; i++) {
let href = rows[i].href;
let title = ZU.trimInternal(rows[i].textContent);
if (!href || !title) continue;
if (checkOnly) return true;
found = true;
items[href] = title;
}
return found ? items : false;
}
function doWeb(doc, url) {
switch (detectWeb(doc, url)) {
case "multiple":
Zotero.selectItems(getSearchResults(doc, false, url), function (items) {
if (!items) {
return true;
}
var articles = [];
for (var i in items) {
articles.push(i);
}
ZU.processDocuments(articles, scrape);
});
break;
case "magazineArticle":
scrape(doc, url);
break;
}
}
/** BEGIN TEST CASES **/
var testCases = [
{
"type": "web",
"url": "https://www.unz.com/print/NYRevBooks-1969nov20-00027",
"items": [
{
"itemType": "magazineArticle",
"title": "Can Technology Be Humane?",
"creators": [
{
"firstName": "Paul",
"lastName": "Goodman",
"creatorType": "author"
}
],
"date": "1969-11-20",
"language": "en",
"libraryCatalog": "UNZ",
"pages": "27-33",
"publicationTitle": "The New York Review of Books",
"url": "https://www.unz.com/print/NYRevBooks-1969nov20-00027",
"attachments": [],
"tags": [],
"notes": [],
"seeAlso": []
}
]
},
{
"type": "web",
"url": "https://www.unz.com/print/Freeman-1958oct-00058",
"items": [
{
"itemType": "magazineArticle",
"title": "Mental Prep vs. Pragmatic Tech",
"creators": [
{
"firstName": "John",
"lastName": "Chamberlain",
"creatorType": "author"
},
{
"firstName": "John",
"lastName": "Keats",
"creatorType": "reviewedAuthor"
}
],
"date": "1958-10",
"language": "en",
"libraryCatalog": "UNZ",
"pages": "58-61",
"publicationTitle": "The Freeman",
"url": "https://www.unz.com/print/Freeman-1958oct-00058",
"attachments": [
{
"title": "Mental Prep vs. Pragmatic Tech",
"mimeType": "application/pdf"
}
],
"tags": [],
"notes": [],
"seeAlso": []
}
]
},
{
"type": "web",
"url": "https://www.unz.com/print/author/GoodmanPaul/",
"items": "multiple"
},
{
"type": "web",
"url": "https://www.unz.com/print/Politics-1946nov",
"items": "multiple"
},
{
"type": "web",
"url": "https://www.unz.com/print/Harpers/Contents/?Period=1982",
"items": "multiple"
},
{
"type": "web",
"url": "https://www.unz.com/print/Search/?Author=goodman&ContentType=Print&PubType=All&Action=Search",
"items": "multiple"
},
{
"type": "web",
"url": "https://www.unz.com/print/NewRepublic-1943dec20-00878",
"items": [
{
"itemType": "magazineArticle",
"title": "Architecture in Wartime",
"creators": [
{
"firstName": "Percival",
"lastName": "Goodman",
"creatorType": "author"
},
{
"firstName": "Paul",
"lastName": "Goodman",
"creatorType": "author"
}
],
"date": "1943-12-20",
"language": "en",
"libraryCatalog": "UNZ",
"pages": "878-882",
"publicationTitle": "The New Republic",
"url": "https://www.unz.com/print/NewRepublic-1943dec20-00878",
"attachments": [],
"tags": [],
"notes": [],
"seeAlso": []
}
]
},
{
"type": "web",
"url": "https://www.unz.com/print/NYRevBooks-1970may21-00003/",
"items": [
{
"itemType": "magazineArticle",
"title": "Good Man",
"creators": [
{
"firstName": "Robert",
"lastName": "Mazzocco",
"creatorType": "author"
},
{
"firstName": "Paul",
"lastName": "Goodman",
"creatorType": "reviewedAuthor"
}
],
"date": "1970-05-21",
"language": "en",
"libraryCatalog": "UNZ",
"pages": "3-4",
"publicationTitle": "The New York Review of Books",
"url": "https://www.unz.com/print/NYRevBooks-1970may21-00003/",
"attachments": [],
"tags": [],
"notes": [],
"seeAlso": []
}
]
}
]
/** END TEST CASES **/