zotero-db/translators/dLibra.js

368 lines
9.6 KiB
JavaScript

{
"translatorID": "915e3ae2-afa9-4b1d-9780-28ed3defe0ab",
"label": "dLibra",
"creator": "Pawel Kolodziej <p.kolodziej@gmail.com> and Kamil Gronowski <kgronowski@man.poznan.pl>",
"target": "/.*dlibra/(doccontent|docmetadata|collectiondescription|results)|/dlibra/?",
"minVersion": "2.1.9",
"maxVersion": "",
"priority": 100,
"inRepository": true,
"translatorType": 4,
"browserSupport": "gcsibv",
"lastUpdated": "2021-10-21 04:23:31"
}
/*
***** BEGIN LICENSE BLOCK *****
Copyright © 2021 Pawel Kolodziej, Kamil Gronowski
This file is part of Zotero.
Zotero is free software: you can redistribute it and/or modify
it under the terms of the GNU Affero General Public License as published by
the Free Software Foundation, either version 3 of the License, or
(at your option) any later version.
Zotero is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU Affero General Public License for more details.
You should have received a copy of the GNU Affero General Public License
along with Zotero. If not, see <http://www.gnu.org/licenses/>.
***** END LICENSE BLOCK *****
*/
let POLISH_TYPE_MAPPINGS = {
"dokument dźwiękowy": "audioRecording",
książka: "book",
rozdział: "bookSection",
artykuł: "journalArticle",
czasopismo: "journalArticle",
Article: "journalArticle", // not Polish, but also present sometimes
manuskrypt: "manuscript",
rękopis: "manuscript",
mapa: "map",
raport: "report",
"praca dyplomowa": "thesis",
"rozprawa doktorska": "thesis"
};
function detectWeb(doc, url) {
let singleRe = /dlibra\/(doccontent|docmetadata|publication)/;
if (singleRe.test(url)) {
let types = Array.from(doc.querySelectorAll('meta[name="DC.type"]')).map(meta => meta.content);
let type;
for (let possibleType of types) {
if (POLISH_TYPE_MAPPINGS[possibleType]) {
type = POLISH_TYPE_MAPPINGS[possibleType];
break;
}
type = possibleType;
}
return (type && ZU.itemTypeExists(type)) ? type : "document";
}
if (getSearchResults(doc, true)) {
return "multiple";
}
return false;
}
function doWeb(doc, url) {
if (detectWeb(doc, url) == "multiple") {
Zotero.selectItems(getSearchResults(doc, false), function (items) {
if (!items) {
return true;
}
ZU.processDocuments(Object.keys(items), scrape);
return false;
});
}
else {
scrape(doc, url);
}
return false;
}
function getSearchResults(doc, checkOnly) {
let items = {};
let found = false;
// dLibra 5
let rows = doc.querySelectorAll('.dLSearchResultTitle');
if (rows.length) {
for (let row of rows) {
let href = row.href;
let title = ZU.trimInternal(text(row, '#src_titleLink_fullTitle > span.src_titleLink_title'));
if (!href || !title) continue;
if (checkOnly) return true;
found = true;
items[href] = title;
}
}
else {
// dLibra 6
rows = doc.querySelectorAll('.objectbox__text--title');
if (!rows.length) rows = doc.querySelectorAll('.item__link--title');
for (let row of rows) {
// skip 'Similar in FBC'
if (row.getAttribute('title')) {
let href = attr(row, 'a', 'href') || row.href;
let title = ZU.trimInternal(
row.classList.contains('item__link--title')
? row.textContent
: row.getAttribute('title'));
if (!href || !title) continue;
if (checkOnly) return true;
found = true;
items[href] = title;
}
}
}
return found ? items : false;
}
function scrape(doc, url) {
let reDlibra5Single = new RegExp("((.*/dlibra)/(?:doccontent|docmetadata|publication).*[?&]id=([0-9]*)).*");
let m = reDlibra5Single.exec(url);
if (m) {
dlibraScrape(doc, m[1], m[2], "e", m[3]);
}
else {
let reDlibra6Single = new RegExp("((.*/dlibra)/publication/([0-9]*)(/edition/([0-9]*))?).*");
let m = reDlibra6Single.exec(url);
if (m) {
if (m[4]) {
dlibraScrape(doc, m[1], m[2], "e", m[5]);
}
else {
dlibraScrape(doc, m[1], m[2], "p", m[3]);
}
}
}
}
function dlibraScrape(doc, objUrl, baseUrl, objType, id) {
ZU.HTTP.doGet(baseUrl + "/rdf.xml?type=" + objType + "&id=" + id, function (rdf) {
rdf = rdf.replace(/<\?xml[^>]*\?>/, "");
let dcTypeRegex = /<dc:type[^>]*>([^<]+)<\/dc:type>/gi;
let m, type;
while ((m = dcTypeRegex.exec(rdf))) {
if (POLISH_TYPE_MAPPINGS[m[1]]) {
type = POLISH_TYPE_MAPPINGS[m[1]];
break;
}
}
let translator = Zotero.loadTranslator("import");
// RDF importer
translator.setTranslator("5e3ad958-ac79-463d-812b-a86a9235c28f");
translator.setString(rdf);
translator.setHandler("itemDone", function (obj, item) {
item.url = objUrl;
item.itemID = "";
addAttachments(doc, item);
item.complete();
});
translator.getTranslatorObject(function (trans) {
if (type) {
trans.defaultUnknownType = type;
}
trans.doImport();
});
});
}
function addAttachments(doc, item) {
let pdfURL = ZU.xpath(doc, '//meta[@name="citation_pdf_url"]/@content');
if (pdfURL.length) {
pdfURL = pdfURL[0].textContent;
item.attachments.push({ title: "Full Text PDF", url: pdfURL, mimeType: "application/pdf" });
}
item.attachments.push({ document: doc, title: "Snapshot" });
}
function attr(docOrElem, selector, attr, index) {
let elem = index ? docOrElem.querySelectorAll(selector).item(index) : docOrElem.querySelector(selector);
return elem ? elem.getAttribute(attr) : null;
}
function text(docOrElem, selector, index) {
let elem = index ? docOrElem.querySelectorAll(selector).item(index) : docOrElem.querySelector(selector);
return elem ? elem.textContent : null;
}
/** BEGIN TEST CASES **/
var testCases = [
{
"type": "web",
"url": "http://mbc.cyfrowemazowsze.pl/dlibra/docmetadata?id=84344",
"items": [
{
"itemType": "journalArticle",
"title": "Przegląd Sportowy : tygodnik ilustrowany, poświęcony wszelkim gałęziom sportu : oficjalny organ Polskiego Związku Piłki Nożnej oraz Krakowskiego, Warszawskiego, Lwowskiego i Łódzkiego Związku Okręgowego Piłki Nożnej. R. 2, 1922 nr 6 (10 II)",
"creators": [
{
"firstName": "Tadeusz (1889-1960) Red odpowiedzialny",
"lastName": "Synowiec",
"creatorType": "author"
}
],
"date": "1922",
"abstractNote": "16 s. : il. ; 31 cm",
"language": "pol",
"libraryCatalog": "dLibra",
"publisher": "Dembiński, Aleksander",
"rights": "Licencja udzielona Bibliotece Głównej im. Jędrzeja Śniadeckiego Akademii Wychowania Fizycznego Józefa Piłsudskiego w Warszawie",
"shortTitle": "Przegląd Sportowy",
"url": "http://mbc.cyfrowemazowsze.pl/dlibra/docmetadata?id=84344",
"attachments": [
{
"title": "Full Text PDF",
"mimeType": "application/pdf"
},
{
"title": "Snapshot",
"mimeType": "text/html"
}
],
"tags": [
{
"tag": "wiadomości sportowe"
},
{
"tag": "sport"
},
{
"tag": "czasopismo sportowe"
},
{
"tag": "prasa polska"
}
],
"notes": [],
"seeAlso": []
}
]
},
{
"type": "web",
"url": "https://demo.dl.psnc.pl/dlibra/planned?action=SimpleSearchAction&type=-6&p=0",
"items": "multiple"
},
{
"type": "web",
"url": "https://demo.dl.psnc.pl/dlibra/collectiondescription/1",
"items": "multiple"
},
{
"type": "web",
"url": "https://demo.dl.psnc.pl/dlibra/results?q=*&action=SimpleSearchAction&type=-6&p=0",
"items": "multiple"
},
{
"type": "web",
"url": "https://demo.dl.psnc.pl/dlibra/publication/1502/edition/1243",
"items": [
{
"itemType": "book",
"title": "Pan Tadeusz",
"creators": [
{
"firstName": "Adam",
"lastName": "Mickiewicz",
"creatorType": "author"
}
],
"date": "1882",
"abstractNote": "Epilog",
"language": "pol",
"libraryCatalog": "dLibra",
"publisher": "Lwów, Nakładem Księgarni F. H. Richtera. (H. Altbenberg)",
"rights": "Open Access",
"url": "https://demo.dl.psnc.pl/dlibra/publication/1502/edition/1243",
"attachments": [
{
"title": "Full Text PDF",
"mimeType": "application/pdf"
},
{
"title": "Snapshot",
"mimeType": "text/html"
}
],
"tags": [
{
"tag": "poezja"
},
{
"tag": "poezja polska"
}
],
"notes": [],
"seeAlso": []
}
]
},
{
"type": "web",
"url": "https://journals.pan.pl/dlibra/publication/99314/edition/118913/content",
"items": [
{
"itemType": "journalArticle",
"title": "Test laboratoryjny dla oceny tunelowania metodą EPB: wyniki testów dla dwóch różnych gruntów ziarnistych",
"creators": [
{
"firstName": "Daniele",
"lastName": "Peila",
"creatorType": "author"
},
{
"firstName": "Luca",
"lastName": "Borio",
"creatorType": "author"
}
],
"date": "2011",
"ISSN": "0860-0953",
"libraryCatalog": "dLibra",
"publicationTitle": "Gospodarka Surowcami Mineralnymi - Mineral Resources Management; 2011; No 1; 85-100",
"shortTitle": "Test laboratoryjny dla oceny tunelowania metodą EPB",
"url": "https://journals.pan.pl/dlibra/publication/99314/edition/118913",
"attachments": [
{
"title": "Full Text PDF",
"mimeType": "application/pdf"
},
{
"title": "Snapshot",
"mimeType": "text/html"
}
],
"tags": [
{
"tag": "EPB tunnelling"
},
{
"tag": "Nauki Techniczne"
},
{
"tag": "risk management"
},
{
"tag": "soil conditioning"
}
],
"notes": [],
"seeAlso": []
}
]
},
{
"type": "web",
"url": "https://journals.pan.pl/dlibra/results?q=test&action=SimpleSearchAction&mdirids=&type=-6&startstr=_all&p=0",
"items": "multiple"
}
]
/** END TEST CASES **/