244 lines
6.5 KiB
JavaScript
244 lines
6.5 KiB
JavaScript
|
{
|
||
|
"translatorID": "6f9aa90d-6631-4459-81ef-a0758d2e3921",
|
||
|
"label": "Blogger",
|
||
|
"creator": "Adam Crymble",
|
||
|
"target": "\\.blogspot\\.com",
|
||
|
"minVersion": "3.0",
|
||
|
"maxVersion": "",
|
||
|
"priority": 100,
|
||
|
"inRepository": true,
|
||
|
"translatorType": 4,
|
||
|
"browserSupport": "gcsibv",
|
||
|
"lastUpdated": "2016-09-05 23:14:05"
|
||
|
}
|
||
|
|
||
|
function detectWeb(doc, url) {
|
||
|
var result = doc.evaluate('//h3[contains(@class,"post-title") and contains(@class,"entry-title")]', doc, null, XPathResult.ANY_TYPE, null);
|
||
|
var entry = result.iterateNext();
|
||
|
if (entry && result.iterateNext()) {
|
||
|
return "multiple";
|
||
|
} else if (entry) {
|
||
|
return "blogPost";
|
||
|
} else {
|
||
|
return false;
|
||
|
}
|
||
|
}
|
||
|
|
||
|
|
||
|
function getSearchResults(doc, checkOnly) {
|
||
|
var items = {};
|
||
|
var found = false;
|
||
|
var rows = ZU.xpath(doc, '//h3[@class="post-title entry-title"]/a|//li[@class="archivedate expanded"]/ul[@class="posts"]/li/a');
|
||
|
for (var i=0; i<rows.length; i++) {
|
||
|
var href = rows[i].href;
|
||
|
var title = ZU.trimInternal(rows[i].textContent);
|
||
|
if (!href || !title) continue;
|
||
|
if (checkOnly) return true;
|
||
|
found = true;
|
||
|
items[href] = title;
|
||
|
}
|
||
|
return found ? items : false;
|
||
|
}
|
||
|
//Blogger translator. Code by Adam Crymble
|
||
|
|
||
|
function scrape(doc, url) {
|
||
|
var tagsContent = new Array();
|
||
|
var newItem = new Zotero.Item("blogPost");
|
||
|
|
||
|
//title
|
||
|
if (ZU.xpathText(doc, '//h3[@class="post-title entry-title"]/a')) {
|
||
|
newItem.title = ZU.xpathText(doc, '//h3[@class="post-title entry-title"]/a');
|
||
|
} else {
|
||
|
newItem.title = doc.title;
|
||
|
}
|
||
|
|
||
|
//author, if available
|
||
|
if (ZU.xpathText(doc, '//span[@class="post-author vcard"]//span[@class="fn"]')) {
|
||
|
var author = ZU.xpathText(doc, '//span[@class="post-author vcard"]//span[@class="fn"]').trim();
|
||
|
var author = author.toLowerCase();
|
||
|
if (author.match(/\sby\s/)) {
|
||
|
var shortenAuthor = author.indexOf(" by");
|
||
|
author = author.substr(shortenAuthor + 3).replace(/^\s*|\s$/g, '');
|
||
|
}
|
||
|
var words = author.split(/\s/);
|
||
|
for (var i in words) {
|
||
|
words[i] = words[i].substr(0, 1).toUpperCase() + words[i].substr(1).toLowerCase();
|
||
|
}
|
||
|
author = words.join(" ");
|
||
|
newItem.creators.push(Zotero.Utilities.cleanAuthor(author, "author"));
|
||
|
}
|
||
|
|
||
|
//date, if available
|
||
|
newItem.date = ZU.xpathText(doc, '//h2[@class="date-header"]');
|
||
|
|
||
|
|
||
|
//tags, if available
|
||
|
var tags = ZU.xpath(doc, '//span[@class="post-labels"]/a');
|
||
|
for (var i = 0; i < tags.length; i++) {
|
||
|
newItem.tags.push(tags[i].textContent);
|
||
|
}
|
||
|
|
||
|
var blogTitle1 = doc.title.split(":");
|
||
|
var cleanurl = url.replace(/[\?#].+/, "");
|
||
|
newItem.blogTitle = blogTitle1[0];
|
||
|
newItem.url=cleanurl;
|
||
|
newItem.attachments = [{url:cleanurl, title:"Blogspot Snapshot", mimeType: "text/html"}];
|
||
|
|
||
|
newItem.complete();
|
||
|
}
|
||
|
|
||
|
|
||
|
function doWeb(doc, url) {
|
||
|
var articles = new Array();
|
||
|
|
||
|
if (detectWeb(doc, url) == "multiple") {
|
||
|
Zotero.selectItems(getSearchResults(doc, false), function(items) {
|
||
|
if (!items) {
|
||
|
return true;
|
||
|
}
|
||
|
var articles = [];
|
||
|
for (var i in items) {
|
||
|
articles.push(i);
|
||
|
}
|
||
|
ZU.processDocuments(articles, scrape);
|
||
|
});
|
||
|
} else {
|
||
|
scrape(doc, url);
|
||
|
}
|
||
|
}/** BEGIN TEST CASES **/
|
||
|
var testCases = [
|
||
|
{
|
||
|
"type": "web",
|
||
|
"url": "http://observationalepidemiology.blogspot.com/2011/10/tweet-from-matt-yglesias.html",
|
||
|
"items": [
|
||
|
{
|
||
|
"itemType": "blogPost",
|
||
|
"title": "A tweet from Matt Yglesias",
|
||
|
"creators": [
|
||
|
{
|
||
|
"firstName": "",
|
||
|
"lastName": "Joseph",
|
||
|
"creatorType": "author"
|
||
|
}
|
||
|
],
|
||
|
"date": "Monday, October 24, 2011",
|
||
|
"accessDate": "CURRENT_TIMESTAMP",
|
||
|
"blogTitle": "West Coast Stat Views (on Observational Epidemiology and more)",
|
||
|
"libraryCatalog": "Blogger",
|
||
|
"url": "http://observationalepidemiology.blogspot.com/2011/10/tweet-from-matt-yglesias.html",
|
||
|
"attachments": [
|
||
|
{
|
||
|
"title": "Blogspot Snapshot",
|
||
|
"mimeType": "text/html"
|
||
|
}
|
||
|
],
|
||
|
"tags": [
|
||
|
"Mark",
|
||
|
"Matthew Yglesias"
|
||
|
],
|
||
|
"notes": [],
|
||
|
"seeAlso": []
|
||
|
}
|
||
|
]
|
||
|
},
|
||
|
{
|
||
|
"type": "web",
|
||
|
"url": "http://observationalepidemiology.blogspot.com/",
|
||
|
"items": "multiple"
|
||
|
},
|
||
|
{
|
||
|
"type": "web",
|
||
|
"url": "http://argentina-politica.blogspot.com/2012/03/perciben-una-caida-en-la-imagen-de-la.html",
|
||
|
"items": [
|
||
|
{
|
||
|
"itemType": "blogPost",
|
||
|
"title": "Politica Argentina - Blog de Psicología Política de Federico González: Perciben una caída en la imagen de la Presidenta",
|
||
|
"creators": [
|
||
|
{
|
||
|
"firstName": "Federico",
|
||
|
"lastName": "Gonzalez",
|
||
|
"creatorType": "author"
|
||
|
}
|
||
|
],
|
||
|
"date": "domingo, 11 de marzo de 2012",
|
||
|
"blogTitle": "Politica Argentina - Blog de Psicología Política de Federico González",
|
||
|
"shortTitle": "Politica Argentina - Blog de Psicología Política de Federico González",
|
||
|
"url": "http://argentina-politica.blogspot.com/2012/03/perciben-una-caida-en-la-imagen-de-la.html",
|
||
|
"attachments": [
|
||
|
{
|
||
|
"title": "Blogspot Snapshot",
|
||
|
"mimeType": "text/html"
|
||
|
}
|
||
|
],
|
||
|
"tags": [
|
||
|
"Cristina Kirchner",
|
||
|
"imagen"
|
||
|
],
|
||
|
"notes": [],
|
||
|
"seeAlso": []
|
||
|
}
|
||
|
]
|
||
|
},
|
||
|
{
|
||
|
"type": "web",
|
||
|
"url": "http://utotherescue.blogspot.com/2013/11/the-heart-of-matter-humanities-do-more.html",
|
||
|
"items": [
|
||
|
{
|
||
|
"itemType": "blogPost",
|
||
|
"title": "National Humanities Report Reinforces Stereotypes about the Humanities ~ Remaking the University",
|
||
|
"creators": [
|
||
|
{
|
||
|
"firstName": "Michael",
|
||
|
"lastName": "Meranze",
|
||
|
"creatorType": "author"
|
||
|
}
|
||
|
],
|
||
|
"date": "Monday, November 25, 2013",
|
||
|
"blogTitle": "National Humanities Report Reinforces Stereotypes about the Humanities ~ Remaking the University",
|
||
|
"url": "http://utotherescue.blogspot.com/2013/11/the-heart-of-matter-humanities-do-more.html",
|
||
|
"attachments": [
|
||
|
{
|
||
|
"title": "Blogspot Snapshot",
|
||
|
"mimeType": "text/html"
|
||
|
}
|
||
|
],
|
||
|
"tags": [
|
||
|
"Cuts",
|
||
|
"Development",
|
||
|
"Humanities",
|
||
|
"Liberal Arts",
|
||
|
"guest post"
|
||
|
],
|
||
|
"notes": [],
|
||
|
"seeAlso": []
|
||
|
}
|
||
|
]
|
||
|
},
|
||
|
{
|
||
|
"type": "web",
|
||
|
"url": "https://jamsubuntu.blogspot.com/2009/01/unmount-command-not-found.html",
|
||
|
"items": [
|
||
|
{
|
||
|
"itemType": "blogPost",
|
||
|
"title": "Jam's Ubuntu Linux Blog: unmount: command not found",
|
||
|
"creators": [],
|
||
|
"date": "Wednesday, 7 January 2009",
|
||
|
"blogTitle": "Jam's Ubuntu Linux Blog",
|
||
|
"shortTitle": "Jam's Ubuntu Linux Blog",
|
||
|
"url": "https://jamsubuntu.blogspot.com/2009/01/unmount-command-not-found.html",
|
||
|
"attachments": [
|
||
|
{
|
||
|
"title": "Blogspot Snapshot",
|
||
|
"mimeType": "text/html"
|
||
|
}
|
||
|
],
|
||
|
"tags": [
|
||
|
"Command Line"
|
||
|
],
|
||
|
"notes": [],
|
||
|
"seeAlso": []
|
||
|
}
|
||
|
]
|
||
|
}
|
||
|
]
|
||
|
/** END TEST CASES **/
|