ttrss/plugins/af_comics/init.php

256 lines
7.7 KiB
PHP
Raw Normal View History

<?php
class Af_Comics extends Plugin {
private $host;
private $filters = array();
/**
 * Returns the static metadata describing this plugin.
 *
 * @return array three positional values: 2.0, a one-line description and "fox"
 *               (presumably version, description and author; the exact contract
 *               is defined by the Plugin base class, which is not visible here)
 */
function about() {
	$version = 2.0;
	$description = "Fixes RSS feeds of assorted comic strips";
	$author = "fox";

	return [$version, $description, $author];
}
/**
 * Registers this plugin's hooks with the host and loads the comic filters.
 *
 * Filters are discovered from the *.php files in filters.local/ and then
 * filters/; the expected class name is the file name up to its first dot.
 * filters.local/ is scanned first, so a file there takes precedence over a
 * file with the same name in filters/.
 *
 * @param object $host plugin host; must provide add_hook() and the HOOK_* constants used below
 */
function init($host) {
	$this->host = $host;

	$host->add_hook($host::HOOK_FETCH_FEED, $this);
	$host->add_hook($host::HOOK_FEED_BASIC_INFO, $this);
	$host->add_hook($host::HOOK_SUBSCRIBE_FEED, $this);
	$host->add_hook($host::HOOK_ARTICLE_FILTER, $this);
	$host->add_hook($host::HOOK_PREFS_TAB, $this);

	require_once __DIR__ . "/filter_base.php";

	// glob() returns false on error; treat that as "no files" so array_merge()
	// is never handed a non-array.
	$local_files = glob(__DIR__ . "/filters.local/*.php") ?: [];
	$stock_files = glob(__DIR__ . "/filters/*.php") ?: [];

	$names = [];

	foreach (array_merge($local_files, $stock_files) as $file) {
		$filter_name = preg_replace("/\..*$/", "", basename($file));

		// The first file seen for a given name wins; later duplicates are ignored.
		if (in_array($filter_name, $names, true)) {
			continue;
		}

		if (!class_exists($filter_name)) {
			require_once $file;
		}

		$names[] = $filter_name;

		// Check the type by class name before instantiating: files that do not
		// define the expected class, or define something that is not a comic
		// filter, are skipped instead of being constructed (or causing a fatal error).
		if (!is_subclass_of($filter_name, "Af_ComicFilter")) {
			continue;
		}

		$this->filters[] = new $filter_name();
	}
}
/**
 * Prints the "Feeds supported by af_comics" accordion pane.
 *
 * The list contains the two comics handled directly by this plugin plus
 * whatever each loaded filter reports through supported().
 *
 * @param mixed $args identifier of the preferences tab being rendered;
 *                    nothing is printed unless it equals "prefFeeds"
 */
function hook_prefs_tab($args) {
	if ($args != "prefFeeds") {
		return;
	}

	echo "<div dojoType=\"dijit.layout.AccordionPane\"\ntitle=\"<i class='material-icons'>photo</i> "
		. __('Feeds supported by af_comics') . "\">";

	echo "<p>" . __("The following comics are currently supported:") . "</p>";

	// Start with the comics handled in hook_fetch_feed(), then add the filters' own.
	$supported = ["GoComics", "The Far Side"];

	foreach ($this->filters as $filter) {
		foreach ($filter->supported() as $name) {
			$supported[] = $name;
		}
	}

	asort($supported);

	$items = "";

	foreach ($supported as $name) {
		$items .= "<li>" . $name . "</li>";
	}

	echo "<ul class='panel panel-scrollable list list-unstyled'>" . $items . "</ul>";

	echo "<p>" . __("To subscribe to GoComics use the comic's regular web page as the feed URL (e.g. for the <em>Garfield</em> comic use <code>http://www.gocomics.com/garfield</code>).") . "</p>";
	echo "<p>" . __('Drop any updated filters into <code>filters.local</code> in plugin directory.') . "</p>";

	echo "</div>";
}
/**
 * Offers the article to each loaded filter in turn, stopping at the first
 * filter whose process() call returns a truthy value.
 *
 * @param mixed $article article data handed to each filter's process()
 * @return mixed the article as it stands after the filters have run
 *               (presumably process() takes it by reference and modifies it;
 *               the filter base class is not visible here)
 */
function hook_article_filter($article) {
	foreach ($this->filters as $filter) {
		$handled = $filter->process($article);

		if ($handled) {
			break;
		}
	}

	return $article;
}
/**
 * Substitutes a generated feed for GoComics and The Far Side URLs.
 *
 * For a matching URL, today's comic page is fetched (redirects are not
 * followed) and, when the expected markup is found, a feed with a single
 * entry is rendered from templates/generated_feed.txt. When the page cannot
 * be fetched or parsed the generated feed simply has no entry.
 *
 * @param mixed  $feed_data              feed contents obtained so far; returned untouched when nothing applies
 * @param string $fetch_url              URL of the feed being fetched
 * @param mixed  $owner_uid              unused here
 * @param mixed  $feed                   unused here
 * @param mixed  $last_article_timestamp unused here
 * @param mixed  $auth_login             when set, the feed is left alone
 * @param mixed  $auth_pass              when set, the feed is left alone
 * @return mixed the generated feed, or $feed_data when the URL is not handled
 *               or the template produced no output
 */
// GoComics dropped feed support so it needs to be handled when fetching the feed.
// TODO: this should be split into individual methods provided by filters
function hook_fetch_feed($feed_data, $fetch_url, $owner_uid, $feed, $last_article_timestamp, $auth_login, $auth_pass) {
	if ($auth_login || $auth_pass)
		return $feed_data;

	if (preg_match('#^https?://(?:feeds\.feedburner\.com/uclick|www\.gocomics\.com)/([-a-z0-9]+)$#i', $fetch_url, $comic)) {
		$site_url = 'https://www.gocomics.com/' . $comic[1];
		$article_link = $site_url . date('/Y/m/d');

		// Fetch with the raw URL; the values are HTML-escaped only afterwards, for the template.
		$body = fetch_file_contents(array('url' => $article_link, 'type' => 'text/html', 'followlocation' => false));

		require_once 'lib/MiniTemplator.class.php';

		$feed_title = htmlspecialchars($comic[1]);
		$site_url = htmlspecialchars($site_url);
		$article_link = htmlspecialchars($article_link);

		$tpl = new MiniTemplator();

		$tpl->readTemplateFromFile('templates/generated_feed.txt');

		$tpl->setVariable('FEED_TITLE', $feed_title, true);
		$tpl->setVariable('VERSION', get_version(), true);
		$tpl->setVariable('FEED_URL', htmlspecialchars($fetch_url), true);
		$tpl->setVariable('SELF_URL', $site_url, true);

		if ($body) {
			$doc = new DOMDocument();

			if (@$doc->loadHTML($body)) {
				$xpath = new DOMXPath($doc);

				$node = $xpath->query('//picture[contains(@class, "item-comic-image")]/img')->item(0);

				if ($node) {
					$title = $xpath->query('//h1')->item(0);

					if ($title) {
						$title = clean(trim($title->nodeValue));
					} else {
						$title = date('l, F d, Y');
					}

					foreach (['srcset', 'sizes', 'data-srcset', 'width'] as $attr) {
						$node->removeAttribute($attr);
					}

					$tpl->setVariable('ARTICLE_ID', $article_link, true);
					$tpl->setVariable('ARTICLE_LINK', $article_link, true);
					// Entry timestamp is today at 11:00:00 in the default timezone.
					$tpl->setVariable('ARTICLE_UPDATED_ATOM', date('c', mktime(11, 0, 0)), true);
					$tpl->setVariable('ARTICLE_TITLE', htmlspecialchars($title), true);
					$tpl->setVariable('ARTICLE_EXCERPT', '', true);
					$tpl->setVariable('ARTICLE_CONTENT', $doc->saveHTML($node), true);
					$tpl->setVariable('ARTICLE_AUTHOR', '', true);
					$tpl->setVariable('ARTICLE_SOURCE_LINK', $site_url, true);
					$tpl->setVariable('ARTICLE_SOURCE_TITLE', $feed_title, true);

					$tpl->addBlock('entry');
				}
			}
		}

		$tpl->addBlock('feed');

		if ($tpl->generateOutputToString($tmp_data))
			$feed_data = $tmp_data;

	} else if (preg_match("#^https?://www\.thefarside\.com#", $fetch_url)) {
		require_once 'lib/MiniTemplator.class.php';

		// Keep the raw URL for the HTTP request and escape it exactly once for
		// the template, mirroring the GoComics branch above.
		$article_url = "https://www.thefarside.com" . date('/Y/m/d');
		$article_link = htmlspecialchars($article_url);

		$tpl = new MiniTemplator();

		$tpl->readTemplateFromFile('templates/generated_feed.txt');

		$tpl->setVariable('FEED_TITLE', "The Far Side", true);
		$tpl->setVariable('VERSION', get_version(), true);
		$tpl->setVariable('FEED_URL', htmlspecialchars($fetch_url), true);
		$tpl->setVariable('SELF_URL', htmlspecialchars($fetch_url), true);

		$body = fetch_file_contents(['url' => $article_url, 'type' => 'text/html', 'followlocation' => false]);

		if ($body) {
			$doc = new DOMDocument();

			if (@$doc->loadHTML($body)) {
				$xpath = new DOMXPath($doc);

				$content_node = $xpath->query('//*[contains(@class,"js-daily-dose")]')->item(0);

				if ($content_node) {
					// The leading "." makes the expression relative to $content_node;
					// a bare "//" would search the whole document regardless of context.
					$imgs = $xpath->query('.//img[@data-src]', $content_node);

					foreach ($imgs as $img) {
						$img->setAttribute('src', $img->getAttribute('data-src'));
					}

					// Deliberately document-wide, and done before the title lookup below.
					$junk_elems = $xpath->query("//*[@data-shareable-popover]");

					foreach ($junk_elems as $junk) {
						$junk->parentNode->removeChild($junk);
					}

					$title = $xpath->query('//h3')->item(0);

					if ($title) {
						$title = clean(trim($title->nodeValue));
					} else {
						$title = date('l, F d, Y');
					}

					$tpl->setVariable('ARTICLE_ID', $article_link, true);
					$tpl->setVariable('ARTICLE_LINK', $article_link, true);
					// Entry timestamp is today at 11:00:00 in the default timezone.
					$tpl->setVariable('ARTICLE_UPDATED_ATOM', date('c', mktime(11, 0, 0)), true);
					$tpl->setVariable('ARTICLE_TITLE', htmlspecialchars($title), true);
					$tpl->setVariable('ARTICLE_EXCERPT', '', true);
					$tpl->setVariable('ARTICLE_CONTENT', "<p> " . $doc->saveHTML($content_node) . "</p>", true);
					$tpl->setVariable('ARTICLE_AUTHOR', '', true);
					$tpl->setVariable('ARTICLE_SOURCE_LINK', $article_link, true);
					$tpl->setVariable('ARTICLE_SOURCE_TITLE', "The Far Side", true);

					$tpl->addBlock('entry');
				}
			}
		}

		$tpl->addBlock('feed');

		if ($tpl->generateOutputToString($tmp_data))
			$feed_data = $tmp_data;
	}

	return $feed_data;
}
/**
 * Replaces the fetched page with a bare XML declaration for the comic URLs
 * this plugin generates feeds for, so the subscription code does not treat
 * the page as HTML.
 *
 * @param mixed  $contents   contents fetched for the URL being subscribed to
 * @param string $url        URL being subscribed to
 * @param mixed  $auth_login when set, $contents is returned unchanged
 * @param mixed  $auth_pass  when set, $contents is returned unchanged
 * @return mixed the XML declaration for handled URLs, otherwise $contents
 */
function hook_subscribe_feed($contents, $url, $auth_login, $auth_pass) {
	if ($auth_login || $auth_pass) {
		return $contents;
	}

	$handled_urls = [
		'#^https?://www\.gocomics\.com/([-a-z0-9]+)$#i',
		"#^https?://www\.thefarside\.com#",
	];

	foreach ($handled_urls as $pattern) {
		if (preg_match($pattern, $url)) {
			// Get is_html() to return false.
			return '<?xml version="1.0" encoding="utf-8"?>';
		}
	}

	return $contents;
}
/**
 * Supplies title and site URL for the comic URLs this plugin generates feeds for.
 *
 * @param mixed  $basic_info info gathered so far; returned unchanged when the URL is not handled
 * @param string $fetch_url  URL of the feed
 * @param mixed  $owner_uid  unused here
 * @param mixed  $feed       unused here
 * @param mixed  $auth_login when set, $basic_info is returned unchanged
 * @param mixed  $auth_pass  when set, $basic_info is returned unchanged
 * @return mixed array with 'title' and 'site_url' keys for handled URLs, otherwise $basic_info
 */
function hook_feed_basic_info($basic_info, $fetch_url, $owner_uid, $feed, $auth_login, $auth_pass) {
	if ($auth_login || $auth_pass)
		return $basic_info;

	if (preg_match('#^https?://www\.gocomics\.com/([-a-z0-9]+)$#i', $fetch_url, $matches))
		$basic_info = ['title' => ucfirst($matches[1]), 'site_url' => $matches[0]];

	// Same pattern as hook_subscribe_feed() and hook_fetch_feed(): dots are
	// escaped and no trailing slash is required, so every URL accepted there
	// also gets its basic info here.
	if (preg_match('#^https?://www\.thefarside\.com#', $fetch_url))
		$basic_info = ['title' => "The Far Side", 'site_url' => 'https://www.thefarside.com'];

	return $basic_info;
}
/**
 * Reports the plugin API version this plugin is written against.
 *
 * @return int always 2
 */
function api_version() {
	$version = 2;

	return $version;
}
}