host = $host; $host->add_hook($host::HOOK_FETCH_FEED, $this); $host->add_hook($host::HOOK_FEED_BASIC_INFO, $this); $host->add_hook($host::HOOK_SUBSCRIBE_FEED, $this); $host->add_hook($host::HOOK_ARTICLE_FILTER, $this); $host->add_hook($host::HOOK_PREFS_TAB, $this); require_once __DIR__ . "/filter_base.php"; $filters = array_merge(glob(__DIR__ . "/filters.local/*.php"), glob(__DIR__ . "/filters/*.php")); $names = []; foreach ($filters as $file) { $filter_name = preg_replace("/\..*$/", "", basename($file)); if (array_search($filter_name, $names) === FALSE) { if (!class_exists($filter_name)) { require_once $file; } array_push($names, $filter_name); $filter = new $filter_name(); if (is_subclass_of($filter, "Af_ComicFilter")) { array_push($this->filters, $filter); array_push($names, $filter_name); } } } } function hook_prefs_tab($args) { if ($args != "prefFeeds") return; print "
"; } function hook_article_filter($article) { foreach ($this->filters as $f) { if ($f->process($article)) break; } return $article; } // GoComics dropped feed support so it needs to be handled when fetching the feed. // TODO: this should be split into individual methods provided by filters function hook_fetch_feed($feed_data, $fetch_url, $owner_uid, $feed, $last_article_timestamp, $auth_login, $auth_pass) { if ($auth_login || $auth_pass) return $feed_data; if (preg_match('#^https?://(?:feeds\.feedburner\.com/uclick|www\.gocomics\.com)/([-a-z0-9]+)$#i', $fetch_url, $comic)) { $site_url = 'https://www.gocomics.com/' . $comic[1]; $article_link = $site_url . date('/Y/m/d'); $body = fetch_file_contents(array('url' => $article_link, 'type' => 'text/html', 'followlocation' => false)); require_once 'lib/MiniTemplator.class.php'; $feed_title = htmlspecialchars($comic[1]); $site_url = htmlspecialchars($site_url); $article_link = htmlspecialchars($article_link); $tpl = new MiniTemplator(); $tpl->readTemplateFromFile('templates/generated_feed.txt'); $tpl->setVariable('FEED_TITLE', $feed_title, true); $tpl->setVariable('VERSION', get_version(), true); $tpl->setVariable('FEED_URL', htmlspecialchars($fetch_url), true); $tpl->setVariable('SELF_URL', $site_url, true); if ($body) { $doc = new DOMDocument(); if (@$doc->loadHTML($body)) { $xpath = new DOMXPath($doc); $node = $xpath->query('//picture[contains(@class, "item-comic-image")]/img')->item(0); if ($node) { $title = $xpath->query('//h1')->item(0); if ($title) { $title = clean(trim($title->nodeValue)); } else { $title = date('l, F d, Y'); } foreach (['srcset', 'sizes', 'data-srcset', 'width'] as $attr ) { $node->removeAttribute($attr); } $tpl->setVariable('ARTICLE_ID', $article_link, true); $tpl->setVariable('ARTICLE_LINK', $article_link, true); $tpl->setVariable('ARTICLE_UPDATED_ATOM', date('c', mktime(11, 0, 0)), true); $tpl->setVariable('ARTICLE_TITLE', htmlspecialchars($title), true); $tpl->setVariable('ARTICLE_EXCERPT', '', true); $tpl->setVariable('ARTICLE_CONTENT', $doc->saveHTML($node), true); $tpl->setVariable('ARTICLE_AUTHOR', '', true); $tpl->setVariable('ARTICLE_SOURCE_LINK', $site_url, true); $tpl->setVariable('ARTICLE_SOURCE_TITLE', $feed_title, true); $tpl->addBlock('entry'); } } } $tpl->addBlock('feed'); if ($tpl->generateOutputToString($tmp_data)) $feed_data = $tmp_data; } else if (preg_match("#^https?://www\.thefarside\.com#", $fetch_url)) { require_once 'lib/MiniTemplator.class.php'; $article_link = htmlspecialchars("https://www.thefarside.com" . date('/Y/m/d')); $tpl = new MiniTemplator(); $tpl->readTemplateFromFile('templates/generated_feed.txt'); $tpl->setVariable('FEED_TITLE', "The Far Side", true); $tpl->setVariable('VERSION', get_version(), true); $tpl->setVariable('FEED_URL', htmlspecialchars($fetch_url), true); $tpl->setVariable('SELF_URL', htmlspecialchars($fetch_url), true); $body = fetch_file_contents(['url' => $article_link, 'type' => 'text/html', 'followlocation' => false]); if ($body) { $doc = new DOMDocument(); if (@$doc->loadHTML($body)) { $xpath = new DOMXPath($doc); $content_node = $xpath->query('//*[contains(@class,"js-daily-dose")]')->item(0); if ($content_node) { $imgs = $xpath->query('//img[@data-src]', $content_node); foreach ($imgs as $img) { $img->setAttribute('src', $img->getAttribute('data-src')); } $junk_elems = $xpath->query("//*[@data-shareable-popover]"); foreach ($junk_elems as $junk) $junk->parentNode->removeChild($junk); $title = $xpath->query('//h3')->item(0); if ($title) { $title = clean(trim($title->nodeValue)); } else { $title = date('l, F d, Y'); } $tpl->setVariable('ARTICLE_ID', htmlspecialchars($article_link), true); $tpl->setVariable('ARTICLE_LINK', htmlspecialchars($article_link), true); $tpl->setVariable('ARTICLE_UPDATED_ATOM', date('c', mktime(11, 0, 0)), true); $tpl->setVariable('ARTICLE_TITLE', htmlspecialchars($title), true); $tpl->setVariable('ARTICLE_EXCERPT', '', true); $tpl->setVariable('ARTICLE_CONTENT', "" . $doc->saveHTML($content_node) . "
", true); $tpl->setVariable('ARTICLE_AUTHOR', '', true); $tpl->setVariable('ARTICLE_SOURCE_LINK', htmlspecialchars($article_link), true); $tpl->setVariable('ARTICLE_SOURCE_TITLE', "The Far Side", true); $tpl->addBlock('entry'); } } } $tpl->addBlock('feed'); if ($tpl->generateOutputToString($tmp_data)) $feed_data = $tmp_data; } return $feed_data; } function hook_subscribe_feed($contents, $url, $auth_login, $auth_pass) { if ($auth_login || $auth_pass) return $contents; if (preg_match('#^https?://www\.gocomics\.com/([-a-z0-9]+)$#i', $url) || preg_match("#^https?://www\.thefarside\.com#", $url)) return ''; // Get is_html() to return false. return $contents; } function hook_feed_basic_info($basic_info, $fetch_url, $owner_uid, $feed, $auth_login, $auth_pass) { if ($auth_login || $auth_pass) return $basic_info; if (preg_match('#^https?://www\.gocomics\.com/([-a-z0-9]+)$#i', $fetch_url, $matches)) $basic_info = ['title' => ucfirst($matches[1]), 'site_url' => $matches[0]]; if (preg_match("#^https?://www.thefarside.com/#", $fetch_url)) $basic_info = ['title' => "The Far Side", 'site_url' => 'https://www.thefarside.com']; return $basic_info; } function api_version() { return 2; } }