2015-07-06 20:02:21 +00:00
|
|
|
<?php
|
|
|
|
class Af_Readability extends Plugin {
|
|
|
|
|
|
|
|
private $host;
|
|
|
|
|
|
|
|
function about() {
|
|
|
|
return array(1.0,
|
|
|
|
"Try to inline article content using Readability",
|
|
|
|
"fox");
|
|
|
|
}
|
|
|
|
|
|
|
|
function save() {
|
|
|
|
//
|
|
|
|
}
|
|
|
|
|
|
|
|
function init($host)
|
|
|
|
{
|
|
|
|
$this->host = $host;
|
|
|
|
|
|
|
|
$host->add_hook($host::HOOK_ARTICLE_FILTER, $this);
|
|
|
|
$host->add_hook($host::HOOK_PREFS_TAB, $this);
|
|
|
|
$host->add_hook($host::HOOK_PREFS_EDIT_FEED, $this);
|
|
|
|
$host->add_hook($host::HOOK_PREFS_SAVE_FEED, $this);
|
2015-08-12 09:16:07 +00:00
|
|
|
|
|
|
|
$host->add_filter_action($this, "action_inline", __("Inline content"));
|
2015-07-06 20:02:21 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
function hook_prefs_tab($args) {
|
|
|
|
if ($args != "prefFeeds") return;
|
|
|
|
|
|
|
|
print "<div dojoType=\"dijit.layout.AccordionPane\" title=\"".__('af_readability settings')."\">";
|
|
|
|
|
|
|
|
print_notice("Enable the plugin for specific feeds in the feed editor.");
|
|
|
|
|
|
|
|
$enabled_feeds = $this->host->get($this, "enabled_feeds");
|
|
|
|
if (!array($enabled_feeds)) $enabled_feeds = array();
|
|
|
|
|
|
|
|
$enabled_feeds = $this->filter_unknown_feeds($enabled_feeds);
|
|
|
|
$this->host->set($this, "enabled_feeds", $enabled_feeds);
|
|
|
|
|
|
|
|
if (count($enabled_feeds) > 0) {
|
|
|
|
print "<h3>" . __("Currently enabled for (click to edit):") . "</h3>";
|
|
|
|
|
|
|
|
print "<ul class=\"browseFeedList\" style=\"border-width : 1px\">";
|
|
|
|
foreach ($enabled_feeds as $f) {
|
|
|
|
print "<li>" .
|
|
|
|
"<img src='images/pub_set.png'
|
|
|
|
style='vertical-align : middle'> <a href='#'
|
|
|
|
onclick='editFeed($f)'>".
|
|
|
|
getFeedTitle($f) . "</a></li>";
|
|
|
|
}
|
|
|
|
print "</ul>";
|
|
|
|
}
|
|
|
|
|
|
|
|
print "</div>";
|
|
|
|
}
|
|
|
|
|
|
|
|
function hook_prefs_edit_feed($feed_id) {
|
|
|
|
print "<div class=\"dlgSec\">".__("Readability")."</div>";
|
|
|
|
print "<div class=\"dlgSecCont\">";
|
|
|
|
|
|
|
|
$enabled_feeds = $this->host->get($this, "enabled_feeds");
|
|
|
|
if (!array($enabled_feeds)) $enabled_feeds = array();
|
|
|
|
|
|
|
|
$key = array_search($feed_id, $enabled_feeds);
|
|
|
|
$checked = $key !== FALSE ? "checked" : "";
|
|
|
|
|
|
|
|
print "<hr/><input dojoType=\"dijit.form.CheckBox\" type=\"checkbox\" id=\"af_readability_enabled\"
|
|
|
|
name=\"af_readability_enabled\"
|
|
|
|
$checked> <label for=\"af_readability_enabled\">".__('Inline article content')."</label>";
|
|
|
|
|
|
|
|
print "</div>";
|
|
|
|
}
|
|
|
|
|
|
|
|
function hook_prefs_save_feed($feed_id) {
|
|
|
|
$enabled_feeds = $this->host->get($this, "enabled_feeds");
|
|
|
|
if (!is_array($enabled_feeds)) $enabled_feeds = array();
|
|
|
|
|
|
|
|
$enable = checkbox_to_sql_bool($_POST["af_readability_enabled"]) == 'true';
|
|
|
|
$key = array_search($feed_id, $enabled_feeds);
|
|
|
|
|
|
|
|
if ($enable) {
|
|
|
|
if ($key === FALSE) {
|
|
|
|
array_push($enabled_feeds, $feed_id);
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
if ($key !== FALSE) {
|
|
|
|
unset($enabled_feeds[$key]);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
$this->host->set($this, "enabled_feeds", $enabled_feeds);
|
|
|
|
}
|
|
|
|
|
2015-08-12 09:16:07 +00:00
|
|
|
function hook_article_filter_action($article, $action) {
|
|
|
|
return $this->process_article($article);
|
|
|
|
}
|
2015-07-06 20:02:21 +00:00
|
|
|
|
2015-08-12 09:16:07 +00:00
|
|
|
function process_article($article) {
|
2015-07-06 20:02:21 +00:00
|
|
|
|
2015-07-08 10:44:45 +00:00
|
|
|
if (!class_exists("Readability")) require_once(dirname(dirname(__DIR__)). "/lib/readability/Readability.php");
|
2015-07-06 20:02:21 +00:00
|
|
|
|
2015-11-20 10:34:52 +00:00
|
|
|
if (!defined('NO_CURL') && function_exists('curl_init') && !ini_get("open_basedir")) {
|
|
|
|
|
2015-07-08 07:35:19 +00:00
|
|
|
$ch = curl_init($article["link"]);
|
2015-11-20 10:34:52 +00:00
|
|
|
|
2015-07-08 07:35:19 +00:00
|
|
|
curl_setopt($ch, CURLOPT_TIMEOUT, 5);
|
|
|
|
curl_setopt($ch, CURLOPT_RETURNTRANSFER, 1);
|
|
|
|
curl_setopt($ch, CURLOPT_HEADER, true);
|
|
|
|
curl_setopt($ch, CURLOPT_NOBODY, true);
|
2015-11-20 10:34:52 +00:00
|
|
|
curl_setopt($ch, CURLOPT_FOLLOWLOCATION, true);
|
2015-07-08 07:35:19 +00:00
|
|
|
curl_setopt($ch, CURLOPT_USERAGENT, SELF_USER_AGENT);
|
|
|
|
|
|
|
|
@$result = curl_exec($ch);
|
|
|
|
$content_type = curl_getinfo($ch, CURLINFO_CONTENT_TYPE);
|
|
|
|
|
|
|
|
if (strpos($content_type, "text/html") === FALSE)
|
|
|
|
return $article;
|
|
|
|
}
|
|
|
|
|
2015-07-06 20:02:21 +00:00
|
|
|
$tmp = fetch_file_contents($article["link"]);
|
|
|
|
|
2015-10-06 11:12:22 +00:00
|
|
|
if ($tmp && mb_strlen($tmp) < 65535 * 4) {
|
2015-07-07 07:15:08 +00:00
|
|
|
$tmpdoc = new DOMDocument("1.0", "UTF-8");
|
2015-07-08 07:35:19 +00:00
|
|
|
|
|
|
|
if (!$tmpdoc->loadHTML($tmp))
|
|
|
|
return $article;
|
2015-07-07 07:15:08 +00:00
|
|
|
|
2015-07-13 16:24:59 +00:00
|
|
|
if (strtolower($tmpdoc->encoding) != 'utf-8') {
|
2015-07-07 07:15:08 +00:00
|
|
|
$tmpxpath = new DOMXPath($tmpdoc);
|
|
|
|
|
|
|
|
foreach ($tmpxpath->query("//meta") as $elem) {
|
|
|
|
$elem->parentNode->removeChild($elem);
|
|
|
|
}
|
|
|
|
|
|
|
|
$tmp = $tmpdoc->saveHTML();
|
|
|
|
}
|
|
|
|
|
2015-07-06 20:02:21 +00:00
|
|
|
$r = new Readability($tmp, $article["link"]);
|
|
|
|
|
|
|
|
if ($r->init()) {
|
2015-07-06 20:29:00 +00:00
|
|
|
|
|
|
|
$tmpxpath = new DOMXPath($r->dom);
|
|
|
|
|
|
|
|
$entries = $tmpxpath->query('(//a[@href]|//img[@src])');
|
|
|
|
|
|
|
|
foreach ($entries as $entry) {
|
|
|
|
if ($entry->hasAttribute("href")) {
|
|
|
|
$entry->setAttribute("href",
|
2015-07-06 20:38:02 +00:00
|
|
|
rewrite_relative_url($article["link"], $entry->getAttribute("href")));
|
2015-07-06 20:29:00 +00:00
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
if ($entry->hasAttribute("src")) {
|
|
|
|
$entry->setAttribute("src",
|
2015-07-06 20:38:02 +00:00
|
|
|
rewrite_relative_url($article["link"], $entry->getAttribute("src")));
|
2015-07-06 20:29:00 +00:00
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
}
|
|
|
|
|
2015-07-06 20:02:21 +00:00
|
|
|
$article["content"] = $r->articleContent->innerHTML;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return $article;
|
2015-08-12 09:16:07 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
function hook_article_filter($article) {
|
|
|
|
|
|
|
|
$enabled_feeds = $this->host->get($this, "enabled_feeds");
|
|
|
|
$key = array_search($article["feed"]["id"], $enabled_feeds);
|
|
|
|
if ($key === FALSE) return $article;
|
|
|
|
|
|
|
|
return $this->process_article($article);
|
2015-07-06 20:02:21 +00:00
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
function api_version() {
|
|
|
|
return 2;
|
|
|
|
}
|
|
|
|
|
|
|
|
private function filter_unknown_feeds($enabled_feeds) {
|
|
|
|
$tmp = array();
|
|
|
|
|
|
|
|
foreach ($enabled_feeds as $feed) {
|
|
|
|
|
|
|
|
$result = db_query("SELECT id FROM ttrss_feeds WHERE id = '$feed' AND owner_uid = " . $_SESSION["uid"]);
|
|
|
|
|
|
|
|
if (db_num_rows($result) != 0) {
|
|
|
|
array_push($tmp, $feed);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return $tmp;
|
|
|
|
}
|
|
|
|
|
|
|
|
}
|
|
|
|
?>
|