ttrss/functions.php

197 lines
5.0 KiB
PHP
Raw Normal View History

2005-08-21 15:35:22 +00:00
<?
require_once 'config.php';
2005-08-22 06:13:33 +00:00
/**
 * Refreshes feeds registered in ttrss_feeds.
 *
 * When $fetch is false, only feeds that have never been updated, have an
 * empty title, or whose last update is older than MIN_UPDATE_TIME seconds
 * are refreshed. When $fetch is true, every feed is refreshed.
 *
 * No transaction is opened here: update_rss_feed() issues its own
 * BEGIN/COMMIT for each feed, and PostgreSQL does not nest transactions
 * (a second BEGIN only raises a warning and the inner COMMIT would end
 * the outer transaction as well).
 *
 * @param resource $link  PostgreSQL connection handle.
 * @param bool     $fetch Force a refresh of all feeds when true.
 * @return int Sum of the values returned by update_rss_feed() for the
 *             processed feeds; 0 when the feed list could not be read.
 */
function update_all_feeds($link, $fetch) {

	if (!$fetch) {
		$result = pg_query($link, "SELECT feed_url,id FROM ttrss_feeds WHERE
			last_updated is null OR title = '' OR
			EXTRACT(EPOCH FROM NOW()) - EXTRACT(EPOCH FROM last_updated) > " .
			MIN_UPDATE_TIME);
	} else {
		$result = pg_query($link, "SELECT feed_url,id FROM ttrss_feeds");
	}

	$num_unread = 0;

	// pg_query() returns false on failure; there is nothing to iterate then.
	if (!$result) {
		return $num_unread;
	}

	while ($line = pg_fetch_assoc($result)) {
		// The cast keeps the sum numeric even if the callee returns nothing.
		$num_unread += (int) update_rss_feed($link, $line["feed_url"], $line["id"]);
	}

	return $num_unread;
}
/**
 * Fetches a single feed and synchronises its items into ttrss_entries.
 *
 * The feed title is filled in from the channel when none is registered yet.
 * Each item is then either inserted (unknown guid) or updated (known guid),
 * inside one transaction on $link. Items lacking a title, link or content
 * are skipped.
 *
 * All values taken from the remote feed are escaped before being placed in
 * SQL, because feed content is untrusted input.
 *
 * @param resource $link     PostgreSQL connection handle.
 * @param string   $feed_url URL handed to fetch_rss().
 * @param mixed    $feed     Id of the feed's row in ttrss_feeds.
 * @return int Number of entries successfully inserted or updated; 0 when
 *             the feed could not be fetched.
 */
function update_rss_feed($link, $feed_url, $feed) {

	// Silence whatever fetch_rss() emits, then switch to the fixed level
	// this file has always left active afterwards.
	error_reporting(0);
	$rss = fetch_rss($feed_url);
	error_reporting (E_ERROR | E_WARNING | E_PARSE);

	$num_unread = 0;

	if (!$rss) {
		return $num_unread;
	}

	$feed_id = pg_escape_string($link, (string) $feed);

	$result = pg_query($link, "SELECT title FROM ttrss_feeds WHERE id = '$feed_id'");

	$registered_title = "";
	if ($result && pg_num_rows($result) > 0) {
		$registered_title = pg_fetch_result($result, 0, "title");
	}

	if (!$registered_title) {
		$feed_title = isset($rss->channel["title"])
			? pg_escape_string($link, $rss->channel["title"]) : "";
		pg_query($link, "UPDATE ttrss_feeds SET title = '$feed_title' WHERE id = '$feed_id'");
	}

	pg_query($link, "BEGIN");

	foreach ($rss->items as $item) {

		// guid preference: id, then guid, then link
		$entry_guid = isset($item["id"]) ? $item["id"] : "";
		if (!$entry_guid && isset($item["guid"])) $entry_guid = $item["guid"];
		if (!$entry_guid && isset($item["link"])) $entry_guid = $item["link"];

		$rss_2_date = isset($item['pubdate']) ? $item['pubdate'] : "";
		$rss_1_date = isset($item['dc']['date']) ? $item['dc']['date'] : "";
		$atom_date = isset($item['issued']) ? $item['issued'] : "";

		$entry_timestamp = "";
		$no_orig_date = 'false';

		// later assignments win: pubdate over dc:date over issued
		if ($atom_date != "") $entry_timestamp = parse_w3cdtf($atom_date);
		if ($rss_1_date != "") $entry_timestamp = parse_w3cdtf($rss_1_date);
		if ($rss_2_date != "") $entry_timestamp = strtotime($rss_2_date);

		// no usable date in the item: fall back to now and remember that
		if ($entry_timestamp == "") {
			$entry_timestamp = time();
			$no_orig_date = 'true';
		}

		if (!$entry_timestamp) continue;

		$raw_title = isset($item["title"]) ? $item["title"] : "";
		$raw_link = isset($item["link"]) ? $item["link"] : "";

		if (!$raw_title) continue;
		if (!$raw_link) continue;

		$raw_content = isset($item["description"]) ? $item["description"] : "";
		if (!$raw_content && isset($item["content"])) $raw_content = $item["content"];
		if (!$raw_content) continue;

		$entry_content = pg_escape_string($link, $raw_content);
		$entry_title = pg_escape_string($link, $raw_title);
		$entry_link = pg_escape_string($link, $raw_link);
		$entry_guid = pg_escape_string($link, $entry_guid);

		// Hash the escaped content, as before, so the value stays
		// comparable with md5_hash values already stored.
		$content_md5 = md5($entry_content);

		$entry_timestamp_fmt = date("Y/m/d H:i:s", $entry_timestamp);

		$result = pg_query($link, "
			SELECT
				id,unread,md5_hash,last_read,no_orig_date,title,
				EXTRACT(EPOCH FROM updated) as updated_timestamp
			FROM
				ttrss_entries
			WHERE
				guid = '$entry_guid'");

		if (!$result) continue;

		if (pg_num_rows($result) == 0) {

			$query = "INSERT INTO ttrss_entries
					(title, guid, link, updated, content, feed_id,
						md5_hash, no_orig_date)
				VALUES
					('$entry_title', '$entry_guid', '$entry_link',
						'$entry_timestamp_fmt', '$entry_content', '$feed_id',
						'$content_md5', $no_orig_date)";

			$result = pg_query($link, $query);

			if ($result) ++$num_unread;

		} else {

			$entry_id = pg_fetch_result($result, 0, "id");
			$last_read = pg_fetch_result($result, 0, "last_read");
			$unread = pg_fetch_result($result, 0, "unread");
			$md5_hash = pg_fetch_result($result, 0, "md5_hash");
			$stored_no_orig_date = pg_fetch_result($result, 0, "no_orig_date");
			$orig_title = pg_fetch_result($result, 0, "title");

			// Optional SET fragments; reset for every item so that a value
			// built for a previous item can never leak into this UPDATE.
			$last_read_qpart = '';
			$update_timestamp_qpart = '';
			$update_md5_qpart = '';

			// disable update detection for posts which didn't have correct
			// publishment date, because they will always register as updated
			// sadly this doesn't catch feed generators which input current date
			// in posts all the time (some planets do this)
			if ($stored_no_orig_date != 't' && (!$last_read || $md5_hash != $content_md5)) {
				$last_read_qpart = 'last_read = null,';
			}

			// mark post as updated on title change
			// maybe we should mark it as unread instead?
			// Compare against the raw title: the stored title is unescaped,
			// so comparing the escaped form would flag every quoted title.
			if ($orig_title != $raw_title) {
				$last_read_qpart = 'last_read = null,';
			}

			// don't bother updating timestamps on posts with broken pubDate
			if ($stored_no_orig_date != 't') {
				$update_timestamp_qpart = "updated = '$entry_timestamp_fmt',";
			}

			if ($content_md5 != $md5_hash) {
				$update_md5_qpart = "md5_hash = '$content_md5',";
			}

			$query = "UPDATE ttrss_entries
				SET
					title ='$entry_title',
					link = '$entry_link',
					$update_timestamp_qpart
					$last_read_qpart
					$update_md5_qpart
					content = '$entry_content',
					unread = '$unread'
				WHERE
					id = '$entry_id'";

			$result = pg_query($link, $query);

			if ($result) ++$num_unread;
		}
	}

	// $result is the outcome of the last query issued above; only stamp the
	// feed when that query succeeded, and only stamp this feed's row.
	if ($result) {
		$result = pg_query($link,
			"UPDATE ttrss_feeds SET last_updated = NOW() WHERE id = '$feed_id'");
	}

	pg_query($link, "COMMIT");

	return $num_unread;
}
?>