2008-01-23 10:19:36 +01:00
|
|
|
#!/usr/bin/php
|
|
|
|
<?php
|
2008-01-23 17:19:32 +01:00
|
|
|
// This is an experimental multiprocess update daemon.
// Some configurable variables may be found below.

// Error reporting level, applied once all includes have been loaded.
// define('DEFAULT_ERROR_LEVEL', E_ALL);
define('DEFAULT_ERROR_LEVEL', E_ERROR | E_WARNING | E_PARSE);

// Signal handlers registered with pcntl_signal() are dispatched on ticks.
declare(ticks = 1);

// Cache locations and session switch; defined before config.php is loaded.
define('MAGPIE_CACHE_DIR', '/var/tmp/magpie-ttrss-cache-daemon');
define('SIMPLEPIE_CACHE_DIR', '/var/tmp/simplepie-ttrss-cache-daemon');
define('DISABLE_SESSIONS', true);

// Upper bound on the number of worker processes tracked at the same time.
define('MAX_JOBS', 2);

require_once "version.php";

// Extended debugging is switched on for versions containing ".99"
// (presumably development builds -- confirm) or when the DAEMON_XDEBUG
// environment variable is set.
if (strpos(VERSION, ".99") !== false || getenv('DAEMON_XDEBUG')) {
    define('DAEMON_EXTENDED_DEBUG', true);
}

define('PURGE_INTERVAL', 3600); // seconds

require_once "sanity_check.php";
require_once "config.php";

// Seconds between two spawn rounds of the master loop.
define('SPAWN_INTERVAL', DAEMON_SLEEP_INTERVAL);

if (!ENABLE_UPDATE_DAEMON) {
    die("Please enable option ENABLE_UPDATE_DAEMON in config.php\n");
}

require_once "db.php";
require_once "db-prefs.php";
require_once "functions.php";
require_once "magpierss/rss_fetch.inc";

error_reporting(DEFAULT_ERROR_LEVEL);

// PIDs of the worker processes the master is currently tracking.
$children = array();

// Unix timestamp of the last spawn round; -1 makes the first round start
// immediately.
$last_checkpoint = -1;
|
|
|
|
|
2008-01-24 09:46:09 +01:00
|
|
|
/**
 * Polls every tracked worker PID without blocking and removes the ones that
 * are no longer running from the global $children list.
 *
 * A PID is kept only while pcntl_waitpid() reports 0 (child exists, no state
 * change yet). A return value equal to the PID means the child was reaped
 * here; -1 means the child is not waitable any more (for example it was
 * already collected by another waitpid call). In both cases the PID is
 * dropped, so a stale entry can never occupy a job slot forever.
 *
 * @return int number of worker processes still being tracked
 */
function reap_children() {
    global $children;

    $tmp = array();

    foreach ($children as $pid) {
        $result = pcntl_waitpid($pid, $status, WNOHANG);

        if ($result == 0) {
            // Still running: keep tracking it.
            array_push($tmp, $pid);
        } else if ($result == $pid) {
            _debug("[SIGCHLD] child $pid reaped.");
        } else {
            // waitpid failed for this PID; it is not our waitable child
            // any more, so stop counting it as an active job.
            _debug("[SIGCHLD] child $pid already gone, dropping it.");
        }
    }

    $children = $tmp;

    return count($tmp);
}
|
|
|
|
|
|
|
|
/**
 * SIGALRM handler: terminates the current process.
 *
 * The worker arms a 300 second alarm with pcntl_alarm() around each
 * update_rss_feed() call, so this firing means a single feed update did not
 * finish within that time.
 */
function sigalrm_handler() {
    die("received SIGALRM, hang in feed update?\n");
}
|
|
|
|
|
|
|
|
/**
 * SIGCHLD handler: collects terminated children and logs how many worker
 * jobs are still tracked.
 *
 * Tracked workers are handled by reap_children(). Afterwards every other
 * terminated child is collected in a non-blocking loop (several exits can be
 * delivered as a single SIGCHLD). If that catch-all pass happens to collect
 * a tracked worker, its PID is removed from $children as well so the job
 * slot is released.
 *
 * @param int $signal signal number supplied by pcntl (unused)
 */
function sigchld_handler($signal) {
    global $children;

    $running_jobs = reap_children();

    while (($pid = pcntl_waitpid(-1, $status, WNOHANG)) > 0) {
        $slot = array_search($pid, $children, true);

        if ($slot !== false) {
            unset($children[$slot]);
            // Re-index so $children stays a plain list.
            $children = array_values($children);
            $running_jobs = count($children);
        }
    }

    _debug("[SIGCHLD] jobs left: $running_jobs");
}
|
|
|
|
|
2008-01-23 10:30:55 +01:00
|
|
|
/**
 * SIGINT handler: removes the daemon lock file and terminates the process.
 *
 * The handler is installed before the lock file is created, so the file may
 * not exist yet when the signal arrives; it is only unlinked when present.
 */
function sigint_handler() {
    $lock_file = LOCK_DIRECTORY . "/update_daemon.lock";

    if (file_exists($lock_file)) {
        unlink($lock_file);
    }

    die("Received SIGINT. Exiting.\n");
}
|
|
|
|
|
2008-01-23 17:19:32 +01:00
|
|
|
pcntl_signal(SIGALRM, 'sigalrm_handler');
pcntl_signal(SIGCHLD, 'sigchld_handler');

// Refuse to start when the lock file is already held.
if (file_is_locked("update_daemon.lock")) {
    die("error: Can't create lockfile. ".
        "Maybe another daemon is already running.\n");
}

// A dedicated child creates the lock file and then sleeps forever; it also
// owns the SIGINT handler that removes the lock file again.
$lock_pid = pcntl_fork();

if ($lock_pid == -1) {
    // Without the lock holder nothing would stop a second daemon.
    die("fork failed!\n");
}

if (!$lock_pid) {
    pcntl_signal(SIGINT, 'sigint_handler');

    $lock_handle = make_lockfile("update_daemon.lock");

    if (!$lock_handle) {
        die("error: Can't create lockfile. ".
            "Maybe another daemon is already running.\n");
    }

    while (true) { sleep(100); }
}

// Testing database connection.
// It is unnecessary to start the fork loop if database is not ok.
$link = db_connect(DB_HOST, DB_USER, DB_PASS, DB_NAME);

if (!$link) {
    if (DB_TYPE == "mysql") {
        print mysql_error();
    }
    // PG seems to display its own errors just fine by default.
    return;
}

// The master does not keep a connection; every worker opens its own.
db_close($link);
|
|
|
|
|
|
|
|
|
2008-01-23 10:19:36 +01:00
|
|
|
// Master loop: once per second check whether a spawn round is due; in a
// spawn round, fill the free job slots (up to MAX_JOBS) with forked workers.
while (true) {

    $next_spawn = $last_checkpoint + SPAWN_INTERVAL - time();

    // Periodic status line, emitted when the countdown is a multiple of 10.
    if ($next_spawn % 10 == 0) {
        $running_jobs = count($children);
        _debug("[MASTER] active jobs: $running_jobs, next spawn at $next_spawn sec.");
    }

    if ($last_checkpoint + SPAWN_INTERVAL < time()) {

        reap_children();

        for ($j = count($children); $j < MAX_JOBS; $j++) {
            $pid = pcntl_fork();

            if ($pid == -1) {
                die("fork failed!\n");
            } else if ($pid) {
                _debug("[MASTER] spawned client $j [PID:$pid]...");
                array_push($children, $pid);
            } else {
                // Worker process: drop the handlers inherited from the master.
                pcntl_signal(SIGCHLD, SIG_IGN);
                pcntl_signal(SIGINT, SIG_DFL);

                // ****** Updating RSS code *******
                // Only run in fork process.

                $start_timestamp = time();

                $link = db_connect(DB_HOST, DB_USER, DB_PASS, DB_NAME);

                if (!$link) {
                    if (DB_TYPE == "mysql") {
                        print mysql_error();
                    }
                    // PG seems to display its own errors just fine by default.
                    return;
                }

                if (DB_TYPE == "pgsql") {
                    pg_query("set client_encoding = 'utf-8'");
                    pg_set_client_encoding("UNICODE");
                } else {
                    if (defined('MYSQL_CHARSET') && MYSQL_CHARSET) {
                        db_query($link, "SET NAMES " . MYSQL_CHARSET);
                        // db_query($link, "SET CHARACTER SET " . MYSQL_CHARSET);
                    }
                }

                // We disable stamp file, since it is of no use in a multiprocess update.
                // not really, tho for the time being -fox
                if (!make_stampfile('update_daemon.stamp')) {
                    print "warning: unable to create stampfile";
                }

                // $last_purge = 0;

                // if (time() - $last_purge > PURGE_INTERVAL) {

                // FIXME : $last_purge is of no use in a multiprocess update.
                // FIXME : We ALWAYS purge old posts.
                _debug("Purging old posts (random 30 feeds)...");
                global_purge_old_posts($link, true, 30);

                // $last_purge = time();
                // }

                // Process all other feeds using last_updated and interval parameters

                $random_qpart = sql_random_function();

                // Optionally restrict updates to users who logged in recently.
                if (DAEMON_UPDATE_LOGIN_LIMIT > 0) {
                    if (DB_TYPE == "pgsql") {
                        $login_thresh_qpart = "AND ttrss_users.last_login >= NOW() - INTERVAL '".DAEMON_UPDATE_LOGIN_LIMIT." days'";
                    } else {
                        $login_thresh_qpart = "AND ttrss_users.last_login >= DATE_SUB(NOW(), INTERVAL ".DAEMON_UPDATE_LOGIN_LIMIT." DAY)";
                    }
                } else {
                    $login_thresh_qpart = "";
                }

                // A feed is due when its own update_interval (minutes) has
                // elapsed, or, when that is 0, when the owner's
                // DEFAULT_UPDATE_INTERVAL preference (minutes) has elapsed.
                // NOTE(review): rows whose last_updated is NULL never satisfy
                // these comparisons -- confirm never-updated feeds cannot be NULL.
                if (DB_TYPE == "pgsql") {
                    // PostgreSQL only accepts INTERVAL '...' with a string
                    // constant, so the computed text is cast instead.
                    $update_limit_qpart = "AND ((
                            ttrss_feeds.update_interval = 0
                            AND ttrss_feeds.last_updated < NOW() - CAST((ttrss_user_prefs.value || ' minutes') AS INTERVAL)
                        ) OR (
                            ttrss_feeds.update_interval > 0
                            AND ttrss_feeds.last_updated < NOW() - CAST((ttrss_feeds.update_interval || ' minutes') AS INTERVAL)
                        ))";
                } else {
                    $update_limit_qpart = "AND ((
                            ttrss_feeds.update_interval = 0
                            AND ttrss_feeds.last_updated < DATE_SUB(NOW(), INTERVAL CONVERT(ttrss_user_prefs.value, SIGNED INTEGER) MINUTE)
                        ) OR (
                            ttrss_feeds.update_interval > 0
                            AND ttrss_feeds.last_updated < DATE_SUB(NOW(), INTERVAL ttrss_feeds.update_interval MINUTE)
                        ))";
                }

                // Skip feeds whose update was started less than 120 seconds ago.
                if (DB_TYPE == "pgsql") {
                    $updstart_thresh_qpart = "AND (ttrss_feeds.last_update_started IS NULL OR ttrss_feeds.last_update_started < NOW() - INTERVAL '120 seconds')";
                } else {
                    $updstart_thresh_qpart = "AND (ttrss_feeds.last_update_started IS NULL OR ttrss_feeds.last_update_started < DATE_SUB(NOW(), INTERVAL 120 SECOND))";
                }

                $result = db_query($link, "SELECT ttrss_feeds.feed_url,ttrss_feeds.id, ttrss_feeds.owner_uid,
                        SUBSTRING(ttrss_feeds.last_updated,1,19) AS last_updated,
                        ttrss_feeds.update_interval
                    FROM
                        ttrss_feeds, ttrss_users, ttrss_user_prefs
                    WHERE
                        ttrss_feeds.owner_uid = ttrss_users.id
                        AND ttrss_users.id = ttrss_user_prefs.owner_uid
                        AND ttrss_user_prefs.pref_name='DEFAULT_UPDATE_INTERVAL'
                        $login_thresh_qpart $update_limit_qpart
                        $updstart_thresh_qpart
                    ORDER BY $random_qpart DESC LIMIT " . DAEMON_FEED_LIMIT);

                $user_prefs_cache = array();

                _debug(sprintf("Scheduled %d feeds to update...\n", db_num_rows($result)));

                // Here is a little cache magic in order to minimize risk of double feed updates.
                $feeds_to_update = array();
                while ($line = db_fetch_assoc($result)) {
                    $feeds_to_update[$line['id']] = $line;
                }

                // We update the feed last update started date before anything else.
                // There is no lag due to feed contents downloads.
                // It prevents another process from updating the same feed.
                $feed_ids = array_keys($feeds_to_update);
                if ($feed_ids) {
                    db_query($link, sprintf("UPDATE ttrss_feeds SET last_update_started = NOW()
                        WHERE id IN (%s)", implode(',', $feed_ids)));
                }

                while ($line = array_pop($feeds_to_update)) {

                    _debug("Feed: " . $line["feed_url"] . ", " . $line["last_updated"]);

                    // Arm a 300 second alarm around each feed update; the
                    // SIGALRM handler terminates the worker if it fires.
                    pcntl_alarm(300);
                    update_rss_feed($link, $line["feed_url"], $line["id"], true);
                    pcntl_alarm(0);

                    sleep(1); // prevent flood (FIXME make this an option?)
                }

                if (DAEMON_SENDS_DIGESTS) send_headlines_digests($link);

                _debug("Elapsed time: " . (time() - $start_timestamp) . " second(s)");

                db_close($link);

                // We are in a fork.
                // We wait a little before exiting to avoid being faster than our parent process.
                sleep(1);
                // We exit in order to avoid fork bombing.
                exit(0);
            }

            // We wait a little time before the next fork, in order to let the first fork
            // mark the feeds it updates:
            sleep(1);
        }

        $last_checkpoint = time();
    }

    sleep(1);
}
|
|
|
|
|
|
|
|
?>
|