]> git.wh0rd.org - tt-rss.git/blobdiff - update_daemon2.php
reinstate error handlers; better DB error reporting on failed queries
[tt-rss.git] / update_daemon2.php
old mode 100644 (file)
new mode 100755 (executable)
index 3721a09..6d13add
-#!/usr/bin/php
+#!/usr/bin/env php
 <?php
-       // This is an experimental multiprocess update daemon
-       // It consists of the master server (this file) and
-       // client batch script (update_daemon2_client.php) which
-       // should only be run by the server process
+       set_include_path(dirname(__FILE__) ."/include" . PATH_SEPARATOR .
+               get_include_path()); // prepend this script's include/ directory to the include path
 
        declare(ticks = 1); // tick-based dispatch, so handlers registered with pcntl_signal() get invoked
+       chdir(dirname(__FILE__)); // run from the script's own directory
 
-       require "config.php";
+       define('DISABLE_SESSIONS', true); // not read in this file; presumably checked by the includes below
 
+       require_once "version.php"; // presumably defines VERSION, which is tested right below
+
+       if (strpos(VERSION, ".99") !== false || getenv('DAEMON_XDEBUG')) { // VERSION contains ".99" or DAEMON_XDEBUG is set in the environment
+               define('DAEMON_EXTENDED_DEBUG', true);
+       }
+
+       require_once "autoload.php";
+       require_once "functions.php";
+       require_once "rssfuncs.php";
+       require_once "sanity_check.php";
+       require_once "config.php"; // presumably defines DB_*, LOCK_DIRECTORY and DAEMON_SLEEP_INTERVAL used below - TODO confirm
+       require_once "db.php";
+       require_once "db-prefs.php";
+       require_once "errorhandler.php";
+
+       // defaults (MAX_JOBS and SPAWN_INTERVAL can be overridden with --tasks and --interval)
+       define('PURGE_INTERVAL', 3600); // seconds; not referenced in the visible part of this file
+       define('MAX_CHILD_RUNTIME', 600); // seconds; check_ctimes() sends SIGKILL to children older than this
        define('MAX_JOBS', 2); // default number of update children kept running
-       define('CLIENT_PROCESS', './update_daemon2_client.php SRV_RUN_OK');
-       define('SPAWN_INTERVAL', DAEMON_SLEEP_INTERVAL);
+       define('SPAWN_INTERVAL', DAEMON_SLEEP_INTERVAL); // seconds; DAEMON_SLEEP_INTERVAL is defined outside this file
+
+       if (!function_exists('pcntl_fork')) { // forking is mandatory for this daemon
+               die("error: This script requires PHP compiled with PCNTL module.\n");
+       }
+
+       $master_handlers_installed = false; // set to true once the master has registered its SIGINT/shutdown handlers
+
+       $children = array(); // PIDs of the children the master currently tracks
+       $ctimes = array(); // child PID => time() at which it was spawned
 
-       $running_jobs = 0;
        $last_checkpoint = -1; // compared with time() in the main loop; -1 makes the first spawn round due immediately
 
+       /**
+        * Refresh the master's list of tracked children.
+        *
+        * Every PID in $children is polled with a non-blocking waitpid. A child
+        * stays tracked only when it has not been reaped AND its per-process
+        * lockfile ("update_daemon-PID.lock") is still reported as locked;
+        * otherwise its spawn time is dropped from $ctimes and it is forgotten.
+        *
+        * @return int number of children still tracked after this pass
+        */
+       function reap_children() {
+               global $children, $ctimes;
+
+               $alive = array();
+
+               foreach ($children as $pid) {
+                       // waitpid returned the PID itself: the child has exited and is now reaped.
+                       if (pcntl_waitpid($pid, $status, WNOHANG) == $pid) {
+                               _debug("[reap_children] child $pid reaped.");
+                               unset($ctimes[$pid]);
+                               continue;
+                       }
+
+                       // Not reaped by this call; trust the lockfile to tell whether it is still working.
+                       if (file_is_locked("update_daemon-$pid.lock")) {
+                               $alive[] = $pid;
+                               continue;
+                       }
+
+                       _debug("[reap_children] child $pid seems active but lockfile is unlocked.");
+                       unset($ctimes[$pid]);
+               }
+
+               $children = $alive;
+
+               return count($alive);
+       }
+
+       /**
+        * Kill children that have been running for more than MAX_CHILD_RUNTIME
+        * seconds, based on the spawn times recorded in $ctimes (PID => time()).
+        *
+        * The children are only signalled here; they are removed from the
+        * bookkeeping arrays by reap_children().
+        */
+       function check_ctimes() {
+               global $ctimes;
+
+               // Walk a snapshot of the PIDs: this file runs with declare(ticks = 1),
+               // so the SIGCHLD handler may call reap_children() between any two
+               // statements of this loop and unset entries of $ctimes under us.
+               foreach (array_keys($ctimes) as $pid) {
+                       // Already reaped meanwhile: never signal a PID we no longer own.
+                       if (!isset($ctimes[$pid])) {
+                               continue;
+                       }
+
+                       $started = $ctimes[$pid];
+
+                       if (time() - $started > MAX_CHILD_RUNTIME) {
+                               _debug("[MASTER] child process $pid seems to be stuck, aborting...");
+                               posix_kill($pid, SIGKILL);
+                       }
+               }
+       }
+
        function sigchld_handler($signal) { // SIGCHLD handler (registered via pcntl_signal); $signal is not used
-               global $running_jobs;
-               if ($running_jobs > 0) $running_jobs--;
-               print posix_getpid() . ": SIGCHLD received, jobs left: $running_jobs\n";
+               $running_jobs = reap_children(); // number of children still tracked after reaping
+
+               _debug("[SIGCHLD] jobs left: $running_jobs");
+
                pcntl_waitpid(-1, $status, WNOHANG); // non-blocking wait on any child; result is discarded, $children is only updated by reap_children()
        }
 
+       /**
+        * Remove the master lockfile, but only when called from the process whose
+        * PID was passed in.
+        *
+        * The master registers this as a shutdown function with its own PID, so
+        * a process with a different PID (e.g. a forked child that inherited the
+        * registration) does nothing here.
+        *
+        * @param int $caller_pid PID of the process that is allowed to clean up
+        */
+       function shutdown($caller_pid) {
+               if ($caller_pid != posix_getpid()) {
+                       return;
+               }
+
+               $master_lock = LOCK_DIRECTORY . "/update_daemon.lock";
+
+               if (!file_exists($master_lock)) {
+                       return;
+               }
+
+               _debug("removing lockfile (master)...");
+               unlink($master_lock);
+       }
+
+       /**
+        * Remove the calling process's own lockfile
+        * (LOCK_DIRECTORY/update_daemon-PID.lock) if it still exists.
+        */
+       function task_shutdown() {
+               $pid = posix_getpid();
+               $task_lock = LOCK_DIRECTORY . "/update_daemon-$pid.lock";
+
+               if (!file_exists($task_lock)) {
+                       return;
+               }
+
+               _debug("removing lockfile ($pid)...");
+               unlink($task_lock);
+       }
+
+       /**
+        * SIGINT handler for the master process: log, drop the master lockfile
+        * and terminate the script.
+        */
+       function sigint_handler() {
+               _debug("[MASTER] SIG_INT received.\n");
+
+               $own_pid = posix_getpid();
+               shutdown($own_pid);
+
+               exit;
+       }
+
+       /**
+        * SIGINT handler for a forked update task: log, drop the task's own
+        * lockfile and terminate the script.
+        */
+       function task_sigint_handler() {
+               _debug("[TASK] SIG_INT received.\n");
+
+               task_shutdown();
+
+               exit;
+       }
+
        pcntl_signal(SIGCHLD, 'sigchld_handler');
 
+       $longopts = array("log:",
+                       "tasks:",
+                       "interval:",
+                       "quiet",
+                       "help");
+
+       $options = getopt("", $longopts);
+
+       if (isset($options["help"]) ) {
+               print "Tiny Tiny RSS update daemon.\n\n";
+               print "Options:\n";
+               print "  --log FILE           - log messages to FILE\n";
+               print "  --tasks N            - amount of update tasks to spawn\n";
+               print "                         default: " . MAX_JOBS . "\n";
+               print "  --interval N         - task spawn interval\n";
+               print "                         default: " . SPAWN_INTERVAL . " seconds.\n";
+               print "  --quiet              - don't output messages to stdout\n";
+               return;
+       }
+
+       define('QUIET', isset($options['quiet']));
+
+       // --tasks N: how many update children may run at once (default MAX_JOBS).
+       // The value comes straight from the command line, so accept it only when
+       // it is numeric and normalise it to an integer before it is used as the
+       // bound of the spawn loop. A repeated option arrives as an array and is
+       // rejected by is_numeric() as well.
+       if (isset($options["tasks"]) && is_numeric($options["tasks"])) {
+               $max_jobs = (int) $options["tasks"];
+               _debug("Set to spawn " . $max_jobs . " children.");
+       } else {
+               if (isset($options["tasks"])) {
+                       _debug("warning: ignoring invalid --tasks value, using default: " . MAX_JOBS);
+               }
+               $max_jobs = MAX_JOBS;
+       }
+
+       // --interval N: seconds between spawn rounds (default SPAWN_INTERVAL).
+       // Validated like --tasks because it is added to a timestamp in the main loop.
+       if (isset($options["interval"]) && is_numeric($options["interval"])) {
+               $spawn_interval = (int) $options["interval"];
+               _debug("Spawn interval: " . $spawn_interval . " seconds.");
+       } else {
+               if (isset($options["interval"])) {
+                       _debug("warning: ignoring invalid --interval value, using default: " . SPAWN_INTERVAL);
+               }
+               $spawn_interval = SPAWN_INTERVAL;
+       }
+
+       // --log FILE: expose the log target as the LOGFILE constant.
+       if (isset($options["log"])) {
+               _debug("Logging to " . $options["log"]);
+               define('LOGFILE', $options["log"]);
+       }
+
+       if (file_is_locked("update_daemon.lock")) { // master lockfile reported as locked: refuse to start (presumably another daemon holds it)
+               die("error: Can't create lockfile. ".
+                       "Maybe another daemon is already running.\n");
+       }
+
+       // Try to lock a file in order to avoid concurrent update.
+       $lock_handle = make_lockfile("update_daemon.lock"); // a falsy result is treated as failure right below
+
+       if (!$lock_handle) {
+               die("error: Can't create lockfile. ".
+                       "Maybe another daemon is already running.\n");
+       }
+
+       // Testing database connection.
+       // It is unnecessary to start the fork loop if database is not ok.
+       $link = db_connect(DB_HOST, DB_USER, DB_PASS, DB_NAME);
+
+       if (!init_plugins($link)) die("Can't initialize db connection.\n");
+
+       $schema_version = get_schema_version($link); // remembered; the main loop compares it again before each spawn round
+
+       db_close($link); // this connection is used for the startup check only
+
+       if ($schema_version != SCHEMA_VERSION) { // database schema does not match what this code expects
+               die("Schema version is wrong, please upgrade the database.\n");
+       }
+
        while (true) {
 
-               $next_spawn = $last_checkpoint + SPAWN_INTERVAL - time();
+               // Since sleep is interrupted by SIGCHLD, we need another way to
+               // respect the spawn interval
+               $next_spawn = $last_checkpoint + $spawn_interval - time();
+
+               if ($next_spawn % 60 == 0) {
+                       $running_jobs = count($children);
+                       _debug("[MASTER] active jobs: $running_jobs, next spawn at $next_spawn sec.");
+               }
+
+               if ($last_checkpoint + $spawn_interval < time()) {
 
-               print "[MASTER] active jobs: $running_jobs, next spawn at $next_spawn sec\n";
+                       /* Check if schema version changed */
 
-               if ($last_checkpoint + SPAWN_INTERVAL < time()) {
+                       $link = db_connect(DB_HOST, DB_USER, DB_PASS, DB_NAME);
+                       if (!init_plugins($link)) die("Can't initialize db connection.\n");
+                       $test_schema_version = get_schema_version($link);
+                       db_close($link);
 
-                       for ($j = $running_jobs; $j < MAX_JOBS; $j++) {
-                               print "[MASTER] spawning client $j...";
+                       if ($test_schema_version != $schema_version) {
+                               echo "Expected schema version: $schema_version, got: $test_schema_version\n";
+                               echo "Schema version changed while we were running, bailing out\n";
+                               exit(100);
+                       }
+
+                       check_ctimes();
+                       reap_children();
+
+                       for ($j = count($children); $j < $max_jobs; $j++) {
                                $pid = pcntl_fork();
                                if ($pid == -1) {
                                        die("fork failed!\n");
                                } else if ($pid) {
-                                       $running_jobs++;
-                                       print "OK [$running_jobs]\n";
+
+                                       if (!$master_handlers_installed) {
+                                               _debug("[MASTER] installing shutdown handlers");
+                                               pcntl_signal(SIGINT, 'sigint_handler');
+                                               register_shutdown_function('shutdown', posix_getpid());
+                                               $master_handlers_installed = true;
+                                       }
+
+                                       _debug("[MASTER] spawned client $j [PID:$pid]...");
+                                       array_push($children, $pid);
+                                       $ctimes[$pid] = time();
                                } else {
                                        pcntl_signal(SIGCHLD, SIG_IGN);
-                                       passthru(CLIENT_PROCESS);
+                                       pcntl_signal(SIGINT, 'task_sigint_handler');
+
+                                       register_shutdown_function('task_shutdown');
+
+                                       $my_pid = posix_getpid();
+                                       $lock_filename = "update_daemon-$my_pid.lock";
+
+                                       $lock_handle = make_lockfile($lock_filename);
+
+                                       if (!$lock_handle) {
+                                               die("error: Can't create lockfile ($lock_filename). ".
+                                               "Maybe another daemon is already running.\n");
+                                       }
+
+                                       // ****** Updating RSS code *******
+                                       // Only run in fork process.
+
+                                       $start_timestamp = time();
+
+                                       $link = db_connect(DB_HOST, DB_USER, DB_PASS, DB_NAME);
+
+                                       if (!init_plugins($link)) return;
+
+                                       // We disable stamp file, since it is of no use in a multiprocess update.
+                                       // not really, tho for the time being -fox
+                                       if (!make_stampfile('update_daemon.stamp')) {
+                                               _debug("warning: unable to create stampfile\n");
+                                       }
+
+                                       // Call to the feed batch update function
+                                       // and maybe regenerate feedbrowser cache
+
+                                       $nf = 0;
+
+                                       _debug("Waiting before update [$j]..");
+                                       sleep($j*5);
+                                       $nf = update_daemon_common($link);
+
+                                       if (rand(0,100) > 50) {
+                                               $count = update_feedbrowser_cache($link);
+                                               _debug("Feedbrowser updated, $count feeds processed.");
+
+                                               purge_orphans($link, true);
+
+                                               $rc = cleanup_tags($link, 14, 50000);
+
+                                               _debug("Cleaned $rc cached tags.");
+
+                                               global $pluginhost;
+                                               $pluginhost->run_hooks($pluginhost::HOOK_UPDATE_TASK, "hook_update_task", $op);
+                                       }
+
+                                       _debug("Elapsed time: " . (time() - $start_timestamp) . " second(s)");
+
+                                       if ($nf > 0) {
+                                               _debug("Feeds processed: $nf");
+
+                                               if (time() - $start_timestamp > 0) {
+                                                       _debug("Feeds/minute: " . sprintf("%.2d", $nf/((time()-$start_timestamp)/60)));
+                                               }
+                                       }
+
+                                       db_close($link);
+
+                                       // We are in a fork.
+                                       // We wait a little before exiting to avoid being faster than our parent process.
+                                       sleep(1);
+
+                                       unlink(LOCK_DIRECTORY . "/$lock_filename");
+
+                                       // We exit in order to avoid fork bombing.
                                        exit(0);
                                }
                        }