]> git.wh0rd.org - tt-rss.git/blobdiff - update_daemon2.php
Merge pull request #131 from pictuga/patch-1
[tt-rss.git] / update_daemon2.php
index 1b9e57638eecfafe2b55858b5bbdb44d81db9001..37d6b40747adfc298c2dea96ab9162a7cc450d5b 100755 (executable)
@@ -1,12 +1,10 @@
-#!/usr/bin/php
+#!/usr/bin/env php
 <?php
-       // This is an experimental multiprocess update daemon.
-       // Some configurable variable may be found below.
-
-       // define('DEFAULT_ERROR_LEVEL', E_ALL);
-       define('DEFAULT_ERROR_LEVEL', E_ERROR | E_WARNING | E_PARSE);
+       set_include_path(dirname(__FILE__) ."/include" . PATH_SEPARATOR .
+               get_include_path());
 
        declare(ticks = 1);
+       chdir(dirname(__FILE__));
 
        define('DISABLE_SESSIONS', true);
 
                define('DAEMON_EXTENDED_DEBUG', true);
        }
 
-       define('PURGE_INTERVAL', 3600); // seconds
-       define('MAX_CHILD_RUNTIME', 600); // seconds
-
+       require_once "functions.php";
+       require_once "rssfuncs.php";
        require_once "sanity_check.php";
        require_once "config.php";
+       require_once "db.php";
+       require_once "db-prefs.php";
 
+       // defaults
+       define('PURGE_INTERVAL', 3600); // seconds
+       define('MAX_CHILD_RUNTIME', 600); // seconds
        define('MAX_JOBS', 2);
-       define('SPAWN_INTERVAL', DAEMON_SLEEP_INTERVAL);
+       define('SPAWN_INTERVAL', DAEMON_SLEEP_INTERVAL); // seconds
 
        if (!function_exists('pcntl_fork')) {
                die("error: This script requires PHP compiled with PCNTL module.\n");
        }
 
-       if (!ENABLE_UPDATE_DAEMON) {
-               die("error: Please enable option ENABLE_UPDATE_DAEMON in config.php\n");
-       }
-       
-       require_once "db.php";
-       require_once "db-prefs.php";
-       require_once "functions.php";
-       require_once "lib/magpierss/rss_fetch.inc";
-
-       error_reporting(DEFAULT_ERROR_LEVEL);
+       $master_handlers_installed = false;
 
        $children = array();
        $ctimes = array();
 
                foreach ($children as $pid) {
                        if (pcntl_waitpid($pid, $status, WNOHANG) != $pid) {
-                               array_push($tmp, $pid);
+
+                               if (file_is_locked("update_daemon-$pid.lock")) {
+                                       array_push($tmp, $pid);
+                               } else {
+                                       _debug("[reap_children] child $pid seems active but lockfile is unlocked.");
+                                       unset($ctimes[$pid]);
+
+                               }
                        } else {
-                               _debug("[SIGCHLD] child $pid reaped.");
+                               _debug("[reap_children] child $pid reaped.");
                                unset($ctimes[$pid]);
                        }
                }
@@ -67,7 +67,7 @@
 
        function check_ctimes() {
                global $ctimes;
-               
+
                foreach (array_keys($ctimes) as $pid) {
                        $started = $ctimes[$pid];
 
                pcntl_waitpid(-1, $status, WNOHANG);
        }
 
+       function shutdown($caller_pid) { // Remove the master lockfile, but only when running in the process identified by $caller_pid.
+               if ($caller_pid == posix_getpid()) { // a process whose PID differs from $caller_pid (e.g. a forked task that inherited this handler) does nothing
+                       if (file_exists(LOCK_DIRECTORY . "/update_daemon.lock")) { // can run twice on one exit (called from sigint_handler and also registered as a shutdown function), so tolerate an already-removed file
+                               _debug("removing lockfile (master)...");
+                               unlink(LOCK_DIRECTORY . "/update_daemon.lock");
+                       }
+               }
+       }
+
+       function task_shutdown() { // Remove the calling process's own per-PID lockfile, if it still exists.
+               $pid = posix_getpid(); // lockfile name is keyed on the current process ID
+
+               if (file_exists(LOCK_DIRECTORY . "/update_daemon-$pid.lock")) { // the task also unlinks this file itself before a normal exit, so it may already be gone
+                       _debug("removing lockfile ($pid)...");
+                       unlink(LOCK_DIRECTORY . "/update_daemon-$pid.lock");
+               }
+       }
+
        function sigint_handler() {
-               unlink(LOCK_DIRECTORY . "/update_daemon.lock");
-               die("[SIGINT] removing lockfile and exiting.\n");
+               _debug("[MASTER] SIG_INT received.\n"); // SIGINT handler for the master process: log, drop the master lockfile, exit
+               shutdown(posix_getpid()); // pass our own PID so the PID comparison inside shutdown() matches
+               die;
+       }
+
+       function task_sigint_handler() { // SIGINT handler installed in each forked update task
+               _debug("[TASK] SIG_INT received.\n");
+               task_shutdown(); // removes this task's per-PID lockfile before exiting
+               die;
        }
 
        pcntl_signal(SIGCHLD, 'sigchld_handler');
 
+       $longopts = array("log:", // long options only; a trailing ":" marks an option that requires a value
+                       "tasks:",
+                       "interval:",
+                       "quiet",
+                       "help");
+
+       $options = getopt("", $longopts); // empty first argument: no short options are accepted
+
+       if (isset($options["help"]) ) {
+               print "Tiny Tiny RSS update daemon.\n\n";
+               print "Options:\n";
+               print "  --log FILE           - log messages to FILE\n";
+               print "  --tasks N            - amount of update tasks to spawn\n";
+               print "                         default: " . MAX_JOBS . "\n";
+               print "  --interval N         - task spawn interval\n";
+               print "                         default: " . SPAWN_INTERVAL . " seconds.\n";
+               print "  --quiet              - don't output messages to stdout\n";
+               return; // top-level return: ends the script after printing the help text
+       }
+
+       define('QUIET', isset($options['quiet'])); // true when --quiet was given; presumably consulted by _debug() - confirm
+
+       if (isset($options["tasks"])) {
+               _debug("Set to spawn " . $options["tasks"] . " children.");
+               $max_jobs = $options["tasks"]; // NOTE(review): used as given (a string from getopt); not validated as a positive integer
+       } else {
+               $max_jobs = MAX_JOBS;
+       }
+
+       if (isset($options["interval"])) {
+               _debug("Spawn interval: " . $options["interval"] . " seconds.");
+               $spawn_interval = $options["interval"]; // NOTE(review): used as given (a string from getopt); not validated as a number of seconds
+       } else {
+               $spawn_interval = SPAWN_INTERVAL;
+       }
+
+       if (isset($options["log"])) {
+               _debug("Logging to " . $options["log"]);
+               define('LOGFILE', $options["log"]); // LOGFILE is only defined when --log was supplied
+       }
+
        if (file_is_locked("update_daemon.lock")) {
                die("error: Can't create lockfile. ".
                        "Maybe another daemon is already running.\n");
        }
 
-       if (!pcntl_fork()) {
-               pcntl_signal(SIGINT, 'sigint_handler');
-
-               // Try to lock a file in order to avoid concurrent update.
-               $lock_handle = make_lockfile("update_daemon.lock");
+       // Try to lock a file in order to avoid concurrent update.
+       $lock_handle = make_lockfile("update_daemon.lock");
 
-               if (!$lock_handle) {
-                       die("error: Can't create lockfile. ".
-                               "Maybe another daemon is already running.\n");
-               }
-
-               while (true) { sleep(100); }
+       if (!$lock_handle) {
+               die("error: Can't create lockfile. ".
+                       "Maybe another daemon is already running.\n");
        }
 
        // Testing database connection.
        // It is unnecessary to start the fork loop if database is not ok.
-       $link = db_connect(DB_HOST, DB_USER, DB_PASS, DB_NAME); 
+       $link = db_connect(DB_HOST, DB_USER, DB_PASS, DB_NAME);
 
-       if (!$link) {
-               if (DB_TYPE == "mysql") {
-                       print mysql_error();
-               }
-               // PG seems to display its own errors just fine by default.             
-               return;
-       }
+       if (!init_connection($link)) die("Can't initialize db connection.\n");
+
+       $schema_version = get_schema_version($link);
 
        db_close($link);
 
        while (true) {
 
                // Since sleep is interrupted by SIGCHLD, we need another way to
-               // respect the SPAWN_INTERVAL
-               $next_spawn = $last_checkpoint + SPAWN_INTERVAL - time();
+               // respect the spawn interval
+               $next_spawn = $last_checkpoint + $spawn_interval - time();
 
-               if ($next_spawn % 10 == 0) {
+               if ($next_spawn % 60 == 0) {
                        $running_jobs = count($children);
                        _debug("[MASTER] active jobs: $running_jobs, next spawn at $next_spawn sec.");
                }
 
-               if ($last_checkpoint + SPAWN_INTERVAL < time()) {
+               if ($last_checkpoint + $spawn_interval < time()) {
+
+                       /* Check if schema version changed */
+
+                       $link = db_connect(DB_HOST, DB_USER, DB_PASS, DB_NAME);
+                       if (!init_connection($link)) die("Can't initialize db connection.\n");
+                       $test_schema_version = get_schema_version($link);
+                       db_close($link);
+
+                       if ($test_schema_version != $schema_version) {
+                               echo "Expected schema version: $schema_version, got: $test_schema_version\n";
+                               echo "Schema version changed while we were running, bailing out\n";
+                               exit(100);
+                       }
 
                        check_ctimes();
                        reap_children();
 
-                       for ($j = count($children); $j < MAX_JOBS; $j++) {
+                       for ($j = count($children); $j < $max_jobs; $j++) {
                                $pid = pcntl_fork();
                                if ($pid == -1) {
                                        die("fork failed!\n");
                                } else if ($pid) {
+
+                                       if (!$master_handlers_installed) {
+                                               _debug("[MASTER] installing shutdown handlers");
+                                               pcntl_signal(SIGINT, 'sigint_handler');
+                                               register_shutdown_function('shutdown', posix_getpid());
+                                               $master_handlers_installed = true;
+                                       }
+
                                        _debug("[MASTER] spawned client $j [PID:$pid]...");
                                        array_push($children, $pid);
                                        $ctimes[$pid] = time();
                                } else {
                                        pcntl_signal(SIGCHLD, SIG_IGN);
-                                       pcntl_signal(SIGINT, SIG_DFL);
+                                       pcntl_signal(SIGINT, 'task_sigint_handler');
+
+                                       register_shutdown_function('task_shutdown');
+
+                                       $my_pid = posix_getpid();
+                                       $lock_filename = "update_daemon-$my_pid.lock";
+
+                                       $lock_handle = make_lockfile($lock_filename);
+
+                                       if (!$lock_handle) {
+                                               die("error: Can't create lockfile ($lock_filename). ".
+                                               "Maybe another daemon is already running.\n");
+                                       }
 
                                        // ****** Updating RSS code *******
                                        // Only run in fork process.
 
                                        $start_timestamp = time();
 
-                                       $link = db_connect(DB_HOST, DB_USER, DB_PASS, DB_NAME); 
-
-                                       if (!$link) {
-                                               if (DB_TYPE == "mysql") {
-                                                       print mysql_error();
-                                               }
-                                               // PG seems to display its own errors just fine by default.             
-                                               return;
-                                       }
+                                       $link = db_connect(DB_HOST, DB_USER, DB_PASS, DB_NAME);
 
-                                       init_connection($link);
+                                       if (!init_connection($link)) return;
 
                                        // We disable stamp file, since it is of no use in a multiprocess update.
                                        // not really, tho for the time being -fox
                                        if (!make_stampfile('update_daemon.stamp')) {
-                                               print "warning: unable to create stampfile";
-                                       }       
+                                               _debug("warning: unable to create stampfile\n");
+                                       }
+
+                                       // Call to the feed batch update function
+                                       // and maybe regenerate feedbrowser cache
 
-                                       // Call to the feed batch update function 
-                                       // or regenerate feedbrowser cache
+                                       $nf = 0;
+
+                                       _debug("Waiting before update [$j]..");
+                                       sleep($j*5);
+                                       $nf = update_daemon_common($link);
 
                                        if (rand(0,100) > 50) {
-                                               update_daemon_common($link);
-                                       } else {
                                                $count = update_feedbrowser_cache($link);
-                                               _debug("Finished, $count feeds processed.");
+                                               _debug("Feedbrowser updated, $count feeds processed.");
+
+                                               purge_orphans($link, true);
+
+                                               $rc = cleanup_tags($link, 14, 50000);
+
+                                               _debug("Cleaned $rc cached tags.");
+
+                                               global $pluginhost;
+                                               $pluginhost->run_hooks($pluginhost::HOOK_UPDATE_TASK, "hook_update_task", $op);
                                        }
 
                                        _debug("Elapsed time: " . (time() - $start_timestamp) . " second(s)");
+
+                                       if ($nf > 0) {
+                                               // Report throughput for this task. Clamp the elapsed time to at least
+                                               // one second so that a sub-second run cannot cause a division by zero.
+                                               $elapsed_sec = max(1, time() - $start_timestamp);
+                                               // %.2f prints the rate with two decimals; the previous %.2d formatted it as an integer.
+                                               _debug("Feeds processed: $nf; feeds/minute: " . sprintf("%.2f", $nf / ($elapsed_sec / 60)));
+                                       }
+
                                        db_close($link);
 
                                        // We are in a fork.
                                        // We wait a little before exiting so that we do not finish faster than our parent process.
                                        sleep(1);
+
+                                       unlink(LOCK_DIRECTORY . "/$lock_filename");
+
                                        // We exit in order to avoid fork bombing.
                                        exit(0);
                                }
-
-                               // We wait a little time before the next fork, in order to let the first fork
-                               // mark the feeds it update :
-                               sleep(1);
                        }
                        $last_checkpoint = time();
                }