From e856ab9a09c74e621b2df5a7d325d71575f06b5e Mon Sep 17 00:00:00 2001 From: Michael Date: Sun, 27 Nov 2016 00:55:05 +0000 Subject: [PATCH 1/7] The worker can now run from the frontend as well --- boot.php | 4 + doc/htconfig.md | 1 + include/poller.php | 243 +++++++++++++++++++++++++++------------------ index.php | 4 + mod/worker.php | 38 +++++++ 5 files changed, 196 insertions(+), 94 deletions(-) create mode 100644 mod/worker.php diff --git a/boot.php b/boot.php index b44c063f8..866e7165c 100644 --- a/boot.php +++ b/boot.php @@ -1385,6 +1385,10 @@ class App { function proc_run($args) { + if (!function_exists("proc_open")) { + return; + } + // Add the php path if it is a php call if (count($args) && ($args[0] === 'php' OR !is_string($args[0]))) { diff --git a/doc/htconfig.md b/doc/htconfig.md index b6f98b2ef..8e0b89092 100644 --- a/doc/htconfig.md +++ b/doc/htconfig.md @@ -29,6 +29,7 @@ Example: To set the directory value please add this line to your .htconfig.php: * disable_email_validation (Boolean) - Disables the check if a mail address is in a valid format and can be resolved via DNS. * disable_url_validation (Boolean) - Disables the DNS lookup of an URL. * event_input_format - Default value is "ymd". +* frontend_worker (Boolean) - Activates the frontend worker which acts as a replacement for running the poller via the command line. * ignore_cache (Boolean) - For development only. Disables the item cache. * like_no_comment (Boolean) - Don't update the "commented" value of an item when it is liked. * local_block (Boolean) - Used in conjunction with "block_public". 
diff --git a/include/poller.php b/include/poller.php index 2e036247e..b4f5df4bf 100644 --- a/include/poller.php +++ b/include/poller.php @@ -15,7 +15,7 @@ use \Friendica\Core\PConfig; require_once("boot.php"); -function poller_run(&$argv, &$argc){ +function poller_run($argv, $argc){ global $a, $db; if(is_null($a)) { @@ -35,8 +35,6 @@ function poller_run(&$argv, &$argc){ $a->start_process(); - $mypid = getmypid(); - if ($a->max_processes_reached()) return; @@ -53,14 +51,7 @@ function poller_run(&$argv, &$argc){ } if(($argc <= 1) OR ($argv[1] != "no_cron")) { - // Run the cron job that calls all other jobs - proc_run(PRIORITY_MEDIUM, "include/cron.php"); - - // Run the cronhooks job separately from cron for being able to use a different timing - proc_run(PRIORITY_MEDIUM, "include/cronhooks.php"); - - // Cleaning dead processes - poller_kill_stale_workers(); + poller_run_cron(); } else // Sleep four seconds before checking for running processes again to avoid having too many workers sleep(4); @@ -69,95 +60,18 @@ function poller_run(&$argv, &$argc){ if (poller_too_much_workers()) return; - $cooldown = Config::get("system", "worker_cooldown", 0); - $starttime = time(); while ($r = poller_worker_process()) { - // Quit when in maintenance - if (get_config('system', 'maintenance', true)) - return; - - // Constantly check the number of parallel database processes - if ($a->max_processes_reached()) - return; - - // Constantly check the number of available database connections to let the frontend be accessible at any time - if (poller_max_connections_reached()) - return; - // Count active workers and compare them with a maximum value that depends on the load - if (poller_too_much_workers()) + if (poller_too_much_workers()) { return; - - $upd = q("UPDATE `workerqueue` SET `executed` = '%s', `pid` = %d WHERE `id` = %d AND `pid` = 0", - dbesc(datetime_convert()), - intval($mypid), - intval($r[0]["id"])); - - if (!$upd) { - logger("Couldn't update queue entry ".$r[0]["id"]." 
- skip this execution", LOGGER_DEBUG); - q("COMMIT"); - continue; } - // Assure that there are no tasks executed twice - $id = q("SELECT `pid`, `executed` FROM `workerqueue` WHERE `id` = %d", intval($r[0]["id"])); - if (!$id) { - logger("Queue item ".$r[0]["id"]." vanished - skip this execution", LOGGER_DEBUG); - q("COMMIT"); - continue; - } elseif ((strtotime($id[0]["executed"]) <= 0) OR ($id[0]["pid"] == 0)) { - logger("Entry for queue item ".$r[0]["id"]." wasn't stored - skip this execution", LOGGER_DEBUG); - q("COMMIT"); - continue; - } elseif ($id[0]["pid"] != $mypid) { - logger("Queue item ".$r[0]["id"]." is to be executed by process ".$id[0]["pid"]." and not by me (".$mypid.") - skip this execution", LOGGER_DEBUG); - q("COMMIT"); - continue; + if (!poller_execute($r[0])) { + return; } - q("COMMIT"); - - $argv = json_decode($r[0]["parameter"]); - - $argc = count($argv); - - // Check for existance and validity of the include file - $include = $argv[0]; - - if (!validate_include($include)) { - logger("Include file ".$argv[0]." is not valid!"); - q("DELETE FROM `workerqueue` WHERE `id` = %d", intval($r[0]["id"])); - continue; - } - - require_once($include); - - $funcname = str_replace(".php", "", basename($argv[0]))."_run"; - - if (function_exists($funcname)) { - logger("Process ".$mypid." - Prio ".$r[0]["priority"]." - ID ".$r[0]["id"].": ".$funcname." ".$r[0]["parameter"]); - - // For better logging create a new process id for every worker call - // But preserve the old one for the worker - $old_process_id = $a->process_id; - $a->process_id = uniqid("wrk", true); - - $funcname($argv, $argc); - - $a->process_id = $old_process_id; - - if ($cooldown > 0) { - logger("Process ".$mypid." - Prio ".$r[0]["priority"]." - ID ".$r[0]["id"].": ".$funcname." - in cooldown for ".$cooldown." seconds"); - sleep($cooldown); - } - - logger("Process ".$mypid." - Prio ".$r[0]["priority"]." - ID ".$r[0]["id"].": ".$funcname." 
- done"); - - q("DELETE FROM `workerqueue` WHERE `id` = %d", intval($r[0]["id"])); - } else - logger("Function ".$funcname." does not exist"); // Quit the poller once every hour if (time() > ($starttime + 3600)) @@ -166,6 +80,108 @@ function poller_run(&$argv, &$argc){ } +/** + * @brief Execute a worker entry + * + * @param array $queue Workerqueue entry + * + * @return boolean "false" if further processing should be stopped + */ +function poller_execute($queue) { + + $a = get_app(); + + $mypid = getmypid(); + + $cooldown = Config::get("system", "worker_cooldown", 0); + + // Quit when in maintenance + if (get_config('system', 'maintenance', true)) { + return false; + } + + // Constantly check the number of parallel database processes + if ($a->max_processes_reached()) { + return false; + } + + // Constantly check the number of available database connections to let the frontend be accessible at any time + if (poller_max_connections_reached()) { + return false; + } + + $upd = q("UPDATE `workerqueue` SET `executed` = '%s', `pid` = %d WHERE `id` = %d AND `pid` = 0", + dbesc(datetime_convert()), + intval($mypid), + intval($queue["id"])); + + if (!$upd) { + logger("Couldn't update queue entry ".$queue["id"]." - skip this execution", LOGGER_DEBUG); + q("COMMIT"); + return true; + } + + // Assure that there are no tasks executed twice + $id = q("SELECT `pid`, `executed` FROM `workerqueue` WHERE `id` = %d", intval($queue["id"])); + if (!$id) { + logger("Queue item ".$queue["id"]." vanished - skip this execution", LOGGER_DEBUG); + q("COMMIT"); + return true; + } elseif ((strtotime($id[0]["executed"]) <= 0) OR ($id[0]["pid"] == 0)) { + logger("Entry for queue item ".$queue["id"]." wasn't stored - skip this execution", LOGGER_DEBUG); + q("COMMIT"); + return true; + } elseif ($id[0]["pid"] != $mypid) { + logger("Queue item ".$queue["id"]." is to be executed by process ".$id[0]["pid"]." 
and not by me (".$mypid.") - skip this execution", LOGGER_DEBUG); + q("COMMIT"); + return true; + } + q("COMMIT"); + + $argv = json_decode($queue["parameter"]); + + $argc = count($argv); + + // Check for existence and validity of the include file + $include = $argv[0]; + + if (!validate_include($include)) { + logger("Include file ".$argv[0]." is not valid!"); + q("DELETE FROM `workerqueue` WHERE `id` = %d", intval($queue["id"])); + return true; + } + + require_once($include); + + $funcname = str_replace(".php", "", basename($argv[0]))."_run"; + + if (function_exists($funcname)) { + logger("Process ".$mypid." - Prio ".$queue["priority"]." - ID ".$queue["id"].": ".$funcname." ".$queue["parameter"]); + + // For better logging create a new process id for every worker call + // But preserve the old one for the worker + $old_process_id = $a->process_id; + $a->process_id = uniqid("wrk", true); + + $funcname($argv, $argc); + + $a->process_id = $old_process_id; + + if ($cooldown > 0) { + logger("Process ".$mypid." - Prio ".$queue["priority"]." - ID ".$queue["id"].": ".$funcname." - in cooldown for ".$cooldown." seconds"); + sleep($cooldown); + } + + logger("Process ".$mypid." - Prio ".$queue["priority"]." - ID ".$queue["id"].": ".$funcname." - done"); + + q("DELETE FROM `workerqueue` WHERE `id` = %d", intval($queue["id"])); + } else { + logger("Function ".$funcname." does not exist"); + } + + return true; +} + /** * @brief Checks if the number of database connections has reached a critical limit. * @@ -394,8 +410,7 @@ function poller_passing_slow(&$highest_priority) { $r = q("SELECT `priority` FROM `process` - INNER JOIN `workerqueue` ON `workerqueue`.`pid` = `process`.`pid` - WHERE `process`.`command` = 'poller.php'"); + INNER JOIN `workerqueue` ON `workerqueue`.`pid` = `process`.`pid`"); // No active processes at all? 
Fine if (!dbm::is_result($r)) @@ -435,7 +450,6 @@ function poller_passing_slow(&$highest_priority) { * * @return string SQL statement */ - function poller_worker_process() { q("START TRANSACTION;"); @@ -464,6 +478,47 @@ function poller_worker_process() { return $r; } +function call_worker() { + if (!get_config("system", "frontend_worker")) { + return; + } + + $url = get_app()->get_baseurl()."/worker"; + fetch_url($url, false, $redirects, 1); +} + +function call_worker_if_idle() { + if (!get_config("system", "frontend_worker")) { + return; + } + + poller_run_cron(); + + clear_worker_processes(); + + $workers = q("SELECT COUNT(*) AS `processes` FROM `process` WHERE `command` = 'worker.php'"); + + if ($workers[0]["processes"] == 0) { + call_worker(); + } +} + +function clear_worker_processes() { + q("DELETE FROM `process` WHERE `created` < '%s' AND `command` = 'worker.php'", + dbesc(datetime_convert('UTC','UTC',"now - 10 minutes"))); +} + +function poller_run_cron() { + // Run the cron job that calls all other jobs + proc_run(PRIORITY_MEDIUM, "include/cron.php"); + + // Run the cronhooks job separately from cron for being able to use a different timing + proc_run(PRIORITY_MEDIUM, "include/cronhooks.php"); + + // Cleaning dead processes + poller_kill_stale_workers(); +} + if (array_search(__file__,get_included_files())===0){ poller_run($_SERVER["argv"],$_SERVER["argc"]); diff --git a/index.php b/index.php index 13c3f6318..08f24af60 100644 --- a/index.php +++ b/index.php @@ -99,6 +99,10 @@ if (!$a->is_backend()) { $stamp1 = microtime(true); session_start(); $a->save_timestamp($stamp1, "parser"); +} else { + require_once "include/poller.php"; + + call_worker_if_idle(); } /** diff --git a/mod/worker.php b/mod/worker.php new file mode 100644 index 000000000..1d1ab2af3 --- /dev/null +++ b/mod/worker.php @@ -0,0 +1,38 @@ + Config::get("system", "worker_queues", 4)) { + return; + } + + $a->start_process(); + + logger("Front end worker started: ".getmypid()); + + 
call_worker(); + + if ($r = poller_worker_process()) { + poller_execute($r[0]); + } + + call_worker(); + + $a->end_process(); + + logger("Front end worker ended: ".getmypid()); + + killme(); +} From d71321c834bcb4191fb6e47ade2a00238f0f1044 Mon Sep 17 00:00:00 2001 From: Michael Date: Sun, 27 Nov 2016 01:11:22 +0000 Subject: [PATCH 2/7] Some added documentation --- include/poller.php | 24 ++++++++++++++++++++++++ 1 file changed, 24 insertions(+) diff --git a/include/poller.php b/include/poller.php index b4f5df4bf..f65134023 100644 --- a/include/poller.php +++ b/include/poller.php @@ -311,6 +311,11 @@ function poller_kill_stale_workers() { } } +/** + * @brief Checks if the number of active workers exceeds the given limits + * + * @return bool Are there too many workers running? + */ function poller_too_much_workers() { @@ -389,6 +394,11 @@ function poller_too_much_workers() { return($active >= $queues); } +/** + * @brief Returns the number of active poller processes + * + * @return integer Number of active poller processes + */ function poller_active_workers() { $workers = q("SELECT COUNT(*) AS `processes` FROM `process` WHERE `command` = 'poller.php'"); @@ -478,6 +488,9 @@ function poller_worker_process() { return $r; } +/** + * @brief Call the front end worker + */ function call_worker() { if (!get_config("system", "frontend_worker")) { return; @@ -487,6 +500,9 @@ function call_worker() { fetch_url($url, false, $redirects, 1); } +/** + * @brief Call the front end worker if there aren't any active + */ function call_worker_if_idle() { if (!get_config("system", "frontend_worker")) { return; @@ -503,11 +519,19 @@ function call_worker_if_idle() { } } +/** + * @brief Removes long running worker processes + */ function clear_worker_processes() { + /// @todo the 10 minutes needs to be configurable + /// Additionally we should clean up the corresponding workerqueue entries as well q("DELETE FROM `process` WHERE `created` < '%s' AND `command` = 'worker.php'", 
dbesc(datetime_convert('UTC','UTC',"now - 10 minutes"))); } +/** + * @brief Runs the cron processes + */ function poller_run_cron() { // Run the cron job that calls all other jobs proc_run(PRIORITY_MEDIUM, "include/cron.php"); From 636a0333646b0ca941a3eadaa246002001915303 Mon Sep 17 00:00:00 2001 From: Michael Date: Sun, 27 Nov 2016 09:02:08 +0000 Subject: [PATCH 3/7] Added documentation, config stuff, ... --- doc/htconfig.md | 1 + include/poller.php | 7 ++++--- mod/worker.php | 6 +++++- 3 files changed, 10 insertions(+), 4 deletions(-) diff --git a/doc/htconfig.md b/doc/htconfig.md index 8e0b89092..dbdbf1503 100644 --- a/doc/htconfig.md +++ b/doc/htconfig.md @@ -30,6 +30,7 @@ Example: To set the directory value please add this line to your .htconfig.php: * disable_url_validation (Boolean) - Disables the DNS lookup of an URL. * event_input_format - Default value is "ymd". * frontend_worker (Boolean) - Activates the frontend worker which acts as a replacement for running the poller via the command line. +* frontend_worker_timeout - Time in minutes after which we assume that a frontend task was killed by the webserver. Default value is 10. * ignore_cache (Boolean) - For development only. Disables the item cache. * like_no_comment (Boolean) - Don't update the "commented" value of an item when it is liked. * local_block (Boolean) - Used in conjunction with "block_public". 
diff --git a/include/poller.php b/include/poller.php index f65134023..b8e14a096 100644 --- a/include/poller.php +++ b/include/poller.php @@ -523,10 +523,11 @@ function call_worker_if_idle() { * @brief Removes long running worker processes */ function clear_worker_processes() { - /// @todo the 10 minutes needs to be configurable - /// Additionally we should clean up the corresponding workerqueue entries as well + $timeout = Config::get("system", "frontend_worker_timeout", 10); + + /// @todo We should clean up the corresponding workerqueue entries as well q("DELETE FROM `process` WHERE `created` < '%s' AND `command` = 'worker.php'", - dbesc(datetime_convert('UTC','UTC',"now - 10 minutes"))); + dbesc(datetime_convert('UTC','UTC',"now - ".$timeout." minutes"))); } /** diff --git a/mod/worker.php b/mod/worker.php index 1d1ab2af3..137579966 100644 --- a/mod/worker.php +++ b/mod/worker.php @@ -1,4 +1,8 @@ Date: Sun, 27 Nov 2016 10:01:24 +0000 Subject: [PATCH 4/7] Try to get more execution time --- mod/worker.php | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/mod/worker.php b/mod/worker.php index 137579966..3fb86dd5b 100644 --- a/mod/worker.php +++ b/mod/worker.php @@ -29,6 +29,11 @@ function worker_init($a){ call_worker(); if ($r = poller_worker_process()) { + + // On most configurations this parameter wouldn't have any effect. + // But since it doesn't destroy anything, we just try to get more execution time in any way. + set_time_limit(0); + poller_execute($r[0]); } From 80d221089513ed0301ea5c1cc2241b87d22a0767 Mon Sep 17 00:00:00 2001 From: Michael Date: Sun, 27 Nov 2016 20:57:18 +0000 Subject: [PATCH 5/7] We can now start the poller from a daemon as well. 
--- util/daemon.php | 96 +++++++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 96 insertions(+) create mode 100644 util/daemon.php diff --git a/util/daemon.php b/util/daemon.php new file mode 100644 index 000000000..d1eb70d8b --- /dev/null +++ b/util/daemon.php @@ -0,0 +1,96 @@ +config['php_path'])) { + $php = $a->config['php_path']; +} else { + $php = "php"; +} + +// Switch over to daemon mode. +if ($pid = pcntl_fork()) + return; // Parent + +fclose(STDIN); // Close all of the standard +fclose(STDOUT); // file descriptors as we +fclose(STDERR); // are running as a daemon. + +register_shutdown_function('shutdown'); + +if (posix_setsid() < 0) + return; + +if ($pid = pcntl_fork()) + return; // Parent + +$pid = getmypid(); +file_put_contents($pidfile, $pid); + +// Now running as a daemon. +while (true) { + // Call the poller + $cmdline = $php.' include/poller.php'; + + exec($cmdline); + + // Now sleep for 5 minutes + sleep(300); +} +?> From d96b827e3265edbcd1b5fbf59ca4071438622a1d Mon Sep 17 00:00:00 2001 From: Michael Date: Sun, 27 Nov 2016 22:52:21 +0000 Subject: [PATCH 6/7] Changed documentation --- util/daemon.php | 10 ++++++---- 1 file changed, 6 insertions(+), 4 deletions(-) diff --git a/util/daemon.php b/util/daemon.php index d1eb70d8b..e93306df1 100644 --- a/util/daemon.php +++ b/util/daemon.php @@ -1,8 +1,10 @@ Date: Sun, 27 Nov 2016 23:58:26 +0000 Subject: [PATCH 7/7] Set the time limit of the daemon. --- util/daemon.php | 3 +++ 1 file changed, 3 insertions(+) diff --git a/util/daemon.php b/util/daemon.php index e93306df1..266ddcd75 100644 --- a/util/daemon.php +++ b/util/daemon.php @@ -87,6 +87,9 @@ file_put_contents($pidfile, $pid); // Now running as a daemon. while (true) { + // Just to be sure that this script really runs endlessly + set_time_limit(0); + // Call the poller $cmdline = $php.' include/poller.php';