<?php
/**
 * @copyright Copyright (C) 2010-2022, the Friendica project
 *
 * @license GNU AGPL version 3 or any later version
 *
 * This program is free software: you can redistribute it and/or modify
 * it under the terms of the GNU Affero General Public License as
 * published by the Free Software Foundation, either version 3 of the
 * License, or (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU Affero General Public License for more details.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <https://www.gnu.org/licenses/>.
 *
 */

namespace Friendica\Core;
use Friendica\App\Mode;
use Friendica\Core\Worker\Entity\Process;
use Friendica\Database\DBA;
use Friendica\DI;
use Friendica\Util\DateTimeFormat;
/**
 * Contains the class for the worker background job processing
 */
class Worker
{
/** Worker is in startup. This takes most time. */
const STATE_STARTUP = 1;
/** Worker is processing the whole - long - loop. */
const STATE_LONG_LOOP = 2;
/** Worker had refetched jobs in the execution loop. */
const STATE_REFETCH = 3;
/** Worker is processing preassigned jobs, thus saving much time. */
const STATE_SHORT_LOOP = 4;

const FAST_COMMANDS = ['APDelivery', 'Delivery'];

/** Name of the lock held while new worker processes are fetched */
const LOCK_PROCESS = 'worker_process';
/** Name of the lock held while worker count and memory limits are checked */
const LOCK_WORKER = 'worker';

/** @var float microtime() value marking the start of the current measuring period */
private static $up_start;

/** @var float|int Accumulated time (seconds) spent in database calls during the current measuring period */
private static $db_duration = 0;
/** @var float|int Share of $db_duration spent in counting queries */
private static $db_duration_count = 0;
/** @var float|int Share of $db_duration spent in write queries */
private static $db_duration_write = 0;
/** @var float|int Share of $db_duration spent in statistical queries */
private static $db_duration_stat = 0;
/** @var float|int Accumulated lock time; reported as "lock" in the performance log */
private static $lock_duration = 0;

/** @var int Unix timestamp of the last check of the "executed" field */
private static $last_update;

/** @var int One of the STATE_* constants */
private static $state;

private static $daemon_mode = null;

/** @var Process */
private static $process;
/**
 * Processes the tasks that are in the workerqueue table
 *
 * The method quits early when the system load is too high or when
 * isReady() reports that the system is not ready. Otherwise it keeps
 * fetching and executing queue entries until none are left, a limit is
 * hit, or the process lifetime (one cron interval) is exceeded.
 *
 * @param boolean $run_cron Should the cron processes be executed?
 * @param Process $process  The current running process
 * @return void
 * @throws \Friendica\Network\HTTPException\InternalServerErrorException
 */
public static function processQueue($run_cron, Process $process)
{
    self::$up_start = microtime(true);

    // At first check the maximum load. We shouldn't continue with a high load
    if (DI::system()->isMaxLoadReached()) {
        Logger::notice('Pre check: maximum load reached, quitting.');
        return;
    }

    // We now start the process. This is done after the load check since this could increase the load.
    self::$process = $process;

    // Kill stale processes every 5 minutes
    $cleaned_at = DI::config()->get('system', 'worker_last_cleaned', 0);
    if (time() > ($cleaned_at + 300)) {
        DI::config()->set('system', 'worker_last_cleaned', time());
        self::killStaleWorkers();
    }

    // Check if the system is ready
    if (!self::isReady()) {
        return;
    }

    // Now we start additional cron processes if we should do so
    if ($run_cron) {
        self::runCron();
    }

    $started_at = time();
    $checked_at = $started_at;

    self::$state = self::STATE_STARTUP;

    // We fetch the next queue entry that is about to be executed
    while ($tasks = self::workerProcess()) {
        if (self::IPCJobsExists(getmypid())) {
            self::IPCDeleteJobState(getmypid());
        }

        // Don't refetch when a worker fetches tasks for multiple workers
        $refetched = DI::config()->get('system', 'worker_multiple_fetch');

        foreach ($tasks as $task) {
            $task = self::checkPriority($task);

            // The work will be done
            if (!self::execute($task)) {
                Logger::notice('Process execution failed, quitting.');
                return;
            }

            // Trying to fetch new processes - but only once when successful
            $may_refetch = !$refetched && DI::lock()->acquire(self::LOCK_PROCESS, 0);
            if (!$may_refetch) {
                self::$state = self::STATE_SHORT_LOOP;
                continue;
            }

            self::findWorkerProcesses();
            DI::lock()->release(self::LOCK_PROCESS);
            self::$state = self::STATE_REFETCH;
            $refetched   = true;
        }

        // To avoid the quitting of multiple workers only one worker at a time will execute the check
        if ((time() > $checked_at + 5) && !self::getWaitingJobForPID()) {
            self::$state = self::STATE_LONG_LOOP;

            if (DI::lock()->acquire(self::LOCK_WORKER, 0)) {
                $quit = false;

                if (self::tooMuchWorkers()) {
                    // Count active workers and compare them with a maximum value that depends on the load
                    Logger::notice('Active worker limit reached, quitting.');
                    $quit = true;
                } elseif (DI::system()->isMinMemoryReached()) {
                    // Check free memory
                    Logger::warning('Memory limit reached, quitting.');
                    $quit = true;
                }

                // The lock is released on every path before we possibly leave
                DI::lock()->release(self::LOCK_WORKER);

                if ($quit) {
                    return;
                }
            }

            $checked_at = time();
        }

        // Quit the worker once every cron interval
        $lifetime = DI::config()->get('system', 'cron_interval') * 60;
        if (time() > ($started_at + $lifetime)) {
            Logger::info('Process lifetime reached, respawning.');
            self::unclaimProcess($process);

            if (self::isDaemonMode()) {
                self::IPCSetJobState(true);
            } else {
                self::spawnWorker();
            }
            return;
        }
    }

    // Cleaning up. Possibly not needed, but it doesn't harm anything.
    if (self::isDaemonMode()) {
        self::IPCSetJobState(false);
    }

    Logger::info("Couldn't select a workerqueue entry, quitting process", ['pid' => getmypid()]);
}
/**
 * Check and fix the priority of a worker task
 *
 * The priority is cast to an integer. When it is not one of PRIORITIES,
 * a warning is logged, the stored entry is updated to PRIORITY_MEDIUM and
 * the returned entry carries PRIORITY_MEDIUM as well.
 *
 * @param array $entry Workerqueue entry (needs the fields "id" and "priority")
 * @return array The entry with a sanitized "priority" field
 */
private static function checkPriority(array $entry)
{
    $entry['priority'] = (int)$entry['priority'];

    if (in_array($entry['priority'], PRIORITIES)) {
        return $entry;
    }

    Logger::warning('Invalid priority', ['entry' => $entry, 'callstack' => System::callstack(20)]);
    DBA::update('workerqueue', ['priority' => PRIORITY_MEDIUM], ['id' => $entry['id']]);
    $entry['priority'] = PRIORITY_MEDIUM;

    return $entry;
}
/**
 * Checks if the system is ready.
 *
 * Several system parameters like memory, connections and processes are checked.
 * The checks run in a fixed order and stop at the first one that fails;
 * each failure is logged.
 *
 * @return boolean "true" when none of the limits is reached
 */
public static function isReady()
{
    if (self::tooMuchWorkers()) {
        // Count active workers and compare them with a maximum value that depends on the load
        Logger::notice('Active worker limit reached, quitting.');
        $ready = false;
    } elseif (DI::system()->isMinMemoryReached()) {
        // Do we have too few memory?
        Logger::warning('Memory limit reached, quitting.');
        $ready = false;
    } elseif (self::maxConnectionsReached()) {
        // Possibly there are too much database connections
        Logger::warning('Maximum connections reached, quitting.');
        $ready = false;
    } elseif (DI::system()->isMaxProcessesReached()) {
        // Possibly there are too much database processes that block the system
        Logger::warning('Maximum processes reached, quitting.');
        $ready = false;
    } else {
        $ready = true;
    }

    return $ready;
}
/**
 * Check if non executed tasks do exist in the worker queue
 *
 * Only entries that are not done, not assigned to a process (pid = 0)
 * and whose "next_try" lies in the past are considered. The query time
 * is added to the database duration statistics.
 *
 * @return boolean Returns "true" if tasks are existing
 * @throws \Exception
 */
public static function entriesExists()
{
    $started = (float)microtime(true);

    $condition = ["NOT `done` AND `pid` = 0 AND `next_try` < ?", DateTimeFormat::utcNow()];
    $found     = DBA::exists('workerqueue', $condition);

    self::$db_duration += (microtime(true) - $started);

    return $found;
}
/**
 * Returns the number of deferred entries in the worker queue
 *
 * Deferred means: not done, not assigned to a process (pid = 0) and
 * with a "retrial" value above zero. The query time is added to the
 * total and to the "count" database duration statistics.
 *
 * @return integer Number of deferred entries in the worker queue
 * @throws \Exception
 */
private static function deferredEntries()
{
    $started = (float)microtime(true);

    $condition = ["NOT `done` AND `pid` = 0 AND `retrial` > ?", 0];
    $deferred  = DBA::count('workerqueue', $condition);

    self::$db_duration       += (microtime(true) - $started);
    self::$db_duration_count += (microtime(true) - $started);

    return $deferred;
}
/**
 * Returns the number of non executed entries in the worker queue
 *
 * Counts all entries that are not done and not assigned to a process
 * (pid = 0). The query time is added to the total and to the "count"
 * database duration statistics.
 *
 * @return integer Number of non executed entries in the worker queue
 * @throws \Exception
 */
private static function totalEntries()
{
    $started = (float)microtime(true);

    $waiting = DBA::count('workerqueue', ['done' => false, 'pid' => 0]);

    self::$db_duration       += (microtime(true) - $started);
    self::$db_duration_count += (microtime(true) - $started);

    return $waiting;
}
/**
 * Returns the highest priority in the worker queue that isn't executed
 *
 * Looks at entries that are not done, not assigned to a process (pid = 0)
 * and whose "next_try" lies in the past, ordered by "priority".
 *
 * @return integer The "priority" of the first matching entry, or 0 when no entry matches
 * @throws \Exception
 */
private static function highestPriority()
{
    $started = (float)microtime(true);

    $condition = ["`pid` = 0 AND NOT `done` AND `next_try` < ?", DateTimeFormat::utcNow()];
    $first     = DBA::selectFirst('workerqueue', ['priority'], $condition, ['order' => ['priority']]);

    self::$db_duration += (microtime(true) - $started);

    return DBA::isResult($first) ? $first['priority'] : 0;
}
/**
 * Returns if a process with the given priority is running
 *
 * An entry counts as running when it is assigned to a process (pid != 0),
 * is not done and its priority value is less than or equal to the given one.
 *
 * @param integer $priority The priority that should be checked
 *
 * @return boolean Is there a process running with that priority?
 * @throws \Exception
 */
private static function processWithPriorityActive($priority)
{
    return DBA::exists(
        'workerqueue',
        ["`priority` <= ? AND `pid` != 0 AND NOT `done`", $priority]
    );
}
/**
 * Checks if the given file is valid to be included
 *
 * The path is resolved with realpath() and must be located below the
 * current working directory. After stripping the working directory the
 * result has to be identical to the value that was passed in, and it has
 * to start with "include/" or "addon/".
 *
 * Note: $file is passed by reference and is overwritten during the check
 * (with the resolved and then the relative path).
 *
 * @param mixed $file Path relative to the working directory
 * @return bool
 */
private static function validateInclude(&$file)
{
    $requested = $file;

    $file = realpath($file);

    // The resolved path has to start with the working directory
    if (strpos($file, getcwd()) !== 0) {
        return false;
    }

    // The working directory has to occur exactly once in the path
    $file = str_replace(getcwd() . "/", "", $file, $replaced);
    if ($replaced != 1) {
        return false;
    }

    // Resolving must not have changed the path
    if ($requested !== $file) {
        return false;
    }

    // Only files from these two folders may be included
    return (strpos($file, "include/") === 0) || (strpos($file, "addon/") === 0);
}
/**
 * Execute a worker entry
 *
 * The entry is executed either as a class method (Friendica\Worker\<command>::execute)
 * or - as fallback - as a function "<name>_run" from a file in "include/" or "addon/".
 * Entries with an invalid include file or a missing function are deleted from the queue.
 *
 * @param array $queue Workerqueue entry
 *
 * @return boolean "false" if further processing should be stopped (maintenance mode,
 *                 process or connection limit reached, empty parameter), "true" otherwise
 * @throws \Friendica\Network\HTTPException\InternalServerErrorException
 */
public static function execute($queue)
{
    $mypid = getmypid();

    // Quit when in maintenance
    if (DI::config()->get('system', 'maintenance', false, true)) {
        Logger::notice("Maintenance mode - quit process", ['pid' => $mypid]);
        return false;
    }

    // Constantly check the number of parallel database processes
    if (DI::system()->isMaxProcessesReached()) {
        Logger::warning("Max processes reached for process", ['pid' => $mypid]);
        return false;
    }

    // Constantly check the number of available database connections to let the frontend be accessible at any time
    if (self::maxConnectionsReached()) {
        Logger::warning("Max connection reached for process", ['pid' => $mypid]);
        return false;
    }

    $argv = json_decode($queue['parameter'], true);
    if (!is_array($argv)) {
        $argv = [];
    }

    if (!empty($queue['command'])) {
        array_unshift($argv, $queue['command']);
    }

    if (empty($argv)) {
        Logger::warning('Parameter is empty', ['queue' => $queue]);
        return false;
    }

    // Check for existance and validity of the include file
    $include = $argv[0];

    if (method_exists(sprintf('Friendica\Worker\%s', $include), 'execute')) {
        // We constantly update the "executed" date every minute to avoid being killed too soon
        if (!isset(self::$last_update)) {
            self::$last_update = strtotime($queue["executed"]);
        }

        $age = (time() - self::$last_update) / 60;
        self::$last_update = time();

        if ($age > 1) {
            $stamp = (float)microtime(true);
            DBA::update('workerqueue', ['executed' => DateTimeFormat::utcNow()], ['pid' => $mypid, 'done' => false]);
            self::$db_duration += (microtime(true) - $stamp);
            self::$db_duration_write += (microtime(true) - $stamp);
        }

        array_shift($argv);

        self::execFunction($queue, $include, $argv, true);

        $stamp = (float)microtime(true);
        // Entries whose "next_try" lies in the future are not marked as done
        $condition = ["`id` = ? AND `next_try` < ?", $queue['id'], DateTimeFormat::utcNow()];
        if (DBA::update('workerqueue', ['done' => true], $condition)) {
            DI::config()->set('system', 'last_worker_execution', DateTimeFormat::utcNow());
        }
        // Accumulate (not overwrite) so that the duration statistics stay consistent
        self::$db_duration += (microtime(true) - $stamp);
        self::$db_duration_write += (microtime(true) - $stamp);

        return true;
    }

    // The script could be provided as full path or only with the function name
    if ($include == basename($include)) {
        $include = "include/".$include.".php";
    }

    if (!self::validateInclude($include)) {
        Logger::warning("Include file is not valid", ['file' => $argv[0]]);
        $stamp = (float)microtime(true);
        DBA::delete('workerqueue', ['id' => $queue["id"]]);
        self::$db_duration += (microtime(true) - $stamp);
        self::$db_duration_write += (microtime(true) - $stamp);
        return true;
    }

    require_once $include;

    $funcname = str_replace(".php", "", basename($argv[0]))."_run";

    if (function_exists($funcname)) {
        // We constantly update the "executed" date every minute to avoid being killed too soon
        if (!isset(self::$last_update)) {
            self::$last_update = strtotime($queue["executed"]);
        }

        $age = (time() - self::$last_update) / 60;
        self::$last_update = time();

        if ($age > 1) {
            $stamp = (float)microtime(true);
            DBA::update('workerqueue', ['executed' => DateTimeFormat::utcNow()], ['pid' => $mypid, 'done' => false]);
            self::$db_duration += (microtime(true) - $stamp);
            self::$db_duration_write += (microtime(true) - $stamp);
        }

        self::execFunction($queue, $funcname, $argv, false);

        $stamp = (float)microtime(true);
        if (DBA::update('workerqueue', ['done' => true], ['id' => $queue["id"]])) {
            DI::config()->set('system', 'last_worker_execution', DateTimeFormat::utcNow());
        }
        self::$db_duration += (microtime(true) - $stamp);
        self::$db_duration_write += (microtime(true) - $stamp);
    } else {
        Logger::warning("Function does not exist", ['function' => $funcname]);
        $stamp = (float)microtime(true);
        DBA::delete('workerqueue', ['id' => $queue["id"]]);
        self::$db_duration += (microtime(true) - $stamp);
        self::$db_duration_write += (microtime(true) - $stamp);
    }

    return true;
}
/**
 * Execute a function from the queue
 *
 * Runs the task, logs a performance summary of the time since the last
 * measurement and resets the duration counters afterwards. When the config
 * value "worker_cooldown" is above zero, the process sleeps that many
 * seconds before and after the execution.
 *
 * @param array   $queue       Workerqueue entry
 * @param string  $funcname    name of the function
 * @param array   $argv        Array of values to be passed to the function
 * @param boolean $method_call "true": call Friendica\Worker\<funcname>::execute,
 *                             "false": call the plain function <funcname>
 * @return void
 * @throws \Friendica\Network\HTTPException\InternalServerErrorException
 */
private static function execFunction($queue, $funcname, $argv, $method_call)
{
    $a = DI::app();

    $cooldown = DI::config()->get("system", "worker_cooldown", 0);
    if ($cooldown > 0) {
        Logger::info('Pre execution cooldown.', ['priority' => $queue['priority'], 'id' => $queue["id"], 'cooldown' => $cooldown]);
        sleep($cooldown);
    }

    Logger::enableWorker($funcname);

    Logger::info("Process start.", ['priority' => $queue['priority'], 'id' => $queue["id"]]);

    $exec_start = (float)microtime(true);

    // We use the callstack here to analyze the performance of executed worker entries.
    // For this reason the variables have to be initialized.
    DI::profiler()->reset();

    $a->setQueue($queue);

    // Time that has passed since the last measurement was finished
    $up_duration = microtime(true) - self::$up_start;

    // Reset global data to avoid interferences
    unset($_SESSION);

    if ($method_call) {
        call_user_func_array(sprintf('Friendica\Worker\%s::execute', $funcname), $argv);
    } else {
        $funcname($argv, count($argv));
    }

    Logger::disableWorker();

    $a->setQueue([]);

    $duration = (microtime(true) - $exec_start);

    /* With these values we can analyze how effective the worker is.
     * The database and rest time should be low since this is the unproductive time.
     * The execution time is the productive time.
     * By changing parameters like the maximum number of workers we can check the effectivness.
     */
    $performance = [
        'state' => self::$state,
        'count' => round(self::$db_duration_count, 2),
        'stat'  => round(self::$db_duration_stat, 2),
        'write' => round(self::$db_duration_write, 2),
        'lock'  => round(self::$lock_duration, 2),
        'total' => round(self::$db_duration, 2),
        'rest'  => round(max(0, $up_duration - (self::$db_duration + self::$lock_duration)), 2),
        'exec'  => round($duration, 2),
    ];

    Logger::info('Performance:', $performance);

    // Start a new measuring period
    self::$up_start          = microtime(true);
    self::$db_duration       = 0;
    self::$db_duration_count = 0;
    self::$db_duration_stat  = 0;
    self::$db_duration_write = 0;
    self::$lock_duration     = 0;

    // Only the notice for the largest exceeded threshold (in seconds) is logged
    $slow_notices = [
        3600 => 'Longer than 1 hour.',
        600  => 'Longer than 10 minutes.',
        300  => 'Longer than 5 minutes.',
        120  => 'Longer than 2 minutes.',
    ];

    foreach ($slow_notices as $threshold => $notice) {
        if ($duration > $threshold) {
            Logger::info($notice, ['priority' => $queue['priority'], 'id' => $queue["id"], 'duration' => round($duration/60, 3)]);
            break;
        }
    }

    Logger::info('Process done.', ['priority' => $queue['priority'], 'id' => $queue["id"], 'duration' => round($duration, 3)]);

    DI::profiler()->saveLog(DI::logger(), "ID " . $queue["id"] . ": " . $funcname);

    if ($cooldown > 0) {
        Logger::info('Post execution cooldown.', ['priority' => $queue['priority'], 'id' => $queue["id"], 'cooldown' => $cooldown]);
        sleep($cooldown);
    }
}
/**
 * Checks if the number of database connections has reached a critical limit.
 *
 * Two limits are checked one after another:
 * - the per user limit (config "system.max_connections", or - when that is not set -
 *   the server variable "max_user_connections" / a granted MAX_USER_CONNECTIONS)
 *   against the number of rows of the processlist,
 * - the server wide "max_connections" against "Threads_connected".
 *
 * The critical level is the percentage from the config value
 * "system.max_connections_level" (default: 75).
 *
 * @return bool Is the configured percentage of the maximum connections reached?
 * @throws \Friendica\Network\HTTPException\InternalServerErrorException
 */
private static function maxConnectionsReached()
{
    // Fetch the max value from the config. This is needed when the system cannot detect the correct value by itself.
    // The value is cast so that unset, empty or non numeric values are reliably treated as "not set".
    $max = (int)DI::config()->get("system", "max_connections");

    // Fetch the percentage level where the worker will get active
    $maxlevel = DI::config()->get("system", "max_connections_level", 75);

    if ($max == 0) {
        // the maximum number of possible user connections can be a system variable
        $r = DBA::fetchFirst("SHOW VARIABLES WHERE `variable_name` = 'max_user_connections'");
        if (DBA::isResult($r)) {
            $max = (int)$r["Value"];
        }

        // Or it can be granted. This overrides the system variable
        $stamp = (float)microtime(true);
        $r = DBA::p('SHOW GRANTS');
        self::$db_duration += (microtime(true) - $stamp);
        while ($grants = DBA::fetch($r)) {
            $grant = array_pop($grants);
            if (stristr($grant, "GRANT USAGE ON")) {
                // At least one digit is required, an empty match must not overwrite the value
                if (preg_match("/WITH MAX_USER_CONNECTIONS (\d+)/", $grant, $match)) {
                    $max = (int)$match[1];
                }
            }
        }
        DBA::close($r);
    }

    // If $max is set we will use the processlist to determine the current number of connections
    // The processlist only shows entries of the current user
    if ($max != 0) {
        $stamp = (float)microtime(true);
        $r = DBA::p('SHOW PROCESSLIST');
        self::$db_duration += (microtime(true) - $stamp);
        $used = DBA::numRows($r);
        DBA::close($r);

        Logger::info("Connection usage (user values)", ['usage' => $used, 'max' => $max]);

        $level = ($used / $max) * 100;

        if ($level >= $maxlevel) {
            Logger::warning("Maximum level (".$maxlevel."%) of user connections reached: ".$used."/".$max);
            return true;
        }
    }

    // We will now check for the system values.
    // This limit could be reached although the user limits are fine.
    $r = DBA::fetchFirst("SHOW VARIABLES WHERE `variable_name` = 'max_connections'");
    if (!DBA::isResult($r)) {
        return false;
    }

    $max = intval($r["Value"]);
    if ($max == 0) {
        return false;
    }

    $r = DBA::fetchFirst("SHOW STATUS WHERE `variable_name` = 'Threads_connected'");
    if (!DBA::isResult($r)) {
        return false;
    }

    $used = intval($r["Value"]);
    if ($used == 0) {
        return false;
    }

    Logger::info("Connection usage (system values)", ['used' => $used, 'max' => $max]);

    $level = $used / $max * 100;

    if ($level < $maxlevel) {
        return false;
    }

    Logger::warning("Maximum level (".$level."%) of system connections reached: ".$used."/".$max);
    return true;
}
/**
 * fix the queue entry if the worker process died
 *
 * Walks through all unfinished entries that are assigned to a process:
 * - When the process doesn't exist anymore, the entry is released (pid = 0).
 * - When the process runs longer than the maximum duration of its priority,
 *   it gets a SIGTERM and the entry is rescheduled with a lowered priority.
 *
 * @return void
 * @throws \Exception
 */
private static function killStaleWorkers()
{
    // Maximum durations in minutes, depending on the priority
    $max_duration_defaults = [PRIORITY_CRITICAL => 720, PRIORITY_HIGH => 10, PRIORITY_MEDIUM => 60, PRIORITY_LOW => 180, PRIORITY_NEGLIGIBLE => 720];

    $stamp = (float)microtime(true);
    $entries = DBA::select(
        'workerqueue',
        ['id', 'pid', 'executed', 'priority', 'command', 'parameter'],
        ['NOT `done` AND `pid` != 0'],
        ['order' => ['priority', 'retrial', 'created']]
    );
    self::$db_duration += (microtime(true) - $stamp);

    while ($entry = DBA::fetch($entries)) {
        $entry = self::checkPriority($entry);

        // Signal 0 only tests whether the process can be signalled
        if (!posix_kill($entry["pid"], 0)) {
            $stamp = (float)microtime(true);
            DBA::update(
                'workerqueue',
                ['executed' => DBA::NULL_DATETIME, 'pid' => 0],
                ['id' => $entry["id"]]
            );
            self::$db_duration += (microtime(true) - $stamp);
            self::$db_duration_write += (microtime(true) - $stamp);
            continue;
        }

        // Kill long running processes
        $max_duration = $max_duration_defaults[$entry['priority']];

        $argv = json_decode($entry['parameter'], true);
        if (!empty($entry['command'])) {
            $command = $entry['command'];
        } elseif (!empty($argv)) {
            $command = array_shift($argv);
        } else {
            // An entry without a command must not stop the check of the remaining entries
            // and must not skip the closing of the result set.
            continue;
        }

        $command = basename($command);

        // How long is the process already running?
        $duration = (time() - strtotime($entry["executed"])) / 60;
        if ($duration > $max_duration) {
            Logger::notice('Worker process took too much time - killed', ['duration' => number_format($duration, 3), 'max' => $max_duration, 'id' => $entry["id"], 'pid' => $entry["pid"], 'command' => $command]);
            posix_kill($entry["pid"], SIGTERM);

            // We killed the stale process.
            // To avoid a blocking situation we reschedule the process at the beginning of the queue.
            // Additionally we are lowering the priority. (But not PRIORITY_CRITICAL)
            $new_priority = $entry['priority'];
            if ($entry['priority'] == PRIORITY_HIGH) {
                $new_priority = PRIORITY_MEDIUM;
            } elseif ($entry['priority'] == PRIORITY_MEDIUM) {
                $new_priority = PRIORITY_LOW;
            } elseif ($entry['priority'] != PRIORITY_CRITICAL) {
                $new_priority = PRIORITY_NEGLIGIBLE;
            }

            $stamp = (float)microtime(true);
            DBA::update(
                'workerqueue',
                ['executed' => DBA::NULL_DATETIME, 'created' => DateTimeFormat::utcNow(), 'priority' => $new_priority, 'pid' => 0],
                ['id' => $entry["id"]]
            );
            self::$db_duration += (microtime(true) - $stamp);
            self::$db_duration_write += (microtime(true) - $stamp);
        } else {
            Logger::info('Process runtime is okay', ['duration' => number_format($duration, 3), 'max' => $max_duration, 'id' => $entry["id"], 'pid' => $entry["pid"], 'command' => $command]);
        }
    }
    DBA::close($entries);
}
/**
 * Checks if the number of active workers exceeds the given limits
 *
 * The allowed number of workers starts with the config value
 * "system.worker_queues" and is decreased depending on the system load.
 * When a load value is available, the method also logs a status line and
 * may request an additional worker (by spawning it or - in daemon mode -
 * by setting the IPC job state) when fewer workers are running than allowed.
 *
 * @return bool Are there too much workers running?
 * @throws \Friendica\Network\HTTPException\InternalServerErrorException
 */
private static function tooMuchWorkers()
{
    $queues = DI::config()->get("system", "worker_queues", 10);

    $maxqueues = $queues;

    $active = self::activeWorkers();

    // Decrease the number of workers at higher load
    $load = System::currentLoad();
    if ($load) {
        $maxsysload = intval(DI::config()->get("system", "maxloadavg", 20));

        /* Default exponent 3 causes queues to rapidly decrease as load increases.
         * If you have 20 max queues at idle, then you get only 5 queues at 37.1% of $maxsysload.
         * For some environments, this rapid decrease is not needed.
         * With exponent 1, you could have 20 max queues at idle and 13 at 37% of $maxsysload.
         */
        $exponent = intval(DI::config()->get('system', 'worker_load_exponent', 3));
        $slope = pow(max(0, $maxsysload - $load) / $maxsysload, $exponent);
        $queues = intval(ceil($slope * $maxqueues));

        $processlist = '';

        if (DI::config()->get('system', 'worker_jpm')) {
            $intervals = explode(',', DI::config()->get('system', 'worker_jpm_range'));
            $jobs_per_minute = [];
            foreach ($intervals as $interval) {
                // Cast before the check: a non numeric or empty value must never
                // end up as a zero divisor in the calculation below.
                $interval = (int)$interval;
                if ($interval <= 0) {
                    continue;
                }

                $stamp = (float)microtime(true);
                $jobs = DBA::count('workerqueue', ["`done` AND `executed` > ?", DateTimeFormat::utc('now - ' . $interval . ' minute')]);
                self::$db_duration += (microtime(true) - $stamp);
                self::$db_duration_stat += (microtime(true) - $stamp);
                $jobs_per_minute[$interval] = number_format($jobs / $interval, 0);
            }
            $processlist = ' - jpm: '.implode('/', $jobs_per_minute);
        }

        // Create a list of queue entries grouped by their priority
        $listitem = [0 => ''];

        $idle_workers = $active;

        $deferred = self::deferredEntries();

        if (DI::config()->get('system', 'worker_debug')) {
            $waiting_processes = 0;
            // Now adding all processes with workerqueue entries
            $stamp = (float)microtime(true);
            $jobs = DBA::p("SELECT COUNT(*) AS `entries`, `priority` FROM `workerqueue` WHERE NOT `done` GROUP BY `priority`");
            self::$db_duration += (microtime(true) - $stamp);
            self::$db_duration_stat += (microtime(true) - $stamp);
            while ($entry = DBA::fetch($jobs)) {
                $stamp = (float)microtime(true);
                $running = DBA::count('workerqueue-view', ['priority' => $entry['priority']]);
                self::$db_duration += (microtime(true) - $stamp);
                self::$db_duration_stat += (microtime(true) - $stamp);
                $idle_workers -= $running;
                $waiting_processes += $entry["entries"];
                $listitem[$entry['priority']] = $entry['priority'] . ":" . $running . "/" . $entry["entries"];
            }
            DBA::close($jobs);
        } else {
            $waiting_processes = self::totalEntries();
            $stamp = (float)microtime(true);
            $jobs = DBA::p("SELECT COUNT(*) AS `running`, `priority` FROM `workerqueue-view` GROUP BY `priority` ORDER BY `priority`");
            self::$db_duration += (microtime(true) - $stamp);
            self::$db_duration_stat += (microtime(true) - $stamp);

            while ($entry = DBA::fetch($jobs)) {
                $idle_workers -= $entry["running"];
                $listitem[$entry['priority']] = $entry['priority'].":".$entry["running"];
            }
            DBA::close($jobs);
        }

        $waiting_processes -= $deferred;

        $listitem[0] = "0:" . max(0, $idle_workers);

        $processlist .= ' ('.implode(', ', $listitem).')';

        if (DI::config()->get("system", "worker_fastlane", false) && ($queues > 0) && ($active >= $queues) && self::entriesExists()) {
            $top_priority = self::highestPriority();
            $high_running = self::processWithPriorityActive($top_priority);

            if (!$high_running && ($top_priority > PRIORITY_UNDEFINED) && ($top_priority < PRIORITY_NEGLIGIBLE)) {
                Logger::info("Jobs with a higher priority are waiting but none is executed. Open a fastlane.", ['priority' => $top_priority]);
                $queues = $active + 1;
            }
        }

        Logger::notice("Load: " . $load ."/" . $maxsysload . " - processes: " . $deferred . "/" . $active . "/" . $waiting_processes . $processlist . " - maximum: " . $queues . "/" . $maxqueues);

        // Are there fewer workers running as possible? Then fork a new one.
        if (!DI::config()->get("system", "worker_dont_fork", false) && ($queues > ($active + 1)) && self::entriesExists()) {
            Logger::info("There are fewer workers as possible, fork a new worker.", ['active' => $active, 'queues' => $queues]);
            if (self::isDaemonMode()) {
                self::IPCSetJobState(true);
            } else {
                self::spawnWorker();
            }
        }
    }

    // if there are too much worker, we don't spawn a new one.
    if (self::isDaemonMode() && ($active > $queues)) {
        self::IPCSetJobState(false);
    }

    return $active > $queues;
}
/**
 * Returns the number of active worker processes
 *
 * The value is the count of processes with the command "Worker.php".
 * The time needed is added to the total and to the "count" database
 * duration statistics.
 *
 * @return integer Number of active worker processes
 * @throws \Exception
 */
private static function activeWorkers()
{
    $started = (float)microtime(true);

    $workers = DI::process()->countCommand('Worker.php');

    self::$db_duration       += (microtime(true) - $started);
    self::$db_duration_count += (microtime(true) - $started);

    return $workers;
}
/**
 * Returns the known process ids together with their number of unfinished queue entries
 *
 * Every row of the `process` table is listed; processes without any
 * assigned, not yet done `workerqueue` entry are reported with a count of 0.
 *
 * @return array Map of process id => number of assigned workerqueue entries that are not done
 * @throws \Exception
 */
private static function getWorkerPIDList()
{
	$list = [];

	$started = (float)microtime(true);

	$rows = DBA::p("SELECT `process`.`pid`, COUNT(`workerqueue`.`pid`) AS `entries` FROM `process`
		LEFT JOIN `workerqueue` ON `workerqueue`.`pid` = `process`.`pid` AND NOT `workerqueue`.`done`
		GROUP BY `process`.`pid`");
	while ($row = DBA::fetch($rows)) {
		$list[$row['pid']] = $row['entries'];
	}
	DBA::close($rows);

	// The lookup is accounted in both the general and the "count" duration
	self::$db_duration       += (microtime(true) - $started);
	self::$db_duration_count += (microtime(true) - $started);

	return $list;
}
2019-02-17 19:20:24 +00:00
/**
 * Returns waiting jobs for the current process id
 *
 * Selects all workerqueue entries that are assigned to the pid of the
 * running PHP process and that are not marked as done.
 *
 * @return array|false waiting workerqueue jobs, false when the query yields no result
 * @throws \Exception
 */
private static function getWaitingJobForPID()
{
	$started = (float)microtime(true);
	$jobs    = DBA::select('workerqueue', [], ['pid' => getmypid(), 'done' => false]);
	self::$db_duration += (microtime(true) - $started);

	if (!DBA::isResult($jobs)) {
		DBA::close($jobs);
		return false;
	}

	return DBA::toArray($jobs);
}
2019-02-17 19:20:24 +00:00
/**
 * Returns the next jobs that should be executed
 *
 * The priority is chosen by nextPriority(). Unclaimed, due tasks of that
 * priority are then collected - ordered by retrial and creation date - until
 * either the limit is reached or a task is found whose command is not part
 * of FAST_COMMANDS. That slower task is still included in the result.
 *
 * @param int $limit Maximum number of tasks to fetch
 * @return array array with the ids of the next jobs
 * @throws \Exception
 */
private static function nextProcess(int $limit)
{
	$priority = self::nextPriority();
	if (empty($priority)) {
		Logger::info('No tasks found');
		return [];
	}

	$ids = [];
	$stamp = (float)microtime(true);
	$condition = ["`priority` = ? AND `pid` = 0 AND NOT `done` AND `next_try` < ?", $priority, DateTimeFormat::utcNow()];
	$tasks = DBA::select('workerqueue', ['id', 'command', 'parameter'], $condition, ['limit' => $limit, 'order' => ['retrial', 'created']]);
	self::$db_duration += (microtime(true) - $stamp);

	while ($task = DBA::fetch($tasks)) {
		$ids[] = $task['id'];

		// Only continue that loop while we are storing commands that can be processed quickly
		if (!empty($task['command'])) {
			$command = $task['command'];
		} else {
			// Without a command column value the command is the first element of the
			// JSON encoded parameter list. A missing, empty or malformed value must
			// neither raise warnings nor abort the worker - it is simply "not fast".
			$parameters = json_decode((string)($task['parameter'] ?? ''), true);
			$command    = is_array($parameters) ? ($parameters[0] ?? '') : '';
		}

		// Strict comparison: a non-string value must never match a command name
		if (!in_array($command, self::FAST_COMMANDS, true)) {
			break;
		}
	}
	DBA::close($tasks);

	Logger::info('Found:', ['priority' => $priority, 'id' => $ids]);
	return $ids;
}
2019-02-17 19:20:24 +00:00
/**
 * Returns the priority of the next workerqueue job
 *
 * Selection order:
 * 1. PRIORITY_CRITICAL, whenever such a task is waiting.
 * 2. The first priority that has waiting tasks but no running worker.
 * 3. The first running priority that uses fewer workers than its share.
 *    The shares are distributed quadratically over the active workers.
 * 4. The first priority that has waiting tasks at all.
 *
 * @return mixed the selected priority, false when no task is waiting
 * @throws \Exception
 */
private static function nextPriority()
{
	$levels  = [PRIORITY_CRITICAL, PRIORITY_HIGH, PRIORITY_MEDIUM, PRIORITY_LOW, PRIORITY_NEGLIGIBLE];
	$waiting = [];

	// Detect the priorities that have unclaimed tasks which are due
	foreach ($levels as $level) {
		$started = (float)microtime(true);
		if (DBA::exists('workerqueue', ["`priority` = ? AND `pid` = 0 AND NOT `done` AND `next_try` < ?", $level, DateTimeFormat::utcNow()])) {
			$waiting[$level] = true;
		}
		self::$db_duration += (microtime(true) - $started);
	}

	if (!empty($waiting[PRIORITY_CRITICAL])) {
		return PRIORITY_CRITICAL;
	}

	$running       = [];
	$running_total = 0;

	$started = (float)microtime(true);
	$result  = DBA::p("SELECT COUNT(DISTINCT(`pid`)) AS `running`, `priority` FROM `workerqueue-view` GROUP BY `priority`");
	self::$db_duration += (microtime(true) - $started);

	while ($row = DBA::fetch($result)) {
		$running[$row['priority']] = $row['running'];
		$running_total += $row['running'];
	}
	DBA::close($result);

	// A waiting priority without any running worker is served first
	foreach ($levels as $level) {
		if (empty($waiting[$level]) || !empty($running[$level])) {
			continue;
		}

		Logger::info('No running worker found with priority {priority} - assigning it.', ['priority' => $level]);
		return $level;
	}

	$active = max(self::activeWorkers(), $running_total);
	$slots  = max(count($waiting), count($running));

	$exponent = 2;

	// Sum of all weights (1^2 + 2^2 + ... + slots^2)
	$weights = 0;
	for ($rank = 1; $rank <= $slots; ++$rank) {
		$weights += $rank ** $exponent;
	}

	// Slot 0 receives the biggest share, the last slot the smallest one - but never less than 1
	$limit = [];
	for ($slot = 0; $slot < $slots; ++$slot) {
		$limit[$slot] = max(1, round($active * ((($slots - $slot) ** $exponent) / $weights)));
	}

	$slot = 0;
	foreach ($running as $level => $workers) {
		$allowed = $limit[$slot];
		++$slot;

		if ($workers < $allowed) {
			Logger::info('Priority {priority} has got {workers} workers out of a limit of {limit}', ['priority' => $level, 'workers' => $workers, 'limit' => $allowed]);
			return $level;
		}
	}

	if (empty($waiting)) {
		return false;
	}

	// Fall back to the first priority that has been detected as waiting
	reset($waiting);
	$level = key($waiting);

	Logger::info('No underassigned priority found, now taking the highest priority.', ['priority' => $level]);
	return $level;
}
/**
 * Find and claim the next worker process for us
 *
 * With "worker_multiple_fetch" enabled, tasks are fetched for every known
 * process that has at most "worker_fetch_limit" unfinished entries assigned,
 * otherwise only for the current process. The tasks are first taken from the
 * priority selected by nextProcess(); when this doesn't fill the limit, the
 * remaining slots are filled regardless of the priority. The found task ids
 * are distributed over the process ids and written to the workerqueue.
 *
 * @return void
 * @throws \Friendica\Network\HTTPException\InternalServerErrorException
 */
private static function findWorkerProcesses()
{
	$fetch_limit = DI::config()->get('system', 'worker_fetch_limit', 1);

	if (DI::config()->get('system', 'worker_multiple_fetch')) {
		$pids = [];
		foreach (self::getWorkerPIDList() as $pid => $count) {
			if ($count <= $fetch_limit) {
				$pids[] = $pid;
			}
		}
		if (empty($pids)) {
			return;
		}
		$limit = $fetch_limit * count($pids);
	} else {
		$pids = [getmypid()];
		$limit = $fetch_limit;
	}

	$ids = self::nextProcess($limit);
	$limit -= count($ids);

	// If there is not enough results we check without priority limit
	if ($limit > 0) {
		$stamp = (float)microtime(true);
		$condition = ["`pid` = 0 AND NOT `done` AND `next_try` < ?", DateTimeFormat::utcNow()];
		$tasks = DBA::select('workerqueue', ['id', 'command', 'parameter'], $condition, ['limit' => $limit, 'order' => ['priority', 'retrial', 'created']]);
		self::$db_duration += (microtime(true) - $stamp);

		while ($task = DBA::fetch($tasks)) {
			$ids[] = $task['id'];

			// Only continue that loop while we are storing commands that can be processed quickly
			if (!empty($task['command'])) {
				$command = $task['command'];
			} else {
				// Without a command column value the command is the first element of the
				// JSON encoded parameter list. A missing, empty or malformed value must
				// neither raise warnings nor abort the worker - it is simply "not fast".
				$parameters = json_decode((string)($task['parameter'] ?? ''), true);
				$command    = is_array($parameters) ? ($parameters[0] ?? '') : '';
			}

			// Strict comparison: a non-string value must never match a command name
			if (!in_array($command, self::FAST_COMMANDS, true)) {
				break;
			}
		}
		DBA::close($tasks);
	}

	if (empty($ids)) {
		return;
	}

	// Assign the task ids to the workers
	$worker = [];
	foreach (array_unique($ids) as $id) {
		// Walk through the pid list and start over when its end is reached
		$pid = next($pids);
		if (!$pid) {
			$pid = reset($pids);
		}
		$worker[$pid][] = $id;
	}

	$stamp = (float)microtime(true);
	foreach ($worker as $worker_pid => $worker_ids) {
		Logger::info('Set queue entry', ['pid' => $worker_pid, 'ids' => $worker_ids]);
		// The condition "pid = 0" ensures that only still unclaimed entries are taken
		DBA::update('workerqueue', ['executed' => DateTimeFormat::utcNow(), 'pid' => $worker_pid],
			['id' => $worker_ids, 'done' => false, 'pid' => 0]);
	}
	self::$db_duration += (microtime(true) - $stamp);
	self::$db_duration_write += (microtime(true) - $stamp);
}
/**
 * Returns the next worker process
 *
 * Jobs that are already assigned to the current process are returned
 * directly. Otherwise new jobs are claimed while holding the process lock.
 *
 * @return array|false worker processes, false when the lock couldn't be acquired or no job is waiting
 * @throws \Friendica\Network\HTTPException\InternalServerErrorException
 */
public static function workerProcess()
{
	// There can already be jobs for us in the queue.
	$waiting = self::getWaitingJobForPID();
	if (!empty($waiting)) {
		return $waiting;
	}

	$stamp = (float)microtime(true);
	if (!DI::lock()->acquire(self::LOCK_PROCESS)) {
		return false;
	}
	self::$lock_duration += (microtime(true) - $stamp);

	try {
		self::findWorkerProcesses();
	} finally {
		// Release the lock even when claiming the jobs failed with an exception,
		// otherwise the other workers would be blocked by a stale lock.
		DI::lock()->release(self::LOCK_PROCESS);
	}

	return self::getWaitingJobForPID();
}
/**
 * Removes a workerqueue entry from the current process
 *
 * All unfinished workerqueue entries that are assigned to the pid of the
 * given process are reset to "unclaimed" (pid 0, no execution date).
 *
 * @param Process $process the process behind the workerqueue
 *
 * @return void
 * @throws \Exception
 */
public static function unclaimProcess(Process $process)
{
	$started = (float)microtime(true);

	$unclaimed = ['executed' => DBA::NULL_DATETIME, 'pid' => 0];
	$claimed   = ['pid' => $process->pid, 'done' => false];
	DBA::update('workerqueue', $unclaimed, $claimed);

	self::$db_duration       += (microtime(true) - $started);
	self::$db_duration_write += (microtime(true) - $started);
}
/**
 * Runs the cron processes
 *
 * Queues the recurring tasks and performs the housekeeping of the
 * worker itself (stale workers, old workerqueue entries).
 *
 * @return void
 * @throws \Friendica\Network\HTTPException\InternalServerErrorException
 */
private static function runCron()
{
	Logger::info('Add cron entries');

	$tasks = [
		// Check for spooled items
		'SpoolPost' => PRIORITY_HIGH,
		// Run the cron job that calls all other jobs
		'Cron'      => PRIORITY_MEDIUM,
	];

	foreach ($tasks as $command => $priority) {
		self::add(['priority' => $priority, 'force_priority' => true], $command);
	}

	// Cleaning dead processes
	self::killStaleWorkers();

	// Remove old entries from the workerqueue
	self::cleanWorkerQueue();
}
/**
 * Remove old entries from the workerqueue
 *
 * Deletes the entries that are done and had been executed more than an hour
 * ago. When "optimize_tables" is enabled, the tables `workerqueue` and
 * `process` are optimized afterwards.
 *
 * @return void
 */
private static function cleanWorkerQueue()
{
	DBA::delete('workerqueue', ["`done` AND `executed` < ?", DateTimeFormat::utc('now - 1 hour')]);

	// Optimizing these tables only takes seconds
	if (!DI::config()->get('system', 'optimize_tables')) {
		return;
	}

	// We are acquiring the two locks from the worker to avoid locking problems
	if (!DI::lock()->acquire(self::LOCK_PROCESS, 10)) {
		return;
	}

	if (DI::lock()->acquire(self::LOCK_WORKER, 10)) {
		DBA::e("OPTIMIZE TABLE `workerqueue`");
		DBA::e("OPTIMIZE TABLE `process`");
		DI::lock()->release(self::LOCK_WORKER);
	}

	DI::lock()->release(self::LOCK_PROCESS);
}
2021-01-01 19:35:29 +00:00
/**
 * Fork a child process
 *
 * The parent flags the child in the IPC table and waits (at most 100 cycles
 * of 10 ms) until the child has reset that flag. The child waits the same
 * way for the flag to appear, processes the queue and terminates afterwards.
 *
 * @param boolean $do_cron Passed through to the queue processing of the child
 * @return void
 */
private static function forkProcess(bool $do_cron)
{
	if (DI::system()->isMinMemoryReached()) {
		Logger::warning('Memory limit reached - quitting');
		return;
	}

	// Children inherit their parent's database connection.
	// To avoid problems we disconnect and connect both parent and child
	DBA::disconnect();
	$pid = pcntl_fork();
	DBA::connect();

	if ($pid == -1) {
		Logger::warning('Could not spawn worker');
		return;
	}

	if ($pid) {
		// The parent process continues here
		self::IPCSetJobState(true, $pid);
		Logger::info('Spawned new worker', ['pid' => $pid]);

		$waited = 0;
		while (self::IPCJobsExists($pid) && (++$waited < 100)) {
			usleep(10000);
		}

		Logger::info('Spawned worker is ready', ['pid' => $pid, 'wait_cycles' => $waited]);
		return;
	}

	// We now are in the new worker
	DI::flushLogger();
	$process = DI::process()->create(getmypid(), basename(__FILE__));

	$waited = 0;
	while (!self::IPCJobsExists($process->pid) && (++$waited < 100)) {
		usleep(10000);
	}

	Logger::info('Worker spawned', ['pid' => $process->pid, 'wait_cycles' => $waited]);

	self::processQueue($do_cron, $process);

	// Hand back unfinished tasks and remove every trace of this worker
	self::unclaimProcess($process);
	self::IPCSetJobState(false, $process->pid);
	DI::process()->delete($process);

	Logger::info('Worker ended', ['pid' => $process->pid]);
	exit();
}
/**
 * Spawns a new worker
 *
 * In daemon mode with enabled "worker_fork" the worker is forked, otherwise
 * "bin/worker.php" is executed. In daemon mode the IPC job flag is reset afterwards.
 *
 * @param bool $do_cron When false, the worker is started with the "no_cron" option
 * @return void
 * @throws \Friendica\Network\HTTPException\InternalServerErrorException
 */
public static function spawnWorker($do_cron = false)
{
	$fork = self::isDaemonMode() && DI::config()->get('system', 'worker_fork');

	if ($fork) {
		self::forkProcess($do_cron);
	} else {
		DI::system()->run('bin/worker.php', ['no_cron' => !$do_cron]);
	}

	if (self::isDaemonMode()) {
		self::IPCSetJobState(false);
	}
}
/**
 * Adds tasks to the worker queue
 *
 * The first argument is either the priority (integer) or an array with the
 * task options "priority", "created", "delayed", "dont_fork" and
 * "force_priority". The second argument is the command, all following
 * arguments are stored as the parameters of the command.
 *
 * Examples:
 *   Worker::add(PRIORITY_HIGH, "Notifier", Delivery::DELETION, $drop_id);
 *   Worker::add(array('priority' => PRIORITY_HIGH, 'dont_fork' => true), "Delivery", $post_id);
 *
 * @param mixed ...$args priority or option array, command, command parameters
 *
 * @return int "0" if no argument had been provided, the worker queue entry already existed or
 *             there had been a database error, "1" if a "proc_run" hook rejected the execution,
 *             otherwise the ID of the worker task
 * @throws \InvalidArgumentException when the first argument is neither an integer nor an array
 * @throws \Friendica\Network\HTTPException\InternalServerErrorException
 *
 * @hooks 'proc_run'
 *    array $arr
 *
 */
public static function add(...$args)
{
	if (!count($args)) {
		return 0;
	}

	$arr = ['args' => $args, 'run_cmd' => true];

	Hook::callAll("proc_run", $arr);
	if (!$arr['run_cmd'] || !count($args)) {
		return 1;
	}

	// Defaults, possibly overwritten by the option array
	$priority = PRIORITY_MEDIUM;
	// Don't fork from frontend tasks by default
	$dont_fork = DI::config()->get("system", "worker_dont_fork", false) || !DI::mode()->isBackend();
	$created = DateTimeFormat::utcNow();
	$delayed = DBA::NULL_DATETIME;
	$force_priority = false;

	$options = array_shift($args);

	if (is_int($options)) {
		$priority = $options;
	} elseif (is_array($options)) {
		$delayed        = $options['delayed'] ?? $delayed;
		$priority       = $options['priority'] ?? $priority;
		$created        = $options['created'] ?? $created;
		$dont_fork      = $options['dont_fork'] ?? $dont_fork;
		$force_priority = $options['force_priority'] ?? $force_priority;
	} else {
		throw new \InvalidArgumentException('Priority number or task parameter array expected as first argument');
	}

	$command    = array_shift($args);
	$parameters = json_encode($args);

	$task  = ['command' => $command, 'parameter' => $parameters];
	$found = DBA::exists('workerqueue', $task + ['done' => false]);
	$added = 0;

	if (!in_array($priority, PRIORITIES)) {
		Logger::warning('Invalid priority', ['priority' => $priority, 'command' => $command, 'callstack' => System::callstack(20)]);
		$priority = PRIORITY_MEDIUM;
	}

	// Quit if there was a database error - a precaution for the update process to 3.5.3
	if (DBA::errorNo() != 0) {
		return 0;
	}

	if (!$found) {
		$inserted = DBA::insert('workerqueue', $task + ['created' => $created, 'priority' => $priority, 'next_try' => $delayed]);
		if (!$inserted) {
			return 0;
		}
		$added = DBA::lastInsertId();
	} elseif ($force_priority) {
		// Only entries that aren't claimed by a worker get the new priority
		DBA::update('workerqueue', ['priority' => $priority], $task + ['done' => false, 'pid' => 0]);
	}

	// Set the IPC flag to ensure an immediate process execution via daemon
	if (self::isDaemonMode()) {
		self::IPCSetJobState(true);
	}

	self::checkDaemonState();

	// Should we quit and wait for the worker to be called as a cronjob?
	// If there is a lock then we don't have to check for too much worker
	if ($dont_fork || !DI::lock()->acquire(self::LOCK_WORKER, 0)) {
		return $added;
	}

	// If there are already enough workers running, don't fork another one
	$quit = self::tooMuchWorkers();
	DI::lock()->release(self::LOCK_WORKER);

	// Quit as well on daemon mode
	if ($quit || self::isDaemonMode()) {
		return $added;
	}

	// Now call the worker to execute the jobs that we just added to the queue
	self::spawnWorker();

	return $added;
}
2020-12-03 15:47:50 +00:00
/**
 * Counts the unclaimed, unfinished workerqueue entries of the given command
 *
 * @param string $command Value of the `command` field of the workerqueue
 * @return mixed The result of the count query
 */
public static function countWorkersByCommand(string $command)
{
	$condition = ['done' => false, 'pid' => 0, 'command' => $command];

	return DBA::count('workerqueue', $condition);
}
/**
 * Returns the next retrial level for worker jobs.
 * This function will skip levels when jobs are older.
 *
 * The (partly randomized) delays of all levels are summed up. The highest
 * level above the current one whose accumulated delay is still lower than the
 * age of the job is returned. When there is none, the level is increased by one.
 *
 * @param array   $queue     Worker queue entry (uses the fields "id", "created" and "retrial")
 * @param integer $max_level maximum retrial level
 * @return integer the next retrial level value
 */
private static function getNextRetrial($queue, $max_level)
{
	$created = strtotime($queue['created']);
	$age     = time() - $created;

	$current = $queue['retrial'];
	$next    = $current + 1;

	$elapsed = 0;
	for ($level = 0; $level <= $max_level + 1; ++$level) {
		$elapsed += pow($level + 3, 4) + (rand(1, 30) * ($level + 1));

		if (($level > $current) && ($elapsed < $age)) {
			$next = $level;
		}
	}

	Logger::notice('New retrial for task', ['id' => $queue['id'], 'created' => $queue['created'], 'old' => $queue['retrial'], 'new' => $next]);

	return $next;
}
2018-10-15 05:19:35 +00:00
/**
 * Defers the current worker entry
 *
 * The entry is released (pid 0) and scheduled for a later execution. The
 * delay grows with the retrial level, and the priority is lowered step by
 * step for entries that had been deferred several times.
 *
 * @return boolean had the entry been deferred? False when there is no current
 *                 queue entry or when the maximum retrial level is exceeded.
 * @throws \Exception
 */
public static function defer(): bool
{
	$task = DI::app()->getQueue();
	if (empty($task)) {
		return false;
	}

	$task = self::checkPriority($task);

	$id       = $task['id'];
	$priority = $task['priority'];

	$max_level = DI::config()->get('system', 'worker_defer_limit');
	$level     = self::getNextRetrial($task, $max_level);

	if ($level > $max_level) {
		Logger::notice('The task exceeded the maximum retry count', ['id' => $id, 'created' => $task['created'], 'old_prio' => $task['priority'], 'old_retrial' => $task['retrial'], 'max_level' => $max_level, 'retrial' => $level]);
		return false;
	}

	// Calculate the delay until the next trial
	$delay = pow($level + 2, 4) + (rand(1, 30) * $level);
	$next  = DateTimeFormat::utc("now + {$delay} seconds");

	// Lower the priority of entries that had been deferred repeatedly
	if (($priority < PRIORITY_MEDIUM) && ($level > 3)) {
		$priority = PRIORITY_MEDIUM;
	} elseif (($priority < PRIORITY_LOW) && ($level > 6)) {
		$priority = PRIORITY_LOW;
	} elseif (($priority < PRIORITY_NEGLIGIBLE) && ($level > 8)) {
		$priority = PRIORITY_NEGLIGIBLE;
	}

	Logger::info('Deferred task', ['id' => $id, 'retrial' => $level, 'created' => $task['created'], 'next_execution' => $next, 'old_prio' => $task['priority'], 'new_prio' => $priority]);

	$started = (float)microtime(true);
	DBA::update(
		'workerqueue',
		['retrial' => $level, 'next_try' => $next, 'executed' => DBA::NULL_DATETIME, 'pid' => 0, 'priority' => $priority],
		['id' => $id]
	);
	self::$db_duration       += (microtime(true) - $started);
	self::$db_duration_write += (microtime(true) - $started);

	return true;
}
/**
 * Set the flag if some job is waiting
 *
 * The flag is stored in the table "worker-ipc", one row per key.
 *
 * @param boolean $jobs Is there a waiting job?
 * @param int     $key  Key number
 * @throws \Exception
 */
public static function IPCSetJobState(bool $jobs, int $key = 0)
{
	$started = (float)microtime(true);

	$row = ['jobs' => $jobs, 'key' => $key];
	DBA::replace('worker-ipc', $row);

	self::$db_duration       += (microtime(true) - $started);
	self::$db_duration_write += (microtime(true) - $started);
}
2021-01-05 16:01:05 +00:00
/**
 * Delete a key entry
 *
 * Removes the row with the given key from the table "worker-ipc".
 *
 * @param int $key Key number
 * @throws \Exception
 */
public static function IPCDeleteJobState(int $key)
{
	$started = (float)microtime(true);

	$condition = ['key' => $key];
	DBA::delete('worker-ipc', $condition);

	self::$db_duration       += (microtime(true) - $started);
	self::$db_duration_write += (microtime(true) - $started);
}
/**
 * Checks if some worker job waits to be executed
 *
 * Reads the "jobs" flag of the given key from the table "worker-ipc".
 *
 * @param int $key Key number
 * @return bool The stored flag, false when there is no row for the key
 * @throws \Exception
 */
public static function IPCJobsExists(int $key = 0)
{
	$started = (float)microtime(true);
	$state   = DBA::selectFirst('worker-ipc', ['jobs'], ['key' => $key]);
	self::$db_duration += (microtime(true) - $started);

	// When we don't have a row, no job is running
	return DBA::isResult($state) ? (bool)$state['jobs'] : false;
}
2020-10-17 12:39:42 +00:00
/**
 * Checks if the worker is running in the daemon mode.
 *
 * The daemon mode is assumed when the current executor is the daemon, when
 * "worker_daemon_mode" is set, or when the process from the configured pid
 * file is alive. The result of the pid file check is cached for the
 * remaining runtime of the process.
 *
 * @return boolean
 */
public static function isDaemonMode()
{
	if (!is_null(self::$daemon_mode)) {
		return self::$daemon_mode;
	}

	if (DI::mode()->getExecutor() == Mode::DAEMON) {
		return true;
	}

	$daemon_mode = DI::config()->get('system', 'worker_daemon_mode', false, true);
	if ($daemon_mode) {
		return $daemon_mode;
	}

	if (!function_exists('pcntl_fork')) {
		self::$daemon_mode = false;
		return false;
	}

	$pidfile = DI::config()->get('system', 'pidfile');
	if (empty($pidfile)) {
		// No pid file, no daemon
		self::$daemon_mode = false;
		return false;
	}

	if (!is_readable($pidfile)) {
		// No pid file. We assume that the daemon had been intentionally stopped.
		self::$daemon_mode = false;
		return false;
	}

	$pid = intval(file_get_contents($pidfile));

	// An empty or invalid pid file results in a pid of 0. Signalling pid 0 (or a
	// negative pid) addresses a whole process group - including our own process -
	// and would falsely report a running daemon. Only probe real process ids.
	$running = ($pid > 0) && posix_kill($pid, 0);

	self::$daemon_mode = $running;
	return $running;
}
/**
 * Test if the daemon is running. If not, it will be started
 *
 * The check is only performed when "daemon_watchdog" is enabled, the system
 * is in normal mode and the last check is at least a minute ago.
 *
 * @return void
 */
private static function checkDaemonState()
{
	if (!DI::config()->get('system', 'daemon_watchdog', false)) {
		return;
	}

	if (!DI::mode()->isNormal()) {
		return;
	}

	// Check every minute if the daemon is running
	if (DI::config()->get('system', 'last_daemon_check', 0) + 60 > time()) {
		return;
	}

	DI::config()->set('system', 'last_daemon_check', time());

	$pidfile = DI::config()->get('system', 'pidfile');
	if (empty($pidfile)) {
		// No pid file, no daemon
		return;
	}

	if (!is_readable($pidfile)) {
		// No pid file. We assume that the daemon had been intentionally stopped.
		return;
	}

	$pid = intval(file_get_contents($pidfile));

	// An empty or invalid pid file results in a pid of 0. Signalling pid 0 (or a
	// negative pid) addresses a whole process group - including our own process -
	// and would always succeed, so the daemon would never be restarted.
	if (($pid > 0) && posix_kill($pid, 0)) {
		Logger::info('Daemon process is running', ['pid' => $pid]);
		return;
	}

	Logger::warning('Daemon process is not running', ['pid' => $pid]);

	self::spawnDaemon();
}
/**
 * Spawn a new daemon process
 *
 * Executes "bin/daemon.php" with the argument "start".
 *
 * @return void
 */
private static function spawnDaemon()
{
	Logger::notice('Starting new daemon process');

	// The formerly fetched App instance was never used here and has been removed
	DI::system()->run('bin/daemon.php', ['start']);

	Logger::notice('New daemon process started');
}
2020-10-17 12:39:42 +00:00
/**
 * Check if the system is inside the defined maintenance window
 *
 * The window is defined by the config values "maintenance_start" and
 * "maintenance_end". Both are reduced to the second of the day, so a window
 * whose start is not before its end is treated as spanning midnight.
 *
 * @param boolean $check_last_execution When true, false is returned as long as the time of
 *                                      "last_cron_daily" plus the window duration lies in the future
 * @return boolean
 */
public static function isInMaintenanceWindow(bool $check_last_execution = false)
{
	// Calculate the seconds of the start and the end of the maintenance window
	$start = strtotime(DI::config()->get('system', 'maintenance_start')) % 86400;
	$end   = strtotime(DI::config()->get('system', 'maintenance_end')) % 86400;

	Logger::info('Maintenance window', ['start' => date('H:i:s', $start), 'end' => date('H:i:s', $end)]);

	if ($check_last_execution) {
		// Calculate the window duration
		$duration = abs($end - $start);

		// Quit when the last cron execution had been after the previous window
		$last_cron = DI::config()->get('system', 'last_cron_daily');
		if ($last_cron + $duration > time()) {
			Logger::info('The Daily cron had been executed recently', ['last' => date(DateTimeFormat::MYSQL, $last_cron), 'start' => date('H:i:s', $start), 'end' => date('H:i:s', $end)]);
			return false;
		}
	}

	$current = time() % 86400;

	// A regular window contains the current time, a window spanning
	// midnight is everything except the gap between its end and its start
	$execute = ($start < $end)
		? (($current >= $start) && ($current <= $end))
		: (($current <= $end) || ($current >= $start));

	$message = $execute ? 'We are inside the maintenance window' : 'We are outside the maintenance window';
	Logger::info($message, ['current' => date('H:i:s', $current), 'start' => date('H:i:s', $start), 'end' => date('H:i:s', $end)]);

	return $execute;
}
}