]> git.mxchange.org Git - friendica.git/blob - src/Core/Worker.php
Makes the linear load calculation optional
[friendica.git] / src / Core / Worker.php
1 <?php
2 /**
3  * @file src/Core/Worker.php
4  */
5 namespace Friendica\Core;
6
7 use Friendica\Core\Addon;
8 use Friendica\Core\Config;
9 use Friendica\Core\System;
10 use Friendica\Database\DBM;
11 use Friendica\Model\Process;
12 use Friendica\Util\DateTimeFormat;
13 use Friendica\Util\Lock;
14 use Friendica\Util\Network;
15 use dba;
16
17 require_once 'include/dba.php';
18
19 /**
20  * @file src/Core/Worker.php
21  *
22  * @brief Contains the class for the worker background job processing
23  */
24
25 /**
26  * @brief Worker methods
27  */
28 class Worker
29 {
30         private static $up_start;
31         private static $db_duration;
32         private static $last_update;
33         private static $lock_duration;
34
35         /**
36          * @brief Processes the tasks that are in the workerqueue table
37          *
38          * @param boolean $run_cron Should the cron processes be executed?
39          * @return void
40          */
41         public static function processQueue($run_cron = true)
42         {
43                 $a = get_app();
44
45                 self::$up_start = microtime(true);
46
47                 // At first check the maximum load. We shouldn't continue with a high load
48                 if ($a->maxload_reached()) {
49                         logger('Pre check: maximum load reached, quitting.', LOGGER_DEBUG);
50                         return;
51                 }
52
53                 // We now start the process. This is done after the load check since this could increase the load.
54                 self::startProcess();
55
56                 // Kill stale processes every 5 minutes
57                 $last_cleanup = Config::get('system', 'worker_last_cleaned', 0);
58                 if (time() > ($last_cleanup + 300)) {
59                         Config::set('system', 'worker_last_cleaned', time());
60                         self::killStaleWorkers();
61                 }
62
63                 // Count active workers and compare them with a maximum value that depends on the load
64                 if (self::tooMuchWorkers()) {
65                         logger('Pre check: Active worker limit reached, quitting.', LOGGER_DEBUG);
66                         return;
67                 }
68
69                 // Do we have too few memory?
70                 if ($a->min_memory_reached()) {
71                         logger('Pre check: Memory limit reached, quitting.', LOGGER_DEBUG);
72                         return;
73                 }
74
75                 // Possibly there are too much database connections
76                 if (self::maxConnectionsReached()) {
77                         logger('Pre check: maximum connections reached, quitting.', LOGGER_DEBUG);
78                         return;
79                 }
80
81                 // Possibly there are too much database processes that block the system
82                 if ($a->max_processes_reached()) {
83                         logger('Pre check: maximum processes reached, quitting.', LOGGER_DEBUG);
84                         return;
85                 }
86
87                 // Now we start additional cron processes if we should do so
88                 if ($run_cron) {
89                         self::runCron();
90                 }
91
92                 $starttime = time();
93
94                 // We fetch the next queue entry that is about to be executed
95                 while ($r = self::workerProcess($passing_slow)) {
96                         // When we are processing jobs with a lower priority, we don't refetch new jobs
97                         // Otherwise fast jobs could wait behind slow ones and could be blocked.
98                         $refetched = $passing_slow;
99
100                         foreach ($r as $entry) {
101                                 // Assure that the priority is an integer value
102                                 $entry['priority'] = (int)$entry['priority'];
103
104                                 // The work will be done
105                                 if (!self::execute($entry)) {
106                                         logger('Process execution failed, quitting.', LOGGER_DEBUG);
107                                         return;
108                                 }
109
110                                 // If possible we will fetch new jobs for this worker
111                                 if (!$refetched && Lock::set('worker_process', 0)) {
112                                         $stamp = (float)microtime(true);
113                                         $refetched = self::findWorkerProcesses($passing_slow);
114                                         self::$db_duration += (microtime(true) - $stamp);
115                                         Lock::remove('worker_process');
116                                 }
117                         }
118
119                         // To avoid the quitting of multiple workers only one worker at a time will execute the check
120                         if (Lock::set('worker', 0)) {
121                                 $stamp = (float)microtime(true);
122                                 // Count active workers and compare them with a maximum value that depends on the load
123                                 if (self::tooMuchWorkers()) {
124                                         logger('Active worker limit reached, quitting.', LOGGER_DEBUG);
125                                         return;
126                                 }
127
128                                 // Check free memory
129                                 if ($a->min_memory_reached()) {
130                                         logger('Memory limit reached, quitting.', LOGGER_DEBUG);
131                                         return;
132                                 }
133                                 Lock::remove('worker');
134                                 self::$db_duration += (microtime(true) - $stamp);
135                         }
136
137                         // Quit the worker once every 5 minutes
138                         if (time() > ($starttime + 300)) {
139                                 logger('Process lifetime reached, quitting.', LOGGER_DEBUG);
140                                 return;
141                         }
142                 }
143
144                 // Cleaning up. Possibly not needed, but it doesn't harm anything.
145                 if (Config::get('system', 'worker_daemon_mode', false)) {
146                         self::IPCSetJobState(false);
147                 }
148                 logger("Couldn't select a workerqueue entry, quitting.", LOGGER_DEBUG);
149         }
150
151         /**
152          * @brief Returns the number of non executed entries in the worker queue
153          *
154          * @return integer Number of non executed entries in the worker queue
155          */
156         private static function totalEntries()
157         {
158                 return dba::count('workerqueue', ["`executed` <= ? AND NOT `done`", NULL_DATE]);
159         }
160
161         /**
162          * @brief Returns the highest priority in the worker queue that isn't executed
163          *
164          * @return integer Number of active worker processes
165          */
166         private static function highestPriority()
167         {
168                 $condition = ["`executed` <= ? AND NOT `done`", NULL_DATE];
169                 $workerqueue = dba::selectFirst('workerqueue', ['priority'], $condition, ['order' => ['priority']]);
170                 if (DBM::is_result($workerqueue)) {
171                         return $workerqueue["priority"];
172                 } else {
173                         return 0;
174                 }
175         }
176
177         /**
178          * @brief Returns if a process with the given priority is running
179          *
180          * @param integer $priority The priority that should be checked
181          *
182          * @return integer Is there a process running with that priority?
183          */
184         private static function processWithPriorityActive($priority)
185         {
186                 $condition = ["`priority` <= ? AND `executed` > ? AND NOT `done`", $priority, NULL_DATE];
187                 return dba::exists('workerqueue', $condition);
188         }
189
190         /**
191          * @brief Execute a worker entry
192          *
193          * @param array $queue Workerqueue entry
194          *
195          * @return boolean "true" if further processing should be stopped
196          */
197         public static function execute($queue)
198         {
199                 $a = get_app();
200
201                 $mypid = getmypid();
202
203                 // Quit when in maintenance
204                 if (Config::get('system', 'maintenance', false, true)) {
205                         logger("Maintenance mode - quit process ".$mypid, LOGGER_DEBUG);
206                         return false;
207                 }
208
209                 // Constantly check the number of parallel database processes
210                 if ($a->max_processes_reached()) {
211                         logger("Max processes reached for process ".$mypid, LOGGER_DEBUG);
212                         return false;
213                 }
214
215                 // Constantly check the number of available database connections to let the frontend be accessible at any time
216                 if (self::maxConnectionsReached()) {
217                         logger("Max connection reached for process ".$mypid, LOGGER_DEBUG);
218                         return false;
219                 }
220
221                 $argv = json_decode($queue["parameter"], true);
222
223                 // Check for existance and validity of the include file
224                 $include = $argv[0];
225
226                 if (method_exists(sprintf('Friendica\Worker\%s', $include), 'execute')) {
227                         // We constantly update the "executed" date every minute to avoid being killed too soon
228                         if (!isset(self::$last_update)) {
229                                 self::$last_update = strtotime($queue["executed"]);
230                         }
231
232                         $age = (time() - self::$last_update) / 60;
233                         self::$last_update = time();
234
235                         if ($age > 1) {
236                                 $stamp = (float)microtime(true);
237                                 dba::update('workerqueue', ['executed' => DateTimeFormat::utcNow()], ['pid' => $mypid, 'done' => false]);
238                                 self::$db_duration += (microtime(true) - $stamp);
239                         }
240
241                         array_shift($argv);
242
243                         self::execFunction($queue, $include, $argv, true);
244
245                         $stamp = (float)microtime(true);
246                         if (dba::update('workerqueue', ['done' => true], ['id' => $queue["id"]])) {
247                                 Config::set('system', 'last_worker_execution', DateTimeFormat::utcNow());
248                         }
249                         self::$db_duration = (microtime(true) - $stamp);
250
251                         return true;
252                 }
253
254                 // The script could be provided as full path or only with the function name
255                 if ($include == basename($include)) {
256                         $include = "include/".$include.".php";
257                 }
258
259                 if (!validate_include($include)) {
260                         logger("Include file ".$argv[0]." is not valid!");
261                         dba::delete('workerqueue', ['id' => $queue["id"]]);
262                         return true;
263                 }
264
265                 require_once $include;
266
267                 $funcname = str_replace(".php", "", basename($argv[0]))."_run";
268
269                 if (function_exists($funcname)) {
270                         // We constantly update the "executed" date every minute to avoid being killed too soon
271                         if (!isset(self::$last_update)) {
272                                 self::$last_update = strtotime($queue["executed"]);
273                         }
274
275                         $age = (time() - self::$last_update) / 60;
276                         self::$last_update = time();
277
278                         if ($age > 1) {
279                                 $stamp = (float)microtime(true);
280                                 dba::update('workerqueue', ['executed' => DateTimeFormat::utcNow()], ['pid' => $mypid, 'done' => false]);
281                                 self::$db_duration += (microtime(true) - $stamp);
282                         }
283
284                         self::execFunction($queue, $funcname, $argv, false);
285
286                         $stamp = (float)microtime(true);
287                         if (dba::update('workerqueue', ['done' => true], ['id' => $queue["id"]])) {
288                                 Config::set('system', 'last_worker_execution', DateTimeFormat::utcNow());
289                         }
290                         self::$db_duration = (microtime(true) - $stamp);
291                 } else {
292                         logger("Function ".$funcname." does not exist");
293                         dba::delete('workerqueue', ['id' => $queue["id"]]);
294                 }
295
296                 return true;
297         }
298
299         /**
300          * @brief Execute a function from the queue
301          *
302          * @param array   $queue       Workerqueue entry
303          * @param string  $funcname    name of the function
304          * @param array   $argv        Array of values to be passed to the function
305          * @param boolean $method_call boolean
306          * @return void
307          */
308         private static function execFunction($queue, $funcname, $argv, $method_call)
309         {
310                 $a = get_app();
311
312                 $mypid = getmypid();
313
314                 $argc = count($argv);
315
316                 $new_process_id = uniqid("wrk", true);
317
318                 logger("Process ".$mypid." - Prio ".$queue["priority"]." - ID ".$queue["id"].": ".$funcname." ".$queue["parameter"]." - Process PID: ".$new_process_id);
319
320                 $stamp = (float)microtime(true);
321
322                 // We use the callstack here to analyze the performance of executed worker entries.
323                 // For this reason the variables have to be initialized.
324                 if (Config::get("system", "profiler")) {
325                         $a->performance["start"] = microtime(true);
326                         $a->performance["database"] = 0;
327                         $a->performance["database_write"] = 0;
328                         $a->performance["cache"] = 0;
329                         $a->performance["cache_write"] = 0;
330                         $a->performance["network"] = 0;
331                         $a->performance["file"] = 0;
332                         $a->performance["rendering"] = 0;
333                         $a->performance["parser"] = 0;
334                         $a->performance["marktime"] = 0;
335                         $a->performance["markstart"] = microtime(true);
336                         $a->callstack = [];
337                 }
338
339                 // For better logging create a new process id for every worker call
340                 // But preserve the old one for the worker
341                 $old_process_id = $a->process_id;
342                 $a->process_id = $new_process_id;
343                 $a->queue = $queue;
344
345                 $up_duration = number_format(microtime(true) - self::$up_start, 3);
346
347                 // Reset global data to avoid interferences
348                 unset($_SESSION);
349
350                 if ($method_call) {
351                         call_user_func_array(sprintf('Friendica\Worker\%s::execute', $funcname), $argv);
352                 } else {
353                         $funcname($argv, $argc);
354                 }
355
356                 $a->process_id = $old_process_id;
357                 unset($a->queue);
358
359                 $duration = number_format(microtime(true) - $stamp, 3);
360
361                 self::$up_start = microtime(true);
362
363                 /* With these values we can analyze how effective the worker is.
364                  * The database and rest time should be low since this is the unproductive time.
365                  * The execution time is the productive time.
366                  * By changing parameters like the maximum number of workers we can check the effectivness.
367                 */
368                 logger(
369                         'DB: '.number_format(self::$db_duration, 2).
370                         ' - Lock: '.number_format(self::$lock_duration, 2).
371                         ' - Rest: '.number_format($up_duration - self::$db_duration - self::$lock_duration, 2).
372                         ' - Execution: '.number_format($duration, 2),
373                         LOGGER_DEBUG
374                 );
375
376                 self::$lock_duration = 0;
377
378                 if ($duration > 3600) {
379                         logger("Prio ".$queue["priority"].": ".$queue["parameter"]." - longer than 1 hour (".round($duration/60, 3).")", LOGGER_DEBUG);
380                 } elseif ($duration > 600) {
381                         logger("Prio ".$queue["priority"].": ".$queue["parameter"]." - longer than 10 minutes (".round($duration/60, 3).")", LOGGER_DEBUG);
382                 } elseif ($duration > 300) {
383                         logger("Prio ".$queue["priority"].": ".$queue["parameter"]." - longer than 5 minutes (".round($duration/60, 3).")", LOGGER_DEBUG);
384                 } elseif ($duration > 120) {
385                         logger("Prio ".$queue["priority"].": ".$queue["parameter"]." - longer than 2 minutes (".round($duration/60, 3).")", LOGGER_DEBUG);
386                 }
387
388                 logger("Process ".$mypid." - Prio ".$queue["priority"]." - ID ".$queue["id"].": ".$funcname." - done in ".$duration." seconds. Process PID: ".$new_process_id);
389
390                 // Write down the performance values into the log
391                 if (Config::get("system", "profiler")) {
392                         $duration = microtime(true)-$a->performance["start"];
393
394                         $o = '';
395                         if (Config::get("rendertime", "callstack")) {
396                                 if (isset($a->callstack["database"])) {
397                                         $o .= "\nDatabase Read:\n";
398                                         foreach ($a->callstack["database"] as $func => $time) {
399                                                 $time = round($time, 3);
400                                                 if ($time > 0) {
401                                                         $o .= $func.": ".$time."\n";
402                                                 }
403                                         }
404                                 }
405                                 if (isset($a->callstack["database_write"])) {
406                                         $o .= "\nDatabase Write:\n";
407                                         foreach ($a->callstack["database_write"] as $func => $time) {
408                                                 $time = round($time, 3);
409                                                 if ($time > 0) {
410                                                         $o .= $func.": ".$time."\n";
411                                                 }
412                                         }
413                                 }
414                                 if (isset($a->callstack["dache"])) {
415                                         $o .= "\nCache Read:\n";
416                                         foreach ($a->callstack["dache"] as $func => $time) {
417                                                 $time = round($time, 3);
418                                                 if ($time > 0) {
419                                                         $o .= $func.": ".$time."\n";
420                                                 }
421                                         }
422                                 }
423                                 if (isset($a->callstack["dache_write"])) {
424                                         $o .= "\nCache Write:\n";
425                                         foreach ($a->callstack["dache_write"] as $func => $time) {
426                                                 $time = round($time, 3);
427                                                 if ($time > 0) {
428                                                         $o .= $func.": ".$time."\n";
429                                                 }
430                                         }
431                                 }
432                                 if (isset($a->callstack["network"])) {
433                                         $o .= "\nNetwork:\n";
434                                         foreach ($a->callstack["network"] as $func => $time) {
435                                                 $time = round($time, 3);
436                                                 if ($time > 0) {
437                                                         $o .= $func.": ".$time."\n";
438                                                 }
439                                         }
440                                 }
441                         }
442
443                         logger(
444                                 "ID ".$queue["id"].": ".$funcname.": ".sprintf(
445                                         "DB: %s/%s, Cache: %s/%s, Net: %s, I/O: %s, Other: %s, Total: %s".$o,
446                                         number_format($a->performance["database"] - $a->performance["database_write"], 2),
447                                         number_format($a->performance["database_write"], 2),
448                                         number_format($a->performance["cache"], 2),
449                                         number_format($a->performance["cache_write"], 2),
450                                         number_format($a->performance["network"], 2),
451                                         number_format($a->performance["file"], 2),
452                                         number_format($duration - ($a->performance["database"]
453                                                 + $a->performance["cache"] + $a->performance["cache_write"]
454                                                 + $a->performance["network"] + $a->performance["file"]), 2),
455                                         number_format($duration, 2)
456                                 ),
457                                 LOGGER_DEBUG
458                         );
459                 }
460
461                 $cooldown = Config::get("system", "worker_cooldown", 0);
462
463                 if ($cooldown > 0) {
464                         logger("Process ".$mypid." - Prio ".$queue["priority"]." - ID ".$queue["id"].": ".$funcname." - in cooldown for ".$cooldown." seconds");
465                         sleep($cooldown);
466                 }
467         }
468
469         /**
470          * @brief Checks if the number of database connections has reached a critical limit.
471          *
472          * @return bool Are more than 3/4 of the maximum connections used?
473          */
474         private static function maxConnectionsReached()
475         {
476                 // Fetch the max value from the config. This is needed when the system cannot detect the correct value by itself.
477                 $max = Config::get("system", "max_connections");
478
479                 // Fetch the percentage level where the worker will get active
480                 $maxlevel = Config::get("system", "max_connections_level", 75);
481
482                 if ($max == 0) {
483                         // the maximum number of possible user connections can be a system variable
484                         $r = dba::fetch_first("SHOW VARIABLES WHERE `variable_name` = 'max_user_connections'");
485                         if (DBM::is_result($r)) {
486                                 $max = $r["Value"];
487                         }
488                         // Or it can be granted. This overrides the system variable
489                         $r = dba::p('SHOW GRANTS');
490                         while ($grants = dba::fetch($r)) {
491                                 $grant = array_pop($grants);
492                                 if (stristr($grant, "GRANT USAGE ON")) {
493                                         if (preg_match("/WITH MAX_USER_CONNECTIONS (\d*)/", $grant, $match)) {
494                                                 $max = $match[1];
495                                         }
496                                 }
497                         }
498                         dba::close($r);
499                 }
500
501                 // If $max is set we will use the processlist to determine the current number of connections
502                 // The processlist only shows entries of the current user
503                 if ($max != 0) {
504                         $r = dba::p('SHOW PROCESSLIST');
505                         $used = dba::num_rows($r);
506                         dba::close($r);
507
508                         logger("Connection usage (user values): ".$used."/".$max, LOGGER_DEBUG);
509
510                         $level = ($used / $max) * 100;
511
512                         if ($level >= $maxlevel) {
513                                 logger("Maximum level (".$maxlevel."%) of user connections reached: ".$used."/".$max);
514                                 return true;
515                         }
516                 }
517
518                 // We will now check for the system values.
519                 // This limit could be reached although the user limits are fine.
520                 $r = dba::fetch_first("SHOW VARIABLES WHERE `variable_name` = 'max_connections'");
521                 if (!DBM::is_result($r)) {
522                         return false;
523                 }
524                 $max = intval($r["Value"]);
525                 if ($max == 0) {
526                         return false;
527                 }
528                 $r = dba::fetch_first("SHOW STATUS WHERE `variable_name` = 'Threads_connected'");
529                 if (!DBM::is_result($r)) {
530                         return false;
531                 }
532                 $used = intval($r["Value"]);
533                 if ($used == 0) {
534                         return false;
535                 }
536                 logger("Connection usage (system values): ".$used."/".$max, LOGGER_DEBUG);
537
538                 $level = $used / $max * 100;
539
540                 if ($level < $maxlevel) {
541                         return false;
542                 }
543                 logger("Maximum level (".$level."%) of system connections reached: ".$used."/".$max);
544                 return true;
545         }
546
547         /**
548          * @brief fix the queue entry if the worker process died
549          * @return void
550          */
551         private static function killStaleWorkers()
552         {
553                 $entries = dba::select(
554                         'workerqueue',
555                         ['id', 'pid', 'executed', 'priority', 'parameter'],
556                         ['`executed` > ? AND NOT `done` AND `pid` != 0', NULL_DATE],
557                         ['order' => ['priority', 'created']]
558                 );
559
560                 while ($entry = dba::fetch($entries)) {
561                         if (!posix_kill($entry["pid"], 0)) {
562                                 dba::update(
563                                         'workerqueue',
564                                         ['executed' => NULL_DATE, 'pid' => 0],
565                                         ['id' => $entry["id"]]
566                                 );
567                         } else {
568                                 // Kill long running processes
569                                 // Check if the priority is in a valid range
570                                 if (!in_array($entry["priority"], [PRIORITY_CRITICAL, PRIORITY_HIGH, PRIORITY_MEDIUM, PRIORITY_LOW, PRIORITY_NEGLIGIBLE])) {
571                                         $entry["priority"] = PRIORITY_MEDIUM;
572                                 }
573
574                                 // Define the maximum durations
575                                 $max_duration_defaults = [PRIORITY_CRITICAL => 720, PRIORITY_HIGH => 10, PRIORITY_MEDIUM => 60, PRIORITY_LOW => 180, PRIORITY_NEGLIGIBLE => 720];
576                                 $max_duration = $max_duration_defaults[$entry["priority"]];
577
578                                 $argv = json_decode($entry["parameter"], true);
579                                 $argv[0] = basename($argv[0]);
580
581                                 // How long is the process already running?
582                                 $duration = (time() - strtotime($entry["executed"])) / 60;
583                                 if ($duration > $max_duration) {
584                                         logger("Worker process ".$entry["pid"]." (".implode(" ", $argv).") took more than ".$max_duration." minutes. It will be killed now.");
585                                         posix_kill($entry["pid"], SIGTERM);
586
587                                         // We killed the stale process.
588                                         // To avoid a blocking situation we reschedule the process at the beginning of the queue.
589                                         // Additionally we are lowering the priority. (But not PRIORITY_CRITICAL)
590                                         $new_priority = $entry["priority"];
591                                         if ($entry["priority"] == PRIORITY_HIGH) {
592                                                 $new_priority = PRIORITY_MEDIUM;
593                                         } elseif ($entry["priority"] == PRIORITY_MEDIUM) {
594                                                 $new_priority = PRIORITY_LOW;
595                                         } elseif ($entry["priority"] != PRIORITY_CRITICAL) {
596                                                 $new_priority = PRIORITY_NEGLIGIBLE;
597                                         }
598                                         dba::update(
599                                                 'workerqueue',
600                                                 ['executed' => NULL_DATE, 'created' => DateTimeFormat::utcNow(), 'priority' => $new_priority, 'pid' => 0],
601                                                 ['id' => $entry["id"]]
602                                         );
603                                 } else {
604                                         logger("Worker process ".$entry["pid"]." (".implode(" ", $argv).") now runs for ".round($duration)." of ".$max_duration." allowed minutes. That's okay.", LOGGER_DEBUG);
605                                 }
606                         }
607                 }
608         }
609
610         /**
611          * @brief Checks if the number of active workers exceeds the given limits
612          *
613          * @return bool Are there too much workers running?
614          */
615         public static function tooMuchWorkers()
616         {
617                 $queues = Config::get("system", "worker_queues", 4);
618
619                 $maxqueues = $queues;
620
621                 $active = self::activeWorkers();
622
623                 // Decrease the number of workers at higher load
624                 $load = current_load();
625                 if ($load) {
626                         $maxsysload = intval(Config::get("system", "maxloadavg", 50));
627
628                         if (Config::get('system', 'worker_linear_load', false)) {
629                                 /* The linear load calculation works fine if there is a low
630                                  * number of maximum queues and a high load base level.
631                                  * This can be present at shared hosters.
632                                 */
633                                 $tinyload = 1;
634
635                                 if ($load > $maxsysload) {
636                                         $queues = 0;
637                                 } elseif ($load > $tinyload) {
638                                         //Provide $queues number between 1 (below max load) and $maxqueues - 1 (above tiny load).
639                                         $range = $maxsysload - $tinyload;
640                                         $slope = 1.00 - (($load - $tinyload) / $range);
641                                         $target = $slope * ($maxqueues - 1);
642                                         $queues = intval(ceil($target));
643                                 }
644                         } else {
645                                 /* The exponentional load calculation respects the load behaviour
646                                  * of Linux systems with regular hardware that normally idles
647                                  * with load values near 0.
648                                 */
649                                 $maxworkers = $queues;
650
651                                 // Some magical mathemathics to reduce the workers
652                                 $exponent = 3;
653                                 $slope = $maxworkers / pow($maxsysload, $exponent);
654                                 $queues = ceil($slope * pow(max(0, $maxsysload - $load), $exponent));
655                         }
656
657                         $processlist = '';
658
659                         if (Config::get('system', 'worker_debug')) {
660                                 // Create a list of queue entries grouped by their priority
661                                 $listitem = [];
662
663                                 // Adding all processes with no workerqueue entry
664                                 $processes = dba::p(
665                                         "SELECT COUNT(*) AS `running` FROM `process` WHERE NOT EXISTS
666                                                         (SELECT id FROM `workerqueue`
667                                                         WHERE `workerqueue`.`pid` = `process`.`pid` AND NOT `done` AND `pid` != ?)",
668                                         getmypid()
669                                 );
670
671                                 if ($process = dba::fetch($processes)) {
672                                         $listitem[0] = "0:".$process["running"];
673                                 }
674                                 dba::close($processes);
675
676                                 // Now adding all processes with workerqueue entries
677                                 $entries = dba::p("SELECT COUNT(*) AS `entries`, `priority` FROM `workerqueue` WHERE NOT `done` GROUP BY `priority`");
678                                 while ($entry = dba::fetch($entries)) {
679                                         $processes = dba::p("SELECT COUNT(*) AS `running` FROM `process` INNER JOIN `workerqueue` ON `workerqueue`.`pid` = `process`.`pid` AND NOT `done` WHERE `priority` = ?", $entry["priority"]);
680                                         if ($process = dba::fetch($processes)) {
681                                                 $listitem[$entry["priority"]] = $entry["priority"].":".$process["running"]."/".$entry["entries"];
682                                         }
683                                         dba::close($processes);
684                                 }
685                                 dba::close($entries);
686
687                                 $intervals = [1, 10, 60];
688                                 $jobs_per_minute = [];
689                                 foreach ($intervals as $interval) {
690                                         $jobs = dba::p("SELECT COUNT(*) AS `jobs` FROM `workerqueue` WHERE `done` AND `executed` > UTC_TIMESTAMP() - INTERVAL ".intval($interval)." MINUTE");
691                                         if ($job = dba::fetch($jobs)) {
692                                                 $jobs_per_minute[$interval] = number_format($job['jobs'] / $interval, 0);
693                                         }
694                                         dba::close($jobs);
695                                 }
696                                 $processlist = ' - jpm: '.implode('/', $jobs_per_minute).' ('.implode(', ', $listitem).')';
697                         }
698
699                         $entries = self::totalEntries();
700
701                         if (Config::get("system", "worker_fastlane", false) && ($queues > 0) && ($entries > 0) && ($active >= $queues)) {
702                                 $top_priority = self::highestPriority();
703                                 $high_running = self::processWithPriorityActive($top_priority);
704
705                                 if (!$high_running && ($top_priority > PRIORITY_UNDEFINED) && ($top_priority < PRIORITY_NEGLIGIBLE)) {
706                                         logger("There are jobs with priority ".$top_priority." waiting but none is executed. Open a fastlane.", LOGGER_DEBUG);
707                                         $queues = $active + 1;
708                                 }
709                         }
710
711                         logger("Load: ".$load."/".$maxsysload." - processes: ".$active."/".$entries.$processlist." - maximum: ".$queues."/".$maxqueues, LOGGER_DEBUG);
712
713                         // Are there fewer workers running as possible? Then fork a new one.
714                         if (!Config::get("system", "worker_dont_fork", false) && ($queues > ($active + 1)) && ($entries > 1)) {
715                                 logger("Active workers: ".$active."/".$queues." Fork a new worker.", LOGGER_DEBUG);
716                                 if (Config::get('system', 'worker_daemon_mode', false)) {
717                                         self::IPCSetJobState(true);
718                                 } else {
719                                         self::spawnWorker();
720                                 }
721                         }
722                 }
723
724                 // if there are too much worker, we don't spawn a new one.
725                 if (Config::get('system', 'worker_daemon_mode', false) && ($active > $queues)) {
726                         self::IPCSetJobState(false);
727                 }
728
729                 return $active > $queues;
730         }
731
732         /**
733          * @brief Returns the number of active worker processes
734          *
735          * @return integer Number of active worker processes
736          */
737         private static function activeWorkers()
738         {
739                 return dba::count('process', ['command' => 'Worker.php']);
740         }
741
742         /**
743          * @brief Check if we should pass some slow processes
744          *
745          * When the active processes of the highest priority are using more than 2/3
746          * of all processes, we let pass slower processes.
747          *
748          * @param string $highest_priority Returns the currently highest priority
749          * @return bool We let pass a slower process than $highest_priority
750          */
751         private static function passingSlow(&$highest_priority)
752         {
753                 $highest_priority = 0;
754
755                 $r = dba::p(
756                         "SELECT `priority`
757                                 FROM `process`
758                                 INNER JOIN `workerqueue` ON `workerqueue`.`pid` = `process`.`pid` AND NOT `done`"
759                 );
760
761                 // No active processes at all? Fine
762                 if (!DBM::is_result($r)) {
763                         return false;
764                 }
765                 $priorities = [];
766                 while ($line = dba::fetch($r)) {
767                         $priorities[] = $line["priority"];
768                 }
769                 dba::close($r);
770
771                 // Should not happen
772                 if (count($priorities) == 0) {
773                         return false;
774                 }
775                 $highest_priority = min($priorities);
776
777                 // The highest process is already the slowest one?
778                 // Then we quit
779                 if ($highest_priority == PRIORITY_NEGLIGIBLE) {
780                         return false;
781                 }
782                 $high = 0;
783                 foreach ($priorities as $priority) {
784                         if ($priority == $highest_priority) {
785                                 ++$high;
786                         }
787                 }
788                 logger("Highest priority: ".$highest_priority." Total processes: ".count($priorities)." Count high priority processes: ".$high, LOGGER_DEBUG);
789                 $passing_slow = (($high/count($priorities)) > (2/3));
790
791                 if ($passing_slow) {
792                         logger("Passing slower processes than priority ".$highest_priority, LOGGER_DEBUG);
793                 }
794                 return $passing_slow;
795         }
796
797         /**
798          * @brief Find and claim the next worker process for us
799          *
800          * @param boolean $passing_slow Returns if we had passed low priority processes
801          * @return boolean Have we found something?
802          */
803         private static function findWorkerProcesses(&$passing_slow)
804         {
805                 $mypid = getmypid();
806
807                 // Check if we should pass some low priority process
808                 $highest_priority = 0;
809                 $found = false;
810                 $passing_slow = false;
811
812                 // The higher the number of parallel workers, the more we prefetch to prevent concurring access
813                 // We decrease the limit with the number of entries left in the queue
814                 $worker_queues = Config::get("system", "worker_queues", 4);
815                 $queue_length = Config::get('system', 'worker_fetch_limit', 1);
816                 $lower_job_limit = $worker_queues * $queue_length * 2;
817                 $jobs = self::totalEntries();
818
819                 // Now do some magic
820                 $exponent = 2;
821                 $slope = $queue_length / pow($lower_job_limit, $exponent);
822                 $limit = min($queue_length, ceil($slope * pow($jobs, $exponent)));
823
824                 logger('Total: '.$jobs.' - Maximum: '.$queue_length.' - jobs per queue: '.$limit, LOGGER_DEBUG);
825                 $ids = [];
826                 if (self::passingSlow($highest_priority)) {
827                         // Are there waiting processes with a higher priority than the currently highest?
828                         $result = dba::select(
829                                 'workerqueue',
830                                 ['id'],
831                                 ["`executed` <= ? AND `priority` < ? AND NOT `done`", NULL_DATE, $highest_priority],
832                                 ['limit' => $limit, 'order' => ['priority', 'created']]
833                         );
834
835                         while ($id = dba::fetch($result)) {
836                                 $ids[] = $id["id"];
837                         }
838                         dba::close($result);
839
840                         $found = (count($ids) > 0);
841
842                         if (!$found) {
843                                 // Give slower processes some processing time
844                                 $result = dba::select(
845                                         'workerqueue',
846                                         ['id'],
847                                         ["`executed` <= ? AND `priority` > ? AND NOT `done`", NULL_DATE, $highest_priority],
848                                         ['limit' => $limit, 'order' => ['priority', 'created']]
849                                 );
850
851                                 while ($id = dba::fetch($result)) {
852                                         $ids[] = $id["id"];
853                                 }
854                                 dba::close($result);
855
856                                 $found = (count($ids) > 0);
857                                 $passing_slow = $found;
858                         }
859                 }
860
861                 // If there is no result (or we shouldn't pass lower processes) we check without priority limit
862                 if (!$found) {
863                         $result = dba::select(
864                                 'workerqueue',
865                                 ['id'],
866                                 ["`executed` <= ? AND NOT `done`", NULL_DATE],
867                                 ['limit' => $limit, 'order' => ['priority', 'created']]
868                         );
869
870                         while ($id = dba::fetch($result)) {
871                                 $ids[] = $id["id"];
872                         }
873                         dba::close($result);
874
875                         $found = (count($ids) > 0);
876                 }
877
878                 if ($found) {
879                         $condition = "`id` IN (".substr(str_repeat("?, ", count($ids)), 0, -2).") AND `pid` = 0 AND NOT `done`";
880                         array_unshift($ids, $condition);
881                         dba::update('workerqueue', ['executed' => DateTimeFormat::utcNow(), 'pid' => $mypid], $ids);
882                 }
883
884                 return $found;
885         }
886
887         /**
888          * @brief Returns the next worker process
889          *
890          * @param boolean $passing_slow Returns if we had passed low priority processes
891          * @return string SQL statement
892          */
893         public static function workerProcess(&$passing_slow)
894         {
895                 $stamp = (float)microtime(true);
896
897                 // There can already be jobs for us in the queue.
898                 $r = dba::select('workerqueue', [], ['pid' => getmypid(), 'done' => false]);
899                 if (DBM::is_result($r)) {
900                         self::$db_duration += (microtime(true) - $stamp);
901                         return dba::inArray($r);
902                 }
903                 dba::close($r);
904
905                 $stamp = (float)microtime(true);
906                 if (!Lock::set('worker_process')) {
907                         return false;
908                 }
909                 self::$lock_duration = (microtime(true) - $stamp);
910
911                 $stamp = (float)microtime(true);
912                 $found = self::findWorkerProcesses($passing_slow);
913                 self::$db_duration += (microtime(true) - $stamp);
914
915                 Lock::remove('worker_process');
916
917                 if ($found) {
918                         $r = dba::select('workerqueue', [], ['pid' => getmypid(), 'done' => false]);
919                         return dba::inArray($r);
920                 }
921                 return false;
922         }
923
924         /**
925          * @brief Removes a workerqueue entry from the current process
926          * @return void
927          */
928         public static function unclaimProcess()
929         {
930                 $mypid = getmypid();
931
932                 dba::update('workerqueue', ['executed' => NULL_DATE, 'pid' => 0], ['pid' => $mypid, 'done' => false]);
933         }
934
935         /**
936          * @brief Call the front end worker
937          * @return void
938          */
939         public static function callWorker()
940         {
941                 if (!Config::get("system", "frontend_worker")) {
942                         return;
943                 }
944
945                 $url = System::baseUrl()."/worker";
946                 Network::fetchUrl($url, false, $redirects, 1);
947         }
948
949         /**
950          * @brief Call the front end worker if there aren't any active
951          * @return void
952          */
953         public static function executeIfIdle()
954         {
955                 if (!Config::get("system", "frontend_worker")) {
956                         return;
957                 }
958
959                 // Do we have "proc_open"? Then we can fork the worker
960                 if (function_exists("proc_open")) {
961                         // When was the last time that we called the worker?
962                         // Less than one minute? Then we quit
963                         if ((time() - Config::get("system", "worker_started")) < 60) {
964                                 return;
965                         }
966
967                         Config::set("system", "worker_started", time());
968
969                         // Do we have enough running workers? Then we quit here.
970                         if (self::tooMuchWorkers()) {
971                                 // Cleaning dead processes
972                                 self::killStaleWorkers();
973                                 Process::deleteInactive();
974
975                                 return;
976                         }
977
978                         self::runCron();
979
980                         logger('Call worker', LOGGER_DEBUG);
981                         self::spawnWorker();
982                         return;
983                 }
984
985                 // We cannot execute background processes.
986                 // We now run the processes from the frontend.
987                 // This won't work with long running processes.
988                 self::runCron();
989
990                 self::clearProcesses();
991
992                 $workers = self::activeWorkers();
993
994                 if ($workers == 0) {
995                         self::callWorker();
996                 }
997         }
998
999         /**
1000          * @brief Removes long running worker processes
1001          * @return void
1002          */
1003         public static function clearProcesses()
1004         {
1005                 $timeout = Config::get("system", "frontend_worker_timeout", 10);
1006
1007                 /// @todo We should clean up the corresponding workerqueue entries as well
1008                 $condition = ["`created` < ? AND `command` = 'worker.php'",
1009                                 DateTimeFormat::utc("now - ".$timeout." minutes")];
1010                 dba::delete('process', $condition);
1011         }
1012
1013         /**
1014          * @brief Runs the cron processes
1015          * @return void
1016          */
1017         private static function runCron()
1018         {
1019                 logger('Add cron entries', LOGGER_DEBUG);
1020
1021                 // Check for spooled items
1022                 self::add(PRIORITY_HIGH, "SpoolPost");
1023
1024                 // Run the cron job that calls all other jobs
1025                 self::add(PRIORITY_MEDIUM, "Cron");
1026
1027                 // Cleaning dead processes
1028                 self::killStaleWorkers();
1029         }
1030
1031         /**
1032          * @brief Spawns a new worker
1033          * @return void
1034          */
1035         public static function spawnWorker($do_cron = false)
1036         {
1037                 $args = ["bin/worker.php"];
1038
1039                 if (!$do_cron) {
1040                         $args[] = "no_cron";
1041                 }
1042
1043                 get_app()->proc_run($args);
1044
1045                 // after spawning we have to remove the flag.
1046                 if (Config::get('system', 'worker_daemon_mode', false)) {
1047                         self::IPCSetJobState(false);
1048                 }
1049         }
1050
1051         /**
1052          * @brief Adds tasks to the worker queue
1053          *
1054          * @param (integer|array) priority or parameter array, strings are deprecated and are ignored
1055          *
1056          * next args are passed as $cmd command line
1057          * or: Worker::add(PRIORITY_HIGH, "Notifier", "drop", $drop_id);
1058          * or: Worker::add(array('priority' => PRIORITY_HIGH, 'dont_fork' => true), "CreateShadowEntry", $post_id);
1059          *
1060          * @note $cmd and string args are surrounded with ""
1061          *
1062          * @hooks 'proc_run'
1063          *      array $arr
1064          *
1065          * @return boolean "false" if proc_run couldn't be executed
1066          */
1067         public static function add($cmd)
1068         {
1069                 $args = func_get_args();
1070
1071                 if (!count($args)) {
1072                         return false;
1073                 }
1074
1075                 $arr = ['args' => $args, 'run_cmd' => true];
1076
1077                 Addon::callHooks("proc_run", $arr);
1078                 if (!$arr['run_cmd'] || !count($args)) {
1079                         return true;
1080                 }
1081
1082                 $priority = PRIORITY_MEDIUM;
1083                 $dont_fork = Config::get("system", "worker_dont_fork", false);
1084                 $created = DateTimeFormat::utcNow();
1085
1086                 $run_parameter = array_shift($args);
1087
1088                 if (is_int($run_parameter)) {
1089                         $priority = $run_parameter;
1090                 } elseif (is_array($run_parameter)) {
1091                         if (isset($run_parameter['priority'])) {
1092                                 $priority = $run_parameter['priority'];
1093                         }
1094                         if (isset($run_parameter['created'])) {
1095                                 $created = $run_parameter['created'];
1096                         }
1097                         if (isset($run_parameter['dont_fork'])) {
1098                                 $dont_fork = $run_parameter['dont_fork'];
1099                         }
1100                 }
1101
1102                 $parameters = json_encode($args);
1103                 $found = dba::exists('workerqueue', ['parameter' => $parameters, 'done' => false]);
1104
1105                 // Quit if there was a database error - a precaution for the update process to 3.5.3
1106                 if (dba::errorNo() != 0) {
1107                         return false;
1108                 }
1109
1110                 if (!$found) {
1111                         dba::insert('workerqueue', ['parameter' => $parameters, 'created' => $created, 'priority' => $priority]);
1112                 }
1113
1114                 // Should we quit and wait for the worker to be called as a cronjob?
1115                 if ($dont_fork) {
1116                         return true;
1117                 }
1118
1119                 // If there is a lock then we don't have to check for too much worker
1120                 if (!Lock::set('worker', 0)) {
1121                         return true;
1122                 }
1123
1124                 // If there are already enough workers running, don't fork another one
1125                 $quit = self::tooMuchWorkers();
1126                 Lock::remove('worker');
1127
1128                 if ($quit) {
1129                         return true;
1130                 }
1131
1132                 // We tell the daemon that a new job entry exists
1133                 if (Config::get('system', 'worker_daemon_mode', false)) {
1134                         // We don't have to set the IPC flag - this is done in "tooMuchWorkers"
1135                         return true;
1136                 }
1137
1138                 // Now call the worker to execute the jobs that we just added to the queue
1139                 self::spawnWorker();
1140
1141                 return true;
1142         }
1143
1144         /**
1145          * Log active processes into the "process" table
1146          *
1147          * @brief Log active processes into the "process" table
1148          */
1149         public static function startProcess()
1150         {
1151                 $trace = debug_backtrace(DEBUG_BACKTRACE_IGNORE_ARGS, 1);
1152
1153                 $command = basename($trace[0]['file']);
1154
1155                 Process::deleteInactive();
1156
1157                 Process::insert($command);
1158         }
1159
1160         /**
1161          * Remove the active process from the "process" table
1162          *
1163          * @brief Remove the active process from the "process" table
1164          * @return bool
1165          */
1166         public static function endProcess()
1167         {
1168                 return Process::deleteByPid();
1169         }
1170
1171         /**
1172          * Set the flag if some job is waiting
1173          *
1174          * @brief Set the flag if some job is waiting
1175          * @param boolean $jobs Is there a waiting job?
1176          */
1177         public static function IPCSetJobState($jobs)
1178         {
1179                 dba::update('worker-ipc', ['jobs' => $jobs], ['key' => 1], true);
1180         }
1181
1182         /**
1183          * Checks if some worker job waits to be executed
1184          *
1185          * @brief Checks if some worker job waits to be executed
1186          * @return bool
1187          */
1188         public static function IPCJobsExists()
1189         {
1190                 $row = dba::selectFirst('worker-ipc', ['jobs'], ['key' => 1]);
1191
1192                 // When we don't have a row, no job is running
1193                 if (!DBM::is_result($row)) {
1194                         return false;
1195                 }
1196
1197                 return (bool)$row['jobs'];
1198         }
1199 }