]> git.mxchange.org Git - friendica.git/blob - include/cron.php
More transactions, more queries on uncommitted data
[friendica.git] / include / cron.php
1 <?php
// If boot.php cannot be found in the current working directory and command
// line arguments are available, derive the base directory from the script
// path in argv[0] (one level above the script's directory) and switch to it.
if (!file_exists("boot.php") && (sizeof($_SERVER["argv"]) != 0)) {
        $directory = dirname($_SERVER["argv"][0]);

        // Turn a relative script path into an absolute one
        if (strpos($directory, "/") !== 0) {
                $directory = $_SERVER["PWD"]."/".$directory;
        }

        $directory = realpath($directory."/..");

        chdir($directory);
}

require_once("boot.php");
14
15
/**
 * @brief Run the periodic maintenance tasks
 *
 * Creates the global App and database objects when they do not exist yet,
 * hands several background scripts to proc_run() and executes the
 * maintenance functions defined in this file. Nothing is done when the
 * configured cron interval (default: 10 minutes) has not yet passed since
 * the last recorded run.
 *
 * @param Array $argv Array of command line arguments (handed to cron_poll_contacts)
 * @param Integer $argc Number of command line arguments
 */
function cron_run(&$argv, &$argc){
        global $a, $db;

        if (is_null($a)) {
                $a = new App;
        }

        if (is_null($db)) {
                // The configuration file provides the $db_* connection variables
                @include(".htconfig.php");
                require_once("include/dba.php");
                $db = new dba($db_host, $db_user, $db_pass, $db_data);
                unset($db_host, $db_user, $db_pass, $db_data);
        }

        require_once('include/session.php');
        require_once('include/datetime.php');
        require_once('include/items.php');
        require_once('include/Contact.php');
        require_once('include/email.php');
        require_once('include/socgraph.php');
        require_once('mod/nodeinfo.php');
        require_once('include/post_update.php');

        load_config('config');
        load_config('system');

        // Don't check this stuff if the function is called by the poller
        if (App::callstack() != "poller_run") {
                if (App::maxload_reached()) {
                        return;
                }
                if (App::is_already_running('cron', 'include/cron.php', 540)) {
                        return;
                }
        }

        $last_run = get_config('system','last_cron');

        // Interval between two cron runs in minutes (default: 10)
        $cron_interval = intval(get_config('system','cron_interval'));
        if (!$cron_interval) {
                $cron_interval = 10;
        }

        // Leave when the last run is more recent than the interval allows
        if ($last_run && (($last_run + ($cron_interval * 60)) > time())) {
                logger('cron intervall not reached');
                return;
        }

        $a->set_baseurl(get_config('system','url'));

        load_hooks();

        logger('cron: start');

        // run queue delivery process in the background
        proc_run(PRIORITY_NEGLIGIBLE, "include/queue.php");

        // run the process to discover global contacts in the background
        proc_run(PRIORITY_LOW, "include/discover_poco.php");

        // run the process to update locally stored global contacts in the background
        proc_run(PRIORITY_LOW, "include/discover_poco.php", "checkcontact");

        // Expire and remove user entries
        cron_expire_and_remove_users();

        if (get_config("system", "worker")) {
                // The worker is active: split the jobs in several sub processes

                // Check OStatus conversations
                proc_run(PRIORITY_MEDIUM, "include/cronjobs.php", "ostatus_mentions");

                // Check every conversation
                proc_run(PRIORITY_MEDIUM, "include/cronjobs.php", "ostatus_conversations");

                // Call possible post update functions
                proc_run(PRIORITY_LOW, "include/cronjobs.php", "post_update");

                // update nodeinfo data
                proc_run(PRIORITY_LOW, "include/cronjobs.php", "nodeinfo");
        } else {
                // No worker: execute the same jobs directly

                // Check only conversations with mentions (for a longer time)
                ostatus::check_conversations(true);

                // Check every conversation
                ostatus::check_conversations(false);

                // Call possible post update functions
                // see include/post_update.php for more details
                post_update();

                // update nodeinfo data
                nodeinfo_cron();
        }

        // once daily run birthday_updates and then expire in background
        $last_expire_day = get_config('system','last_expire_day');
        $today           = intval(datetime_convert('UTC','UTC','now','d'));

        if ($today != intval($last_expire_day)) {

                update_contact_birthdays();

                proc_run(PRIORITY_LOW, "include/discover_poco.php", "suggestions");

                set_config('system','last_expire_day',$today);

                proc_run(PRIORITY_LOW, 'include/expire.php');

                if (get_config("system", "worker")) {
                        // One dbclean job for each of the stages 1 to 4
                        for ($stage = 1; $stage <= 4; $stage++) {
                                proc_run(PRIORITY_LOW, 'include/dbclean.php', $stage);
                        }
                } else {
                        proc_run(PRIORITY_LOW, 'include/dbclean.php');
                }

                cron_update_photo_albums();
        }

        // Clear cache entries
        cron_clear_cache($a);

        // Repair missing Diaspora values in contacts
        cron_repair_diaspora($a);

        // Repair entries in the database
        cron_repair_database();

        // Poll contacts
        cron_poll_contacts($argc, $argv);

        logger('cron: end');

        // Remember the time of this run for the interval check
        set_config('system','last_cron', time());
}
159
/**
 * @brief Refresh the cached photo album data of every active user
 *
 * Calls photo_albums() with its second argument set to true for each user
 * that is neither expired nor removed.
 */
function cron_update_photo_albums() {
        $users = q("SELECT `uid` FROM `user` WHERE NOT `account_expired` AND NOT `account_removed`");

        if (dbm::is_result($users)) {
                foreach ($users as $row) {
                        photo_albums($row['uid'], true);
                }
        }
}
172
/**
 * @brief Expire and remove user entries
 *
 * Flags accounts as expired once their expiry date has passed and deletes
 * the user and contact records of removed accounts whose
 * `account_expires_on` date lies more than three days in the past.
 */
function cron_expire_and_remove_users() {
        // expire any expired accounts
        q("UPDATE user SET `account_expired` = 1 where `account_expired` = 0
                AND `account_expires_on` != '0000-00-00 00:00:00'
                AND `account_expires_on` < UTC_TIMESTAMP() ");

        // delete user and contact records for recently removed accounts
        // (only the uid is needed, so don't fetch the complete user rows)
        $r = q("SELECT `uid` FROM `user` WHERE `account_removed` AND `account_expires_on` < UTC_TIMESTAMP() - INTERVAL 3 DAY");
        if (!dbm::is_result($r)) {
                return;
        }

        foreach ($r as $user) {
                q("DELETE FROM `contact` WHERE `uid` = %d", intval($user['uid']));
                q("DELETE FROM `user` WHERE `uid` = %d", intval($user['uid']));
        }
}
191
/**
 * @brief Poll contacts for unreceived messages
 *
 * Selects the contacts that qualify for polling and hands each contact that
 * is due to include/onepoll.php via proc_run().
 *
 * The first command line argument ($argv[1]) is interpreted as follows:
 *  - 'force':   poll every selected contact, regardless of its last update
 *  - 'restart': requires a non-zero generation number in $argv[2],
 *               otherwise killme() is called
 *  - a number:  poll only the contact with this id (implies 'force')
 *
 * @param Integer $argc Number of command line arguments
 * @param Array $argv Array of command line arguments
 */
function cron_poll_contacts($argc, $argv) {
        $manual_id = 0;
        $force     = false;

        if (($argc > 1) && ($argv[1] == 'force')) {
                $force = true;
        }

        if (($argc > 1) && ($argv[1] == 'restart')) {
                // A missing generation argument is treated like an invalid (zero) one
                // instead of reading an undefined array offset.
                $generation = (($argc > 2) ? intval($argv[2]) : 0);
                if (!$generation) {
                        killme();
                }
        }

        if (($argc > 1) && intval($argv[1])) {
                $manual_id = intval($argv[1]);
                $force     = true;
        }

        // Seconds to wait between two polls. Falls back to the delivery
        // interval, or to 3 when that isn't configured either.
        $interval = intval(get_config('system','poll_interval'));
        if (!$interval) {
                $delivery_interval = get_config('system','delivery_interval');
                $interval = (($delivery_interval === false) ? 3 : intval($delivery_interval));
        }

        // If we are using the worker we don't need a delivery interval
        if (get_config("system", "worker")) {
                $interval = false;
        }

        $sql_extra = (($manual_id) ? " AND `id` = $manual_id " : "");

        reload_plugins();

        // Only poll from those with suitable relationships,
        // and which have a polling address and ignore Diaspora since
        // we are unable to match those posts with a Diaspora GUID and prevent duplicates.

        $abandon_days = intval(get_config('system','account_abandon_days'));
        if ($abandon_days < 1) {
                $abandon_days = 0;
        }

        // Optionally skip the contacts of users who didn't log in for a while
        $abandon_sql = (($abandon_days)
                ? sprintf(" AND `user`.`login_date` > UTC_TIMESTAMP() - INTERVAL %d DAY ", intval($abandon_days))
                : ''
        );

        $contacts = q("SELECT `contact`.`id` FROM `contact` INNER JOIN `user` ON `user`.`uid` = `contact`.`uid`
                WHERE `rel` IN (%d, %d) AND `poll` != '' AND `network` IN ('%s', '%s', '%s', '%s', '%s', '%s')
                $sql_extra
                AND NOT `self` AND NOT `contact`.`blocked` AND NOT `contact`.`readonly` AND NOT `contact`.`archive`
                AND NOT `user`.`account_expired` AND NOT `user`.`account_removed` $abandon_sql ORDER BY RAND()",
                intval(CONTACT_IS_SHARING),
                intval(CONTACT_IS_FRIEND),
                dbesc(NETWORK_DFRN),
                dbesc(NETWORK_ZOT),
                dbesc(NETWORK_OSTATUS),
                dbesc(NETWORK_FEED),
                dbesc(NETWORK_MAIL),
                dbesc(NETWORK_MAIL2)
        );

        // Covers an empty result as well as a failed query
        if (!dbm::is_result($contacts)) {
                return;
        }

        foreach ($contacts as $c) {

                $res = q("SELECT * FROM `contact` WHERE `id` = %d LIMIT 1",
                        intval($c['id'])
                );

                if (!dbm::is_result($res)) {
                        continue;
                }

                foreach ($res as $contact) {

                        // A manually requested contact is treated as never updated
                        if ($manual_id) {
                                $contact['last-update'] = '0000-00-00 00:00:00';
                        }

                        if (in_array($contact['network'], array(NETWORK_DFRN, NETWORK_ZOT, NETWORK_OSTATUS))) {
                                $contact['priority'] = 2;
                        }

                        if ($contact['subhub'] && in_array($contact['network'], array(NETWORK_DFRN, NETWORK_ZOT, NETWORK_OSTATUS))) {
                                // We should be getting everything via a hub. But just to be sure, let's check once a day.
                                // (You can make this more or less frequent if desired by setting 'pushpoll_frequency' appropriately)
                                // This also lets us update our subscription to the hub, and add or replace hubs in case it
                                // changed. We will only update hubs once a day, regardless of 'pushpoll_frequency'.

                                $poll_interval = get_config('system','pushpoll_frequency');
                                $contact['priority'] = (($poll_interval !== false) ? intval($poll_interval) : 3);
                        }

                        if ($contact['priority'] && !$force) {

                                $t = $contact['last-update'];

                                /**
                                 * Based on $contact['priority'], should we poll this site now? Or later?
                                 * The priority selects the minimum time between two polls.
                                 */
                                switch ($contact['priority']) {
                                        case 5:
                                                $poll_after = " + 1 month";
                                                break;
                                        case 4:
                                                $poll_after = " + 1 week";
                                                break;
                                        case 3:
                                                $poll_after = " + 1 day";
                                                break;
                                        case 2:
                                                $poll_after = " + 12 hour";
                                                break;
                                        case 1:
                                        default:
                                                $poll_after = " + 1 hour";
                                                break;
                                }

                                $now  = datetime_convert('UTC','UTC', 'now');
                                $next = datetime_convert('UTC','UTC', $t . $poll_after);

                                // Not due yet
                                if (!($now > $next)) {
                                        continue;
                                }
                        }

                        logger("Polling ".$contact["network"]." ".$contact["id"]." ".$contact["nick"]." ".$contact["name"]);

                        proc_run(PRIORITY_MEDIUM, 'include/onepoll.php', $contact['id']);

                        // Pause between two polls when an interval is set
                        if ($interval) {
                                @time_sleep_until(microtime(true) + (float) $interval);
                        }
                }
        }
}
340
/**
 * @brief Clear cache entries
 *
 * Runs at most once per hour (tracked in the config value
 * system/cache_last_cleared). Clears the different caches, removes old
 * cached database entries and optimizes fragmented tables that are not
 * larger than the configured maximum size.
 *
 * @param App $a
 */
function cron_clear_cache(&$a) {

        $last = get_config('system','cache_last_cleared');

        // Once per hour
        if ($last && (($last + 3600) > time())) {
                return;
        }

        // clear old cache
        Cache::clear();

        // clear old item cache files
        clear_cache();

        // clear cache for photos
        clear_cache($a->get_basepath(), $a->get_basepath()."/photo");

        // clear smarty cache
        clear_cache($a->get_basepath()."/view/smarty3/compiled", $a->get_basepath()."/view/smarty3/compiled");

        // clear cache for image proxy
        if (!get_config("system", "proxy_disabled")) {
                clear_cache($a->get_basepath(), $a->get_basepath()."/proxy");

                $cachetime = get_config('system','proxy_cache_time');
                if (!$cachetime) {
                        $cachetime = PROXY_DEFAULT_TIME;
                }

                q('DELETE FROM `photo` WHERE `uid` = 0 AND `resource-id` LIKE "pic:%%" AND `created` < NOW() - INTERVAL %d SECOND', intval($cachetime));
        }

        // Delete the cached OEmbed entries that are older than three months
        q("DELETE FROM `oembed` WHERE `created` < NOW() - INTERVAL 3 MONTH");

        // Delete the cached "parse_url" entries that are older than three months
        q("DELETE FROM `parsed_url` WHERE `created` < NOW() - INTERVAL 3 MONTH");

        // Maximum table size in megabyte
        $max_tablesize = intval(get_config('system','optimize_max_tablesize')) * 1000000;
        if ($max_tablesize == 0) {
                $max_tablesize = 100 * 1000000; // Default are 100 MB
        }

        if ($max_tablesize > 0) {
                // Minimum fragmentation level in percent
                $fragmentation_level = intval(get_config('system','optimize_fragmentation')) / 100;
                if ($fragmentation_level == 0) {
                        $fragmentation_level = 0.3; // Default value is 30%
                }

                // Optimize some tables that need to be optimized.
                // The table list is only walked when the query returned rows.
                $tables = q("SHOW TABLE STATUS");
                if (dbm::is_result($tables)) {
                        foreach ($tables as $table) {

                                // Don't optimize tables that are too large
                                if ($table["Data_length"] > $max_tablesize) {
                                        continue;
                                }

                                // Don't optimize empty tables
                                if ($table["Data_length"] == 0) {
                                        continue;
                                }

                                // Calculate fragmentation
                                $fragmentation = $table["Data_free"] / ($table["Data_length"] + $table["Index_length"]);

                                logger("Table ".$table["Name"]." - Fragmentation level: ".round($fragmentation * 100, 2), LOGGER_DEBUG);

                                // Don't optimize tables that needn't to be optimized
                                if ($fragmentation < $fragmentation_level) {
                                        continue;
                                }

                                // So optimize it
                                logger("Optimize Table ".$table["Name"], LOGGER_DEBUG);
                                q("OPTIMIZE TABLE `%s`", dbesc($table["Name"]));
                        }
                }
        }

        set_config('system','cache_last_cleared', time());
}
427
/**
 * @brief Repair missing values in Diaspora contacts
 *
 * Picks up to 50 random Diaspora contacts that lack a batch, notify or poll
 * address or a public key, probes their URL again and stores the probed
 * values when the probe still reports a Diaspora contact.
 *
 * @param App $a
 */
function cron_repair_diaspora(&$a) {
        $incomplete = q("SELECT `id`, `url` FROM `contact`
                WHERE `network` = '%s' AND (`batch` = '' OR `notify` = '' OR `poll` = '' OR pubkey = '')
                        ORDER BY RAND() LIMIT 50", dbesc(NETWORK_DIASPORA));

        if (!$incomplete) {
                return;
        }

        foreach ($incomplete as $contact) {
                // Skip contacts that are not reachable
                if (!poco_reachable($contact["url"])) {
                        continue;
                }

                $data = probe_url($contact["url"]);

                // Only use the probed data when it belongs to a Diaspora contact
                if ($data["network"] != NETWORK_DIASPORA) {
                        continue;
                }

                logger("Repair contact ".$contact["id"]." ".$contact["url"], LOGGER_DEBUG);
                q("UPDATE `contact` SET `batch` = '%s', `notify` = '%s', `poll` = '%s', pubkey = '%s' WHERE `id` = %d",
                        dbesc($data["batch"]), dbesc($data["notify"]), dbesc($data["poll"]), dbesc($data["pubkey"]),
                        intval($contact["id"]));
        }
}
451
/**
 * @brief Do some repairs in database entries
 *
 * Fills in missing item parents, restores empty nicknames of self contacts
 * and updates the global contact of every verified, active local user.
 */
function cron_repair_database() {

        // Set the parent if it wasn't set. (Shouldn't happen - but does sometimes)
        // This call is very "cheap" so we can do it at any time without a problem
        q("UPDATE `item` INNER JOIN `item` AS `parent` ON `parent`.`uri` = `item`.`parent-uri` AND `parent`.`uid` = `item`.`uid` SET `item`.`parent` = `parent`.`id` WHERE `item`.`parent` = 0");

        // There was an issue where the nick vanishes from the contact table
        q("UPDATE `contact` INNER JOIN `user` ON `contact`.`uid` = `user`.`uid` SET `nick` = `nickname` WHERE `self` AND `nick`=''");

        // Update the global contacts for local users
        $local_users = q("SELECT `uid` FROM `user` WHERE `verified` AND NOT `blocked` AND NOT `account_removed` AND NOT `account_expired`");
        if ($local_users) {
                foreach ($local_users as $local_user) {
                        update_gcontact_for_user($local_user["uid"]);
                }
        }

        /// @todo
        /// - remove thread entries without item
        /// - remove sign entries without item
        /// - remove children when parent got lost
        /// - set contact-id in item when not present
}
477
// Only run the cron job when this file is the first entry in the list of
// included files - presumably meaning it was executed directly and not
// merely included by another script.
if (array_search(__FILE__, get_included_files()) === 0) {
        cron_run($_SERVER["argv"], $_SERVER["argc"]);
        killme();
}