]> git.mxchange.org Git - friendica.git/blob - include/cron.php
Merge remote-tracking branch 'upstream/develop' into 1610-priority-dbclean
[friendica.git] / include / cron.php
1 <?php
// When the script is started from another working directory, boot.php is not
// found relative to the current directory. In that case derive the location
// from the script path and change into the directory above it.
if (!file_exists("boot.php") && (count($_SERVER["argv"]) != 0)) {
	$directory = dirname($_SERVER["argv"][0]);

	// A path that doesn't start with a slash is relative to the current directory
	if (substr($directory, 0, 1) != "/") {
		$directory = $_SERVER["PWD"]."/".$directory;
	}

	// Go one level up from the directory that contains this script
	$directory = realpath($directory."/..");

	chdir($directory);
}
12
13 require_once("boot.php");
14
15
/**
 * @brief Run the periodic maintenance tasks
 *
 * Creates the global App and database objects when they are missing, returns
 * early while the configured cron interval has not elapsed, starts the
 * background processes and finally polls the contacts. After a completed run
 * the current time is stored in the config value system/last_cron.
 *
 * @param Array $argv Array of command line arguments (handed over to cron_poll_contacts())
 * @param Integer $argc Number of command line arguments (handed over to cron_poll_contacts())
 */
function cron_run(&$argv, &$argc) {
	global $a, $db;

	if (is_null($a)) {
		$a = new App;
	}

	if (is_null($db)) {
		// The configuration file provides the $db_* connection variables
		@include(".htconfig.php");
		require_once("include/dba.php");
		$db = new dba($db_host, $db_user, $db_pass, $db_data);
		unset($db_host, $db_user, $db_pass, $db_data);
	}

	require_once('include/session.php');
	require_once('include/datetime.php');
	require_once('include/items.php');
	require_once('include/Contact.php');
	require_once('include/email.php');
	require_once('include/socgraph.php');
	require_once('mod/nodeinfo.php');
	require_once('include/post_update.php');

	load_config('config');
	load_config('system');

	// The load check and the "already running" check are skipped when the poller is the caller
	if ((App::callstack() != "poller_run")
		&& (App::maxload_reached() || App::is_already_running('cron', 'include/cron.php', 540))) {
		return;
	}

	$last_run = get_config('system','last_cron');

	// Interval between two runs in minutes, 10 when nothing is configured
	$interval_minutes = intval(get_config('system','cron_interval'));
	if (!$interval_minutes) {
		$interval_minutes = 10;
	}

	if ($last_run && (($last_run + ($interval_minutes * 60)) > time())) {
		logger('cron intervall not reached');
		return;
	}

	$a->set_baseurl(get_config('system','url'));

	load_hooks();

	logger('cron: start');

	// Queue delivery runs in the background
	proc_run(PRIORITY_NEGLIGIBLE, "include/queue.php");

	// Discovery of global contacts runs in the background
	proc_run(PRIORITY_LOW, "include/discover_poco.php");

	// Update of the locally stored global contacts runs in the background
	proc_run(PRIORITY_LOW, "include/discover_poco.php", "checkcontact");

	// Expire and remove user entries
	cron_expire_and_remove_users();

	if (get_config("system", "worker")) {
		// With an active worker every job becomes its own sub process.
		// The order is: OStatus conversations with mentions, every
		// conversation, post update functions, nodeinfo data.
		$cronjobs = array(
			"ostatus_mentions"      => PRIORITY_MEDIUM,
			"ostatus_conversations" => PRIORITY_MEDIUM,
			"post_update"           => PRIORITY_LOW,
			"nodeinfo"              => PRIORITY_LOW,
		);

		foreach ($cronjobs as $job => $priority) {
			proc_run($priority, "include/cronjobs.php", $job);
		}
	} else {
		// Without the worker the same jobs are executed in this process

		// Check only conversations with mentions (for a longer time)
		ostatus::check_conversations(true);

		// Check every conversation
		ostatus::check_conversations(false);

		// Call possible post update functions,
		// see include/post_update.php for more details
		post_update();

		// Update nodeinfo data
		nodeinfo_cron();
	}

	// The following jobs are done once per day (UTC): birthday updates,
	// contact suggestions, expiration, database cleanup and photo album counts
	$stored_day  = get_config('system','last_expire_day');
	$current_day = intval(datetime_convert('UTC','UTC','now','d'));

	if ($current_day != intval($stored_day)) {
		update_contact_birthdays();

		proc_run(PRIORITY_LOW, "include/discover_poco.php", "suggestions");

		set_config('system','last_expire_day',$current_day);

		proc_run(PRIORITY_LOW, 'include/expire.php');

		proc_run(PRIORITY_LOW, 'include/dbclean.php');

		cron_update_photo_albums();
	}

	// Clear cache entries
	cron_clear_cache($a);

	// Repair missing Diaspora values in contacts
	cron_repair_diaspora($a);

	// Repair entries in the database
	cron_repair_database();

	// Poll contacts
	cron_poll_contacts($argc, $argv);

	logger('cron: end');

	set_config('system','last_cron', time());
}
152
/**
 * @brief Update the cached values for the number of photo albums per user
 *
 * Calls photo_albums() with the second argument set to true for every user
 * that is neither expired nor removed.
 */
function cron_update_photo_albums() {
	$users = q("SELECT `uid` FROM `user` WHERE NOT `account_expired` AND NOT `account_removed`");

	if (dbm::is_result($users)) {
		foreach ($users as $row) {
			photo_albums($row['uid'], true);
		}
	}
}
165
/**
 * @brief Expire and remove user entries
 *
 * Flags accounts as expired once their expiration date has passed and deletes
 * the user and contact rows of removed accounts whose expiration date lies
 * more than three days in the past.
 */
function cron_expire_and_remove_users() {
	// Mark accounts as expired when an expiration date is set and has been reached
	q("UPDATE user SET `account_expired` = 1 where `account_expired` = 0
		AND `account_expires_on` != '0000-00-00 00:00:00'
		AND `account_expires_on` < UTC_TIMESTAMP() ");

	// Fetch the removed accounts that are due for deletion
	$removed = q("SELECT * FROM `user` WHERE `account_removed` AND `account_expires_on` < UTC_TIMESTAMP() - INTERVAL 3 DAY");
	if (!$removed) {
		return;
	}

	foreach ($removed as $account) {
		// The contacts are deleted before the user row itself
		q("DELETE FROM `contact` WHERE `uid` = %d", intval($account['uid']));
		q("DELETE FROM `user` WHERE `uid` = %d", intval($account['uid']));
	}
}
184
/**
 * @brief Poll contacts for unreceived messages
 *
 * Selects the contacts that qualify for polling, checks for every contact
 * whether the waiting time that belongs to its priority has elapsed since the
 * last update and starts include/onepoll.php for it in the background.
 *
 * The first command line argument changes the behaviour:
 *  - 'force':    every selected contact is polled regardless of its last update
 *  - 'restart':  the second argument has to be a non-zero number, otherwise the
 *                process is terminated via killme()
 *  - a number:   only the contact with this id is polled, and it is polled at once
 *
 * @param Integer $argc Number of command line arguments
 * @param Array $argv Array of command line arguments
 */
function cron_poll_contacts($argc, $argv) {
	$manual_id = 0;
	$force     = false;

	if (($argc > 1) && ($argv[1] == 'force')) {
		$force = true;
	}

	if (($argc > 1) && ($argv[1] == 'restart')) {
		// A missing second argument is treated like an invalid one,
		// without reading an undefined array offset
		$generation = (isset($argv[2]) ? intval($argv[2]) : 0);
		if (!$generation) {
			killme();
		}
	}

	if (($argc > 1) && intval($argv[1])) {
		$manual_id = intval($argv[1]);
		$force     = true;
	}

	// Seconds to wait between two spawned poll processes.
	// Falls back to the delivery interval and then to 3 seconds.
	$interval = intval(get_config('system','poll_interval'));
	if (!$interval) {
		$delivery_interval = get_config('system','delivery_interval');
		$interval = (($delivery_interval === false) ? 3 : intval($delivery_interval));
	}

	// If we are using the worker we don't need a delivery interval
	if (get_config("system", "worker")) {
		$interval = false;
	}

	// $manual_id is the result of intval(), so it is safe inside the query
	$sql_extra = (($manual_id) ? " AND `id` = $manual_id " : "");

	reload_plugins();

	// Only poll from those with suitable relationships,
	// and which have a polling address and ignore Diaspora since
	// we are unable to match those posts with a Diaspora GUID and prevent duplicates.

	$abandon_days = intval(get_config('system','account_abandon_days'));
	if ($abandon_days < 1) {
		$abandon_days = 0;
	}

	// Skip the contacts of users who didn't log in for the configured number of days
	$abandon_sql = (($abandon_days)
		? sprintf(" AND `user`.`login_date` > UTC_TIMESTAMP() - INTERVAL %d DAY ", intval($abandon_days))
		: ''
	);

	$contacts = q("SELECT `contact`.`id` FROM `contact` INNER JOIN `user` ON `user`.`uid` = `contact`.`uid`
		WHERE `rel` IN (%d, %d) AND `poll` != '' AND `network` IN ('%s', '%s', '%s', '%s', '%s', '%s')
		$sql_extra
		AND NOT `self` AND NOT `contact`.`blocked` AND NOT `contact`.`readonly` AND NOT `contact`.`archive`
		AND NOT `user`.`account_expired` AND NOT `user`.`account_removed` $abandon_sql ORDER BY RAND()",
		intval(CONTACT_IS_SHARING),
		intval(CONTACT_IS_FRIEND),
		dbesc(NETWORK_DFRN),
		dbesc(NETWORK_ZOT),
		dbesc(NETWORK_OSTATUS),
		dbesc(NETWORK_FEED),
		dbesc(NETWORK_MAIL),
		dbesc(NETWORK_MAIL2)
	);

	// Nothing to do for an empty result. A non-array value (failed query) is
	// handled the same way, since count() doesn't report it as empty.
	if (!is_array($contacts) || !count($contacts)) {
		return;
	}

	// Waiting time after the last update for the priorities 2 to 5.
	// Every other priority waits for one hour.
	$poll_delays = array(
		5 => " + 1 month",
		4 => " + 1 week",
		3 => " + 1 day",
		2 => " + 12 hour",
	);

	foreach ($contacts as $c) {

		$res = q("SELECT * FROM `contact` WHERE `id` = %d LIMIT 1",
			intval($c['id'])
		);

		if ((! $res) || (! count($res))) {
			continue;
		}

		foreach ($res as $contact) {

			// A manually requested contact is treated as if it had never been updated
			if ($manual_id) {
				$contact['last-update'] = '0000-00-00 00:00:00';
			}

			if (in_array($contact['network'], array(NETWORK_DFRN, NETWORK_ZOT, NETWORK_OSTATUS))) {
				$contact['priority'] = 2;
			}

			if ($contact['subhub'] AND in_array($contact['network'], array(NETWORK_DFRN, NETWORK_ZOT, NETWORK_OSTATUS))) {
				// We should be getting everything via a hub. But just to be sure, let's check once a day.
				// (You can make this more or less frequent if desired by setting 'pushpoll_frequency' appropriately)
				// This also lets us update our subscription to the hub, and add or replace hubs in case it
				// changed. We will only update hubs once a day, regardless of 'pushpoll_frequency'.

				$poll_interval = get_config('system','pushpoll_frequency');
				$contact['priority'] = (($poll_interval !== false) ? intval($poll_interval) : 3);
			}

			if ($contact['priority'] AND !$force) {
				// Based on the priority: should we poll this contact now or later?
				$priority = intval($contact['priority']);
				$delay    = (isset($poll_delays[$priority]) ? $poll_delays[$priority] : " + 1 hour");

				$now       = datetime_convert('UTC','UTC', 'now');
				$next_poll = datetime_convert('UTC','UTC', $contact['last-update'] . $delay);

				// The waiting time hasn't elapsed yet
				if (!($now > $next_poll)) {
					continue;
				}
			}

			logger("Polling ".$contact["network"]." ".$contact["id"]." ".$contact["nick"]." ".$contact["name"]);

			// Contacts with the "remote_self" flag are polled with a higher priority
			if ($contact["remote_self"]) {
				proc_run(PRIORITY_MEDIUM, 'include/onepoll.php', $contact['id']);
			} else {
				proc_run(PRIORITY_LOW, 'include/onepoll.php', $contact['id']);
			}

			// Pause before the next poll process is started
			if ($interval) {
				@time_sleep_until(microtime(true) + (float) $interval);
			}
		}
	}
}
337
/**
 * @brief Clear cache entries
 *
 * Runs at most once per hour; the time of the last run is kept in the config
 * value system/cache_last_cleared. Clears the cache and the cache directories,
 * removes old proxy, OEmbed and "parse_url" rows and optimizes fragmented
 * tables.
 *
 * @param App $a
 */
function cron_clear_cache(&$a) {

	$last = get_config('system','cache_last_cleared');

	// Once per hour: return while less than 3600 seconds have passed since the last run
	if ($last && (($last + 3600) > time())) {
		return;
	}

	// clear old cache
	Cache::clear();

	// clear old item cache files
	clear_cache();

	// clear cache for photos
	clear_cache($a->get_basepath(), $a->get_basepath()."/photo");

	// clear smarty cache
	clear_cache($a->get_basepath()."/view/smarty3/compiled", $a->get_basepath()."/view/smarty3/compiled");

	// clear cache for image proxy
	if (!get_config("system", "proxy_disabled")) {
		clear_cache($a->get_basepath(), $a->get_basepath()."/proxy");

		$cachetime = get_config('system','proxy_cache_time');
		if (!$cachetime) {
			$cachetime = PROXY_DEFAULT_TIME;
		}

		// Remove the proxied pictures that are older than the cache time
		q('DELETE FROM `photo` WHERE `uid` = 0 AND `resource-id` LIKE "pic:%%" AND `created` < NOW() - INTERVAL %d SECOND', intval($cachetime));
	}

	// Delete the cached OEmbed entries that are older than three months
	q("DELETE FROM `oembed` WHERE `created` < NOW() - INTERVAL 3 MONTH");

	// Delete the cached "parse_url" entries that are older than three months
	q("DELETE FROM `parsed_url` WHERE `created` < NOW() - INTERVAL 3 MONTH");

	// Maximum table size in megabyte
	$max_tablesize = intval(get_config('system','optimize_max_tablesize')) * 1000000;
	if ($max_tablesize == 0) {
		$max_tablesize = 100 * 1000000; // Default are 100 MB
	}

	// A negative configuration value skips the optimization completely
	if ($max_tablesize > 0) {
		// Minimum fragmentation level in percent
		$fragmentation_level = intval(get_config('system','optimize_fragmentation')) / 100;
		if ($fragmentation_level == 0) {
			$fragmentation_level = 0.3; // Default value is 30%
		}

		// Optimize some tables that need to be optimized
		$tables = q("SHOW TABLE STATUS");

		// Don't iterate over a non-array value when the query failed
		if (!is_array($tables)) {
			$tables = array();
		}

		foreach ($tables as $table) {

			// Don't optimize tables that are too large
			if ($table["Data_length"] > $max_tablesize) {
				continue;
			}

			// Don't optimize empty tables (this also keeps the divisor below above zero)
			if ($table["Data_length"] == 0) {
				continue;
			}

			// Calculate fragmentation: free space in relation to data plus index size
			$fragmentation = $table["Data_free"] / ($table["Data_length"] + $table["Index_length"]);

			logger("Table ".$table["Name"]." - Fragmentation level: ".round($fragmentation * 100, 2), LOGGER_DEBUG);

			// Don't optimize tables that needn't to be optimized
			if ($fragmentation < $fragmentation_level) {
				continue;
			}

			// So optimize it
			logger("Optimize Table ".$table["Name"], LOGGER_DEBUG);
			q("OPTIMIZE TABLE `%s`", dbesc($table["Name"]));
		}
	}

	set_config('system','cache_last_cleared', time());
}
424
/**
 * @brief Repair missing values in Diaspora contacts
 *
 * Picks up to 50 random Diaspora contacts with an empty batch, notify, poll
 * or pubkey field, probes their URL and stores the probed values when the
 * probe reports the Diaspora network.
 *
 * @param App $a
 */
function cron_repair_diaspora(&$a) {
	$incomplete = q("SELECT `id`, `url` FROM `contact`
		WHERE `network` = '%s' AND (`batch` = '' OR `notify` = '' OR `poll` = '' OR pubkey = '')
			ORDER BY RAND() LIMIT 50", dbesc(NETWORK_DIASPORA));

	if (!$incomplete) {
		return;
	}

	foreach ($incomplete as $entry) {
		// Only probe the contacts that pass the reachability check
		if (!poco_reachable($entry["url"])) {
			continue;
		}

		$probe = probe_url($entry["url"]);

		// Leave the contact untouched when the probe reports another network
		if ($probe["network"] != NETWORK_DIASPORA) {
			continue;
		}

		logger("Repair contact ".$entry["id"]." ".$entry["url"], LOGGER_DEBUG);

		q("UPDATE `contact` SET `batch` = '%s', `notify` = '%s', `poll` = '%s', pubkey = '%s' WHERE `id` = %d",
			dbesc($probe["batch"]),
			dbesc($probe["notify"]),
			dbesc($probe["poll"]),
			dbesc($probe["pubkey"]),
			intval($entry["id"]));
	}
}
448
/**
 * @brief Do some repairs in database entries
 *
 * Restores missing parent ids of items and missing nicks of self contacts
 * and updates the global contact of every verified, active local user.
 */
function cron_repair_database() {

	// Items without a parent get the id of the item whose uri matches their
	// parent-uri for the same user. (Shouldn't happen - but does sometimes)
	// This call is very "cheap" so we can do it at any time without a problem
	q("UPDATE `item` INNER JOIN `item` AS `parent` ON `parent`.`uri` = `item`.`parent-uri` AND `parent`.`uid` = `item`.`uid` SET `item`.`parent` = `parent`.`id` WHERE `item`.`parent` = 0");

	// There was an issue where the nick vanishes from the contact table,
	// so it is restored from the nickname of the user
	q("UPDATE `contact` INNER JOIN `user` ON `contact`.`uid` = `user`.`uid` SET `nick` = `nickname` WHERE `self` AND `nick`=''");

	// Update the global contacts for local users
	$local_users = q("SELECT `uid` FROM `user` WHERE `verified` AND NOT `blocked` AND NOT `account_removed` AND NOT `account_expired`");
	if ($local_users) {
		foreach ($local_users as $row) {
			update_gcontact_for_user($row["uid"]);
		}
	}

	/// @todo
	/// - remove thread entries without item
	/// - remove sign entries without item
	/// - remove children when parent got lost
	/// - set contact-id in item when not present
}
474
// Run the cron job only when this file is the first entry in the list of
// included files, i.e. when it was started directly and not included
if (array_search(__FILE__, get_included_files()) === 0) {
	cron_run($_SERVER["argv"], $_SERVER["argc"]);
	killme();
}