]> git.mxchange.org Git - friendica.git/blob - include/cron.php
Merge pull request #3096 from annando/1701-index-again
[friendica.git] / include / cron.php
1 <?php
// When the script is not started from the base directory (no "boot.php" in the
// current working directory), change into the parent directory of the folder
// that contains the executed script.
if (!file_exists("boot.php") && (sizeof($_SERVER["argv"]) != 0)) {
	$directory = dirname($_SERVER["argv"][0]);

	// A relative script path is resolved against the current working directory
	if (substr($directory, 0, 1) != "/") {
		$directory = "{$_SERVER["PWD"]}/{$directory}";
	}

	$directory = realpath("{$directory}/..");

	chdir($directory);
}
12
13 use \Friendica\Core\Config;
14
15 require_once("boot.php");
16 require_once("include/photos.php");
17 require_once("include/user.php");
18
19
/**
 * @brief Main routine of the cron job
 *
 * Sets up the application and the database connection when they are missing,
 * then - unless the configured cron interval has not elapsed yet - starts the
 * background processes, runs the maintenance functions of this file, polls
 * the contacts and finally stores the time of this run in the config value
 * "system/last_cron".
 *
 * @param array $argv Array of command line arguments (handed to the contact poller)
 * @param int   $argc Number of command line arguments
 */
function cron_run(&$argv, &$argc) {
	global $a, $db;

	if (is_null($a)) {
		$a = new App;
	}

	if (is_null($db)) {
		// The $db_* variables used below are expected to come from .htconfig.php
		@include(".htconfig.php");
		require_once("include/dba.php");
		$db = new dba($db_host, $db_user, $db_pass, $db_data);
		unset($db_host, $db_user, $db_pass, $db_data);
	}

	require_once('include/session.php');
	require_once('include/datetime.php');
	require_once('include/items.php');
	require_once('include/Contact.php');
	require_once('include/email.php');
	require_once('include/socgraph.php');
	require_once('mod/nodeinfo.php');
	require_once('include/post_update.php');

	Config::load();

	// The load and "already running" checks are skipped when the poller called us
	$called_by_poller = (App::callstack() == "poller_run");
	if (!$called_by_poller) {
		if ($a->maxload_reached()) {
			return;
		}
		if (App::is_already_running('cron', 'include/cron.php', 540)) {
			return;
		}
	}

	$last_run = get_config('system','last_cron');

	// Interval between two runs in minutes, defaults to 10
	$interval_minutes = intval(get_config('system','cron_interval'));
	if ($interval_minutes == 0) {
		$interval_minutes = 10;
	}

	// Leave when the previous run is more recent than the interval
	if ($last_run && (($last_run + ($interval_minutes * 60)) > time())) {
		logger('cron intervall not reached');
		return;
	}

	$a->set_baseurl(get_config('system','url'));

	load_hooks();

	logger('cron: start');

	// Queue delivery runs as a background process
	proc_run(PRIORITY_NEGLIGIBLE, "include/queue.php");

	// Discovery of global contacts runs as a background process
	proc_run(PRIORITY_LOW, "include/discover_poco.php");

	// Update of the locally stored global contacts runs as a background process
	proc_run(PRIORITY_LOW, "include/discover_poco.php", "checkcontact");

	// Expire and remove user entries
	cron_expire_and_remove_users();

	if (!get_config("system", "worker")) {
		// Without the worker the jobs are executed directly in this process

		// Check only conversations with mentions (for a longer time)
		ostatus::check_conversations(true);

		// Check every conversation
		ostatus::check_conversations(false);

		// Call possible post update functions,
		// see include/post_update.php for more details
		post_update();

		// Update nodeinfo data
		nodeinfo_cron();
	} else {
		// With an active worker the same jobs are split into sub processes
		proc_run(PRIORITY_MEDIUM, "include/cronjobs.php", "ostatus_mentions");
		proc_run(PRIORITY_MEDIUM, "include/cronjobs.php", "ostatus_conversations");
		proc_run(PRIORITY_LOW, "include/cronjobs.php", "post_update");
		proc_run(PRIORITY_LOW, "include/cronjobs.php", "nodeinfo");
	}

	// Daily tasks: executed when the stored day of month differs from today's (UTC)
	$stored_day = get_config('system','last_expire_day');
	$current_day = intval(datetime_convert('UTC','UTC','now','d'));

	if ($current_day != intval($stored_day)) {
		update_contact_birthdays();

		proc_run(PRIORITY_LOW, "include/discover_poco.php", "suggestions");

		set_config('system','last_expire_day',$current_day);

		proc_run(PRIORITY_LOW, 'include/expire.php');

		proc_run(PRIORITY_MEDIUM, 'include/dbclean.php');

		cron_update_photo_albums();
	}

	// Clear cache entries
	cron_clear_cache($a);

	// Repair missing Diaspora values in contacts
	cron_repair_diaspora($a);

	// Repair entries in the database
	cron_repair_database();

	// Poll contacts
	cron_poll_contacts($argc, $argv);

	logger('cron: end');

	set_config('system','last_cron', time());
}
155
/**
 * @brief Refresh the photo album data of every active user
 *
 * Calls photo_albums() with "true" as second argument for each user that is
 * neither expired nor removed.
 */
function cron_update_photo_albums() {
	$users = q("SELECT `uid` FROM `user` WHERE NOT `account_expired` AND NOT `account_removed`");

	if (dbm::is_result($users)) {
		foreach ($users as $row) {
			photo_albums($row['uid'], true);
		}
	}
}
169
170 /**
171  * @brief Expire and remove user entries
172  */
function cron_expire_and_remove_users() {
	// Flag every account as expired whose expiry date is set and has passed
	q("UPDATE user SET `account_expired` = 1 where `account_expired` = 0
                AND `account_expires_on` != '0000-00-00 00:00:00'
                AND `account_expires_on` < UTC_TIMESTAMP() ");

	// Removed accounts whose expiry date lies more than three days in the past
	$removed_users = q("SELECT * FROM `user` WHERE `account_removed` AND `account_expires_on` < UTC_TIMESTAMP() - INTERVAL 3 DAY");
	if (!$removed_users) {
		return;
	}

	// Delete the contact records first, then the user record itself
	foreach ($removed_users as $removed) {
		$uid = intval($removed['uid']);

		q("DELETE FROM `contact` WHERE `uid` = %d", $uid);
		q("DELETE FROM `user` WHERE `uid` = %d", $uid);
	}
}
188
/**
 * @brief Poll contacts for unreceived messages
 *
 * Selects the pollable contacts of all active users in random order and
 * starts "include/onepoll.php" for every contact whose poll delay (derived
 * from its priority) has elapsed.
 *
 * Recognized values of the first command line argument:
 * - "force":   poll every selected contact regardless of its last update
 * - "restart": requires a non-zero generation as second argument, otherwise
 *              the process is terminated via killme()
 * - a number:  poll only the contact with this id (implies "force")
 *
 * @param Integer $argc Number of command line arguments
 * @param Array $argv Array of command line arguments
 */
function cron_poll_contacts($argc, $argv) {
	$manual_id = 0;
	$force     = false;

	if (($argc > 1) && ($argv[1] == 'force')) {
		$force = true;
	}

	if (($argc > 1) && ($argv[1] == 'restart')) {
		// A missing generation argument is treated like an invalid one
		$generation = (isset($argv[2]) ? intval($argv[2]) : 0);
		if (!$generation) {
			killme();
		}
	}

	if (($argc > 1) && intval($argv[1])) {
		$manual_id = intval($argv[1]);
		$force     = true;
	}

	// Seconds to wait between two started poll processes
	$interval = intval(get_config('system','poll_interval'));
	if (!$interval) {
		$delivery_interval = get_config('system','delivery_interval');
		$interval = (($delivery_interval === false) ? 3 : intval($delivery_interval));
	}

	// If we are using the worker we don't need a delivery interval
	if (get_config("system", "worker")) {
		$interval = false;
	}

	// $manual_id is an integer, so it can be embedded into the query directly
	$sql_extra = (($manual_id) ? " AND `id` = $manual_id " : "");

	reload_plugins();

	// Only poll from those with suitable relationships,
	// and which have a polling address and ignore Diaspora since
	// we are unable to match those posts with a Diaspora GUID and prevent duplicates.

	$abandon_days = intval(get_config('system','account_abandon_days'));
	if ($abandon_days < 1) {
		$abandon_days = 0;
	}

	$abandon_sql = (($abandon_days)
		? sprintf(" AND `user`.`login_date` > UTC_TIMESTAMP() - INTERVAL %d DAY ", intval($abandon_days))
		: ''
	);

	$contacts = q("SELECT `contact`.`id` FROM `user`
                        STRAIGHT_JOIN `contact`
                        ON `contact`.`uid` = `user`.`uid` AND `contact`.`rel` IN (%d, %d) AND `contact`.`poll` != ''
                                AND `contact`.`network` IN ('%s', '%s', '%s', '%s', '%s', '%s') $sql_extra
                                AND NOT `contact`.`self` AND NOT `contact`.`blocked` AND NOT `contact`.`readonly`
                                AND NOT `contact`.`archive`
                        WHERE NOT `user`.`account_expired` AND NOT `user`.`account_removed` $abandon_sql ORDER BY RAND()",
		intval(CONTACT_IS_SHARING),
		intval(CONTACT_IS_FRIEND),
		dbesc(NETWORK_DFRN),
		dbesc(NETWORK_ZOT),
		dbesc(NETWORK_OSTATUS),
		dbesc(NETWORK_FEED),
		dbesc(NETWORK_MAIL),
		dbesc(NETWORK_MAIL2)
	);

	// Covers an empty result as well as a failed query
	if (!dbm::is_result($contacts)) {
		return;
	}

	// Networks that get a fixed poll priority (see below)
	$push_networks = array(NETWORK_DFRN, NETWORK_ZOT, NETWORK_OSTATUS);

	// Time that has to pass since the last update, indexed by contact priority.
	// Every other priority is polled after one hour.
	$poll_delays = array(
		5 => " + 1 month",
		4 => " + 1 week",
		3 => " + 1 day",
		2 => " + 12 hour",
		1 => " + 1 hour",
	);

	foreach ($contacts as $c) {

		$res = q("SELECT * FROM `contact` WHERE `id` = %d LIMIT 1",
			intval($c['id'])
		);

		if (!dbm::is_result($res)) {
			continue;
		}

		// The query is limited to a single row
		$contact = $res[0];

		if ($manual_id) {
			$contact['last-update'] = '0000-00-00 00:00:00';
		}

		if (in_array($contact['network'], $push_networks)) {
			$contact['priority'] = 2;

			if ($contact['subhub']) {
				// We should be getting everything via a hub. But just to be sure, let's check once a day.
				// (You can make this more or less frequent if desired by setting 'pushpoll_frequency' appropriately)
				// This also lets us update our subscription to the hub, and add or replace hubs in case it
				// changed. We will only update hubs once a day, regardless of 'pushpoll_frequency'.

				$poll_interval = get_config('system','pushpoll_frequency');
				$contact['priority'] = (($poll_interval !== false) ? intval($poll_interval) : 3);
			}
		}

		if ($contact['priority'] && !$force) {
			// Based on $contact['priority'], should we poll this site now? Or later?
			$priority = intval($contact['priority']);
			$delay = (isset($poll_delays[$priority]) ? $poll_delays[$priority] : " + 1 hour");

			$now = datetime_convert('UTC','UTC', 'now');
			$due = datetime_convert('UTC','UTC', $contact['last-update'] . $delay);

			if (!($now > $due)) {
				continue;
			}
		}

		logger("Polling ".$contact["network"]." ".$contact["id"]." ".$contact["nick"]." ".$contact["name"]);

		// Feeds with a priority of 3 or lower are fetched with a higher process priority
		if (($contact['network'] == NETWORK_FEED) && ($contact['priority'] <= 3)) {
			proc_run(PRIORITY_MEDIUM, 'include/onepoll.php', $contact['id']);
		} else {
			proc_run(PRIORITY_LOW, 'include/onepoll.php', $contact['id']);
		}

		if ($interval) {
			@time_sleep_until(microtime(true) + (float) $interval);
		}
	}
}
344
/**
 * @brief Clear cache entries
 *
 * Runs at most once per hour; the time of the last run is kept in the config
 * value "system/cache_last_cleared". Clears the cache, the cache directories,
 * outdated proxy photos and old "oembed"/"parsed_url" rows and finally
 * optimizes fragmented database tables.
 *
 * @param App $a
 */
function cron_clear_cache(App $a) {

	$last = get_config('system','cache_last_cleared');

	// Once per hour
	if ($last && (($last + 3600) > time())) {
		return;
	}

	// clear old cache
	Cache::clear();

	// clear old item cache files
	clear_cache();

	// clear cache for photos
	clear_cache($a->get_basepath(), $a->get_basepath()."/photo");

	// clear smarty cache
	clear_cache($a->get_basepath()."/view/smarty3/compiled", $a->get_basepath()."/view/smarty3/compiled");

	// clear cache for image proxy
	if (!get_config("system", "proxy_disabled")) {
		clear_cache($a->get_basepath(), $a->get_basepath()."/proxy");

		$cachetime = get_config('system','proxy_cache_time');
		if (!$cachetime) {
			$cachetime = PROXY_DEFAULT_TIME;
		}

		q('DELETE FROM `photo` WHERE `uid` = 0 AND `resource-id` LIKE "pic:%%" AND `created` < NOW() - INTERVAL %d SECOND', intval($cachetime));
	}

	// Delete the cached OEmbed entries that are older than three months
	q("DELETE FROM `oembed` WHERE `created` < NOW() - INTERVAL 3 MONTH");

	// Delete the cached "parse_url" entries that are older than three months
	q("DELETE FROM `parsed_url` WHERE `created` < NOW() - INTERVAL 3 MONTH");

	// Maximum table size, configured in megabyte
	$max_tablesize = intval(get_config('system','optimize_max_tablesize')) * 1000000;
	if ($max_tablesize == 0) {
		$max_tablesize = 100 * 1000000; // Default are 100 MB
	}

	// A negative configuration value disables the optimization
	if ($max_tablesize > 0) {
		// Minimum fragmentation level, configured in percent
		$fragmentation_level = intval(get_config('system','optimize_fragmentation')) / 100;
		if ($fragmentation_level == 0) {
			$fragmentation_level = 0.3; // Default value is 30%
		}

		// Optimize some tables that need to be optimized
		$tables = q("SHOW TABLE STATUS");

		// Nothing to iterate over when the status query failed or returned no rows
		if (!dbm::is_result($tables)) {
			$tables = array();
		}

		foreach ($tables as $table) {

			// Don't optimize tables that are too large
			if ($table["Data_length"] > $max_tablesize) {
				continue;
			}

			// Don't optimize empty tables (this also keeps the division below safe)
			if ($table["Data_length"] == 0) {
				continue;
			}

			// Calculate fragmentation
			$fragmentation = $table["Data_free"] / ($table["Data_length"] + $table["Index_length"]);

			logger("Table ".$table["Name"]." - Fragmentation level: ".round($fragmentation * 100, 2), LOGGER_DEBUG);

			// Don't optimize tables that needn't to be optimized
			if ($fragmentation < $fragmentation_level) {
				continue;
			}

			// So optimize it
			logger("Optimize Table ".$table["Name"], LOGGER_DEBUG);
			q("OPTIMIZE TABLE `%s`", dbesc($table["Name"]));
		}
	}

	set_config('system','cache_last_cleared', time());
}
431
/**
 * @brief Repair missing values in Diaspora contacts
 *
 * Picks up to 50 random Diaspora contacts with an empty "batch", "notify",
 * "poll" or "pubkey" field, probes their URL and stores the probed values
 * when the probe reports the Diaspora network.
 *
 * @param App $a
 */
function cron_repair_diaspora(App $a) {
	$incomplete = q("SELECT `id`, `url` FROM `contact`
                WHERE `network` = '%s' AND (`batch` = '' OR `notify` = '' OR `poll` = '' OR pubkey = '')
                        ORDER BY RAND() LIMIT 50", dbesc(NETWORK_DIASPORA));

	if (!dbm::is_result($incomplete)) {
		return;
	}

	foreach ($incomplete as $entry) {
		// Unreachable servers are not probed
		if (!poco_reachable($entry["url"])) {
			continue;
		}

		$probed = probe_url($entry["url"]);

		// Only take over the data when the probe confirms the network
		if ($probed["network"] != NETWORK_DIASPORA) {
			continue;
		}

		logger("Repair contact ".$entry["id"]." ".$entry["url"], LOGGER_DEBUG);
		q("UPDATE `contact` SET `batch` = '%s', `notify` = '%s', `poll` = '%s', pubkey = '%s' WHERE `id` = %d",
			dbesc($probed["batch"]),
			dbesc($probed["notify"]),
			dbesc($probed["poll"]),
			dbesc($probed["pubkey"]),
			intval($entry["id"])
		);
	}
}
455
/**
 * @brief Do some repairs in database entries
 *
 * Recreates missing "self" contacts, sets missing item parents, restores
 * empty nicks of "self" contacts and updates the global contacts of the
 * local users.
 */
function cron_repair_database() {

	// Sometimes there seem to be issues where the "self" contact vanishes.
	// We haven't found the origin of the problem by now.
	$without_self = q("SELECT `uid` FROM `user` WHERE NOT EXISTS (SELECT `uid` FROM `contact` WHERE `contact`.`uid` = `user`.`uid` AND `contact`.`self`)");
	if (dbm::is_result($without_self)) {
		foreach ($without_self as $row) {
			$uid = $row['uid'];

			logger('Create missing self contact for user '.$uid);
			user_create_self_contact($uid);
		}
	}

	// Set the parent if it wasn't set. (Shouldn't happen - but does sometimes)
	// This call is very "cheap" so we can do it at any time without a problem
	q("UPDATE `item` INNER JOIN `item` AS `parent` ON `parent`.`uri` = `item`.`parent-uri` AND `parent`.`uid` = `item`.`uid` SET `item`.`parent` = `parent`.`id` WHERE `item`.`parent` = 0");

	// There was an issue where the nick vanishes from the contact table
	q("UPDATE `contact` INNER JOIN `user` ON `contact`.`uid` = `user`.`uid` SET `nick` = `nickname` WHERE `self` AND `nick`=''");

	// Update the global contacts for local users
	$local_users = q("SELECT `uid` FROM `user` WHERE `verified` AND NOT `blocked` AND NOT `account_removed` AND NOT `account_expired`");
	if (dbm::is_result($local_users)) {
		foreach ($local_users as $row) {
			update_gcontact_for_user($row["uid"]);
		}
	}

	/// @todo
	/// - remove thread entries without item
	/// - remove sign entries without item
	/// - remove children when parent got lost
	/// - set contact-id in item when not present
}
491
// Run the cron job only when this file is the first entry in the list of
// included files, not when it has been included by another script.
$cron_file_position = array_search(__FILE__, get_included_files());

if ($cron_file_position === 0) {
	cron_run($_SERVER["argv"], $_SERVER["argc"]);
	killme();
}