]> git.mxchange.org Git - friendica.git/blobdiff - include/poller.php
Merge pull request #136 from annando/master
[friendica.git] / include / poller.php
old mode 100644 (file)
new mode 100755 (executable)
index b878ef2..3bc98e3
@@ -1,6 +1,8 @@
 <?php
+
 require_once("boot.php");
 
+
 function poller_run($argv, $argc){
        global $a, $db;
 
@@ -15,42 +17,87 @@ function poller_run($argv, $argc){
        unset($db_host, $db_user, $db_pass, $db_data);
        };
 
-       require_once('session.php');
-       require_once('datetime.php');
-       require_once('simplepie/simplepie.inc');
+
+       require_once('include/session.php');
+       require_once('include/datetime.php');
+       require_once('library/simplepie/simplepie.inc');
        require_once('include/items.php');
        require_once('include/Contact.php');
+       require_once('include/email.php');
+       require_once('include/socgraph.php');
+
+       load_config('config');
+       load_config('system');
 
        $a->set_baseurl(get_config('system','url'));
 
+       load_hooks();
+
        logger('poller: start');
        
        // run queue delivery process in the background
 
        proc_run('php',"include/queue.php");
        
-       // once daily run expire in background
+       // expire any expired accounts
+
+       q("UPDATE user SET `account_expired` = 1 where `account_expired` = 0 
+               AND `account_expires_on` != '0000-00-00 00:00:00' 
+               AND `account_expires_on` < UTC_TIMESTAMP() ");
+  
+       $abandon_days = intval(get_config('system','account_abandon_days'));
+       if($abandon_days < 1)
+               $abandon_days = 0;
+
+       
+
+       // once daily run birthday_updates and then expire in background
 
        $d1 = get_config('system','last_expire_day');
        $d2 = intval(datetime_convert('UTC','UTC','now','d'));
 
        if($d2 != intval($d1)) {
+
+               update_contact_birthdays();
+
+               update_suggestions();
+
                set_config('system','last_expire_day',$d2);
                proc_run('php','include/expire.php');
        }
 
-
        // clear old cache
-       q("DELETE FROM `cache` WHERE `updated` < '%s'",
-               dbesc(datetime_convert('UTC','UTC',"now - 30 days")));
+       Cache::clear();
+
+       // clear item cache files if they are older than one day
+       $cache = get_config('system','itemcache');
+       if (($cache != '') and is_dir($cache)) {
+               if ($dh = opendir($cache)) {
+                       while (($file = readdir($dh)) !== false) {
+                               $fullpath = $cache."/".$file;
+                               if ((filetype($fullpath) == "file") and filectime($fullpath) < (time() - 86400))
+                                       unlink($fullpath);
+                       }
+                       closedir($dh);
+               }
+       }
 
        $manual_id  = 0;
+       $generation = 0;
        $hub_update = false;
        $force      = false;
+       $restart    = false;
 
        if(($argc > 1) && ($argv[1] == 'force'))
                $force = true;
 
+       if(($argc > 1) && ($argv[1] == 'restart')) {
+               $restart = true;
+               $generation = intval($argv[2]);
+               if(! $generation)
+                       killme();               
+       }
+
        if(($argc > 1) && intval($argv[1])) {
                $manual_id = intval($argv[1]);
                $force     = true;
@@ -58,17 +105,32 @@ function poller_run($argv, $argc){
 
        $sql_extra = (($manual_id) ? " AND `id` = $manual_id " : "");
 
+       reload_plugins();
+
        $d = datetime_convert();
-       call_hooks('cron', $d);
 
-       reload_plugins();
+       if(! $restart)
+               proc_run('php','include/cronhooks.php');
+
+       // Only poll from those with suitable relationships,
+       // and which have a polling address and ignore Diaspora since 
+       // we are unable to match those posts with a Diaspora GUID and prevent duplicates.
+
+       $abandon_sql = (($abandon_days) 
+               ? sprintf(" AND `user`.`login_date` > UTC_TIMESTAMP() - INTERVAL %d DAY ", intval($abandon_days)) 
+               : '' 
+       );
 
-       $contacts = q("SELECT `id` FROM `contact
+       $contacts = q("SELECT `contact`.`id` FROM `contact` LEFT JOIN `user` ON `user`.`uid` = `contact`.`uid
                WHERE ( `rel` = %d OR `rel` = %d ) AND `poll` != ''
+               AND NOT `network` IN ( '%s', '%s' )
                $sql_extra 
-               AND `self` = 0 AND `blocked` = 0 AND `readonly` = 0 ORDER BY RAND()",
-               intval(REL_FAN),
-               intval(REL_BUD)
+               AND `self` = 0 AND `contact`.`blocked` = 0 AND `contact`.`readonly` = 0 
+               AND `user`.`account_expired` = 0 $abandon_sql ORDER BY RAND()",
+               intval(CONTACT_IS_SHARING),
+               intval(CONTACT_IS_FRIEND),
+               dbesc(NETWORK_DIASPORA),
+               dbesc(NETWORK_FACEBOOK)
        );
 
        if(! count($contacts)) {
@@ -81,13 +143,22 @@ function poller_run($argv, $argc){
                        intval($c['id'])
                );
 
-               if(! count($res))
+               if((! $res) || (! count($res)))
                        continue;
 
                foreach($res as $contact) {
+
+                       $xml = false;
+
                        if($manual_id)
                                $contact['last-update'] = '0000-00-00 00:00:00';
 
+                       if($contact['network'] === NETWORK_DFRN)
+                               $contact['priority'] = 2;
+
+                       if(!get_config('system','ostatus_use_priority') and ($contact['network'] === NETWORK_OSTATUS))
+                               $contact['priority'] = 2;
+
                        if($contact['priority'] || $contact['subhub']) {
 
                                $hub_update = true;
@@ -109,6 +180,8 @@ function poller_run($argv, $argc){
                                        if((datetime_convert('UTC','UTC', 'now') > datetime_convert('UTC','UTC', $t . " + 1 day")) || $force)
                                                        $hub_update = true;
                                }
+                               else
+                                       $hub_update = false;
 
                                /**
                                 * Based on $contact['priority'], should we poll this site now? Or later?
@@ -141,6 +214,22 @@ function poller_run($argv, $argc){
                                        continue;
                        }
 
+                       // Check to see if we are running out of memory - if so spawn a new process and kill this one
+
+                       $avail_memory = return_bytes(ini_get('memory_limit'));
+                       $memused = memory_get_peak_usage(true);
+                       if(intval($avail_memory)) {
+                               if(($memused / $avail_memory) > 0.95) {
+                                       if($generation + 1 > 10) {
+                                               logger('poller: maximum number of spawns exceeded. Terminating.');
+                                               killme();
+                                       }
+                                       logger('poller: memory exceeded. ' . $memused . ' bytes used. Spawning new poll.');
+                                       proc_run('php', 'include/poller.php', 'restart', (string) $generation + 1);
+                                       killme();
+                               }
+                       }
+
                        $importer_uid = $contact['uid'];
                
                        $r = q("SELECT * FROM `contact` WHERE `uid` = %d AND `self` = 1 LIMIT 1",
@@ -151,14 +240,14 @@ function poller_run($argv, $argc){
 
                        $importer = $r[0];
 
-                       logger("poller: poll: IMPORTER: {$importer['name']}, CONTACT: {$contact['name']}");
+                       logger("poller: poll: ({$contact['id']}) IMPORTER: {$importer['name']}, CONTACT: {$contact['name']}");
 
                        $last_update = (($contact['last-update'] === '0000-00-00 00:00:00') 
                                ? datetime_convert('UTC','UTC','now - 30 days', ATOM_TIME)
                                : datetime_convert('UTC','UTC',$contact['last-update'], ATOM_TIME)
                        );
 
-                       if($contact['network'] === 'dfrn') {
+                       if($contact['network'] === NETWORK_DFRN) {
 
                                $idtosend = $orig_id = (($contact['dfrn-id']) ? $contact['dfrn-id'] : $contact['issued-id']);
 
@@ -175,12 +264,12 @@ function poller_run($argv, $argc){
                                        . '&type=data&last_update=' . $last_update 
                                        . '&perm=' . $perm ;
        
-                               $xml = fetch_url($url);
+                               $handshake_xml = fetch_url($url);
 
-                               logger('poller: handshake with url ' . $url . ' returns xml: ' . $xml, LOGGER_DATA);
+                               logger('poller: handshake with url ' . $url . ' returns xml: ' . $handshake_xml, LOGGER_DATA);
 
 
-                               if(! $xml) {
+                               if(! $handshake_xml) {
                                        logger("poller: $url appears to be dead - marking for death ");
                                        // dead connection - might be a transient event, or this might
                                        // mean the software was uninstalled or the domain expired. 
@@ -197,7 +286,7 @@ function poller_run($argv, $argc){
                                        continue;
                                }
 
-                               if(! strstr($xml,'<?xml')) {
+                               if(! strstr($handshake_xml,'<?xml')) {
                                        logger('poller: response from ' . $url . ' did not contain XML.');
                                        $r = q("UPDATE `contact` SET `last-update` = '%s' WHERE `id` = %d LIMIT 1",
                                                dbesc(datetime_convert()),
@@ -207,7 +296,7 @@ function poller_run($argv, $argc){
                                }
 
 
-                               $res = parse_xml_string($xml);
+                               $res = parse_xml_string($handshake_xml);
        
                                if(intval($res->status) == 1) {
                                        logger("poller: $url replied status 1 - marking for death ");
@@ -232,6 +321,13 @@ function poller_run($argv, $argc){
                                if((intval($res->status) != 0) || (! strlen($res->challenge)) || (! strlen($res->dfrn_id)))
                                        continue;
 
+                               if(((float) $res->dfrn_version > 2.21) && ($contact['poco'] == '')) {
+                                       q("update contact set poco = '%s' where id = %d limit 1",
+                                               dbesc(str_replace('/profile/','/poco/', $contact['url'])),
+                                               intval($contact['id'])
+                                       );
+                               }
+
                                $postvars = array();
 
                                $sent_dfrn_id = hex2bin((string) $res->dfrn_id);
@@ -265,47 +361,255 @@ function poller_run($argv, $argc){
 
                                $xml = post_url($contact['poll'],$postvars);
                        }
-                       else {
+                       elseif(($contact['network'] === NETWORK_OSTATUS) 
+                               || ($contact['network'] === NETWORK_DIASPORA)
+                               || ($contact['network'] === NETWORK_FEED) ) {
+
+                               // Upgrading DB fields from an older Friendica version
+                               // Will only do this once per notify-enabled OStatus contact
+                               // or if relationship changes
 
-                               // $contact['network'] !== 'dfrn'
+                               $stat_writeable = ((($contact['notify']) && ($contact['rel'] == CONTACT_IS_FOLLOWER || $contact['rel'] == CONTACT_IS_FRIEND)) ? 1 : 0);
 
-                               if(($contact['notify']) && (! $contact['writable'])) {
-                                       q("UPDATE `contact` SET `writable` = 1 WHERE `id` = %d LIMIT 1",
+                               if($stat_writeable != $contact['writable']) {
+                                       q("UPDATE `contact` SET `writable` = %d WHERE `id` = %d LIMIT 1",
+                                               intval($stat_writeable),
                                                intval($contact['id'])
                                        );
                                }
+
+                               // Are we allowed to import from this person?
+
+                               if($contact['rel'] == CONTACT_IS_FOLLOWER || $contact['blocked'] || $contact['readonly'])
+                                       continue;
+
                                $xml = fetch_url($contact['poll']);
                        }
+                       elseif($contact['network'] === NETWORK_MAIL || $contact['network'] === NETWORK_MAIL2) {
 
-                       logger('poller: received xml : ' . $xml, LOGGER_DATA);
+                               logger("Mail: Fetching");
 
-                       if(! strstr($xml,'<?xml')) {
-                               logger('poller: post_handshake: response from ' . $url . ' did not contain XML.');
-                               $r = q("UPDATE `contact` SET `last-update` = '%s' WHERE `id` = %d LIMIT 1",
-                                       dbesc(datetime_convert()),
-                                       intval($contact['id'])
+                               $mail_disabled = ((function_exists('imap_open') && (! get_config('system','imap_disabled'))) ? 0 : 1);
+                               if($mail_disabled)
+                                       continue;
+
+                               logger("Mail: Enabled");
+
+                               $mbox = null;
+                               $x = q("SELECT `prvkey` FROM `user` WHERE `uid` = %d LIMIT 1",
+                                       intval($importer_uid)
                                );
-                               continue;
-                       }
+                               $mailconf = q("SELECT * FROM `mailacct` WHERE `server` != '' AND `uid` = %d LIMIT 1",
+                                       intval($importer_uid)
+                               );
+                               if(count($x) && count($mailconf)) {
+                                   $mailbox = construct_mailbox_name($mailconf[0]);
+                                       $password = '';
+                                       openssl_private_decrypt(hex2bin($mailconf[0]['pass']),$password,$x[0]['prvkey']);
+                                       $mbox = email_connect($mailbox,$mailconf[0]['user'],$password);
+                                       unset($password);
+                                       logger("Mail: Connect");
+                                       if($mbox) {
+                                               q("UPDATE `mailacct` SET `last_check` = '%s' WHERE `id` = %d AND `uid` = %d LIMIT 1",
+                                                       dbesc(datetime_convert()),
+                                                       intval($mailconf[0]['id']),
+                                                       intval($importer_uid)
+                                               );
+                                       }
+                               }
+                               if($mbox) {
+                                       logger("Mail: mbox");
+
+                                       $msgs = email_poll($mbox,$contact['addr']);
+
+                                       if(count($msgs)) {
+                                               logger("Mail: Parsing ".count($msgs)." mails.");
+
+                                               foreach($msgs as $msg_uid) {
+                                                       logger("Mail: Parsing mail ".$msg_uid);
+
+                                                       $datarray = array();
+                                                       $meta = email_msg_meta($mbox,$msg_uid);
+                                                       $headers = email_msg_headers($mbox,$msg_uid);
+
+                                                       // look for a 'references' header and try and match with a parent item we have locally.
+
+                                                       $raw_refs = ((x($headers,'references')) ? str_replace("\t",'',$headers['references']) : '');
+                                                       $datarray['uri'] = msgid2iri(trim($meta->message_id,'<>'));
+
+                                                       if($raw_refs) {
+                                                               $refs_arr = explode(' ', $raw_refs);
+                                                               if(count($refs_arr)) {
+                                                                       for($x = 0; $x < count($refs_arr); $x ++)
+                                                                               $refs_arr[$x] = "'" . msgid2iri(str_replace(array('<','>',' '),array('','',''),dbesc($refs_arr[$x]))) . "'";
+                                                               }
+                                                               $qstr = implode(',',$refs_arr);
+                                                               $r = q("SELECT `uri` , `parent-uri` FROM `item` WHERE `uri` IN ( $qstr ) AND `uid` = %d LIMIT 1",
+                                                                       intval($importer_uid)
+                                                               );
+                                                               if(count($r))
+                                                                       $datarray['parent-uri'] = $r[0]['uri'];
+                                                       }
+
+
+                                                       if(! x($datarray,'parent-uri'))
+                                                               $datarray['parent-uri'] = $datarray['uri'];
+
+                                                       // Have we seen it before?
+                                                       $r = q("SELECT * FROM `item` WHERE `uid` = %d AND `uri` = '%s' LIMIT 1",
+                                                               intval($importer_uid),
+                                                               dbesc($datarray['uri'])
+                                                       );
+
+                                                       if(count($r)) {
+                                                               logger("Mail: Seen before ".$msg_uid);
+                                                               if($meta->deleted && ! $r[0]['deleted']) {
+                                                                       q("UPDATE `item` SET `deleted` = 1, `changed` = '%s' WHERE `id` = %d LIMIT 1",
+                                                                               dbesc(datetime_convert()),
+                                                                               intval($r[0]['id'])
+                                                                       );
+                                                               }
+                                                               switch ($mailconf[0]['action']) {
+                                                                       case 0:
+                                                                               break;
+                                                                       case 1:
+                                                                               logger("Mail: Deleting ".$msg_uid);
+                                                                               imap_delete($mbox, $msg_uid, FT_UID);
+                                                                               break;
+                                                                       case 2:
+                                                                               logger("Mail: Mark as seen ".$msg_uid);
+                                                                               imap_setflag_full($mbox, $msg_uid, "\\Seen", ST_UID);
+                                                                               break;
+                                                                       case 3:
+                                                                               logger("Mail: Moving ".$msg_uid." to ".$mailconf[0]['movetofolder']);
+                                                                               imap_setflag_full($mbox, $msg_uid, "\\Seen", ST_UID);
+                                                                               if ($mailconf[0]['movetofolder'] != "")
+                                                                                       imap_mail_move($mbox, $msg_uid, $mailconf[0]['movetofolder'], FT_UID);
+                                                                               break;
+                                                               }
+                                                               continue;
+                                                       }
+
+                                                       // Decoding the header
+                                                       $subject = imap_mime_header_decode($meta->subject);
+                                                       $datarray['title'] = "";
+                                                       foreach($subject as $subpart)
+                                                               if ($subpart->charset != "default")
+                                                                       $datarray['title'] .= iconv($subpart->charset, 'UTF-8//IGNORE', $subpart->text);
+                                                               else
+                                                                       $datarray['title'] .= $subpart->text;
+
+                                                       $datarray['title'] = notags(trim($datarray['title']));
+
+                                                       //$datarray['title'] = notags(trim($meta->subject));
+                                                       $datarray['created'] = datetime_convert('UTC','UTC',$meta->date);
+
+                                                       $r = email_get_msg($mbox,$msg_uid);
+                                                       if(! $r) {
+                                                               logger("Mail: can't fetch msg ".$msg_uid);
+                                                               continue;
+                                                       }
+                                                       $datarray['body'] = escape_tags($r['body']);
+
+                                                       logger("Mail: Importing ".$msg_uid);
+
+                                                       // some mailing lists have the original author as 'from' - add this sender info to msg body.
+                                                       // todo: adding a gravatar for the original author would be cool
+
+                                                       if(! stristr($meta->from,$contact['addr'])) {
+                                                               $from = imap_mime_header_decode($meta->from);
+                                                               $fromdecoded = "";
+                                                               foreach($from as $frompart)
+                                                                       if ($frompart->charset != "default")
+                                                                               $fromdecoded .= iconv($frompart->charset, 'UTF-8//IGNORE', $frompart->text);
+                                                                       else
+                                                                               $fromdecoded .= $frompart->text;
+
+                                                               $datarray['body'] = "[b]".t('From: ') . escape_tags($fromdecoded) . "[/b]\n\n" . $datarray['body'];
+                                                       }
+
+                                                       $datarray['uid'] = $importer_uid;
+                                                       $datarray['contact-id'] = $contact['id'];
+                                                       if($datarray['parent-uri'] === $datarray['uri'])
+                                                               $datarray['private'] = 1;
+                                                       if(($contact['network'] === NETWORK_MAIL) && (! get_pconfig($importer_uid,'system','allow_public_email_replies'))) {
+                                                               $datarray['private'] = 1;
+                                                               $datarray['allow_cid'] = '<' . $contact['id'] . '>';
+                                                       }
+                                                       $datarray['author-name'] = $contact['name'];
+                                                       $datarray['author-link'] = 'mailbox';
+                                                       $datarray['author-avatar'] = $contact['photo'];
+
+                                                       $stored_item = item_store($datarray);
+                                                       q("UPDATE `item` SET `last-child` = 0 WHERE `parent-uri` = '%s' AND `uid` = %d",
+                                                               dbesc($datarray['parent-uri']),
+                                                               intval($importer_uid)
+                                                       );
+                                                       q("UPDATE `item` SET `last-child` = 1 WHERE `id` = %d LIMIT 1",
+                                                               intval($stored_item)
+                                                       );
+                                                       switch ($mailconf[0]['action']) {
+                                                               case 0:
+                                                                       break;
+                                                               case 1:
+                                                                       logger("Mail: Deleting ".$msg_uid);
+                                                                       imap_delete($mbox, $msg_uid, FT_UID);
+                                                                       break;
+                                                               case 2:
+                                                                       logger("Mail: Mark as seen ".$msg_uid);
+                                                                       imap_setflag_full($mbox, $msg_uid, "\\Seen", ST_UID);
+                                                                       break;
+                                                               case 3:
+                                                                       logger("Mail: Moving ".$msg_uid." to ".$mailconf[0]['movetofolder']);
+                                                                       imap_setflag_full($mbox, $msg_uid, "\\Seen", ST_UID);
+                                                                       if ($mailconf[0]['movetofolder'] != "")
+                                                                               imap_mail_move($mbox, $msg_uid, $mailconf[0]['movetofolder'], FT_UID);
+                                                                       break;
+                                                       }
+                                               }
+                                       }
 
+                                       imap_close($mbox);
+                               }
+                       }
+                       elseif($contact['network'] === NETWORK_FACEBOOK) {
+                               // This is picked up by the Facebook plugin on a cron hook.
+                               // Ignored here.
+                       }
 
-                       consume_feed($xml,$importer,$contact,$hub,1, true);
+                       if($xml) {
+                               logger('poller: received xml : ' . $xml, LOGGER_DATA);
 
-                       // do it twice. Ensures that children of parents which may be later in the stream aren't tossed
+                               if(! strstr($xml,'<?xml')) {
+                                       logger('poller: post_handshake: response from ' . $url . ' did not contain XML.');
+                                       $r = q("UPDATE `contact` SET `last-update` = '%s' WHERE `id` = %d LIMIT 1",
+                                               dbesc(datetime_convert()),
+                                               intval($contact['id'])
+                                       );
+                                       continue;
+                               }
 
-                       consume_feed($xml,$importer,$contact,$hub,1);
 
+                               consume_feed($xml,$importer,$contact,$hub,1,1);
 
-                       if((strlen($hub)) && ($hub_update) 
-                               && (($contact['rel'] == REL_BUD) || (($contact['network'] === 'stat') && (! $contact['readonly'])))) {
-                               logger('poller: subscribing to hub(s) : ' . $hub . ' contact name : ' . $contact['name'] . ' local user : ' . $importer['name']);
-                               $hubs = explode(',', $hub);
-                               if(count($hubs)) {
-                                       foreach($hubs as $h) {
-                                               $h = trim($h);
-                                               if(! strlen($h))
-                                                       continue;
-                                               subscribe_to_hub($h,$importer,$contact);
+                               // do it twice. Ensures that children of parents which may be later in the stream aren't tossed
+       
+                               consume_feed($xml,$importer,$contact,$hub,1,2);
+
+                               $hubmode = 'subscribe';
+                               if($contact['network'] === NETWORK_DFRN || $contact['blocked'] || $contact['readonly'])
+                                       $hubmode = 'unsubscribe';
+
+                               if((strlen($hub)) && ($hub_update) && ($contact['rel'] != CONTACT_IS_FOLLOWER)) {
+                                       logger('poller: hub ' . $hubmode . ' : ' . $hub . ' contact name : ' . $contact['name'] . ' local user : ' . $importer['name']);
+                                       $hubs = explode(',', $hub);
+                                       if(count($hubs)) {
+                                               foreach($hubs as $h) {
+                                                       $h = trim($h);
+                                                       if(! strlen($h))
+                                                               continue;
+                                                       subscribe_to_hub($h,$importer,$contact,$hubmode);
+                                               }
                                        }
                                }
                        }
@@ -319,9 +623,25 @@ function poller_run($argv, $argc){
                                intval($contact['id'])
                        );
 
+
+                       // load current friends if possible.
+
+                       if($contact['poco']) {  
+                               $r = q("SELECT count(*) as total from glink 
+                                       where `cid` = %d and updated > UTC_TIMESTAMP() - INTERVAL 1 DAY",
+                                       intval($contact['id'])
+                               );
+                       }
+                       if(count($r)) {
+                               if(! $r[0]['total']) {
+                                       poco_load($contact['id'],$importer_uid,$contact['poco']);
+                               }
+                       }
+
                        // loop - next contact
                }
        }
+
                
        return;
 }