3 require_once("boot.php");
/**
 * Poll remote contacts for new content.
 *
 * Starts the delivery queue in the background, runs the expire job when the
 * stored day number changes, removes cache rows older than 30 days, and then
 * walks the pollable contacts. Depending on the contact's network it performs
 * a DFRN handshake and POST, fetches the poll URL (OStatus / Diaspora / feed),
 * or reads messages from the user's mail account. Feed XML is handed to
 * consume_feed() and the contact's update timestamps are stamped afterwards.
 *
 * @param array $argv Command-line arguments. $argv[1] may be 'force',
 *                    'restart' (with a generation counter in $argv[2]), or a
 *                    numeric contact id.
 * @param int   $argc Number of entries in $argv.
 */
6 function poller_run($argv, $argc){
// Pull the database credentials from .htconfig.php (include errors are silenced by @),
// open the connection, and drop the credential variables immediately afterwards.
14 @include(".htconfig.php");
15 require_once("dba.php");
16 $db = new dba($db_host, $db_user, $db_pass, $db_data);
17 unset($db_host, $db_user, $db_pass, $db_data);
21 require_once('include/session.php');
22 require_once('include/datetime.php');
23 require_once('library/simplepie/simplepie.inc');
24 require_once('include/items.php');
25 require_once('include/Contact.php');
26 require_once('include/email.php');
// Load the 'config' and 'system' configuration and set the base URL from the stored system/url value.
28 load_config('config');
29 load_config('system');
31 $a->set_baseurl(get_config('system','url'));
35 logger('poller: start');
37 // run queue delivery process in the background
39 proc_run('php',"include/queue.php");
41 // once daily run expire in background
// $d1 is the day stored at the last expire run, $d2 the current UTC value for format 'd'
// (presumably day of month - confirm against datetime_convert()). A mismatch triggers expire.
43 $d1 = get_config('system','last_expire_day');
44 $d2 = intval(datetime_convert('UTC','UTC','now','d'));
46 if($d2 != intval($d1)) {
47 set_config('system','last_expire_day',$d2);
48 proc_run('php','include/expire.php');
// Remove cache rows whose `updated` timestamp is more than 30 days old.
52 q("DELETE FROM `cache` WHERE `updated` < '%s'",
53 dbesc(datetime_convert('UTC','UTC',"now - 30 days")));
// Command-line modes: 'force', 'restart' (generation counter in $argv[2]),
// or a numeric contact id that limits the poll to that single contact.
61 if(($argc > 1) && ($argv[1] == 'force'))
64 if(($argc > 1) && ($argv[1] == 'restart')) {
66 $generation = intval($argv[2]);
71 if(($argc > 1) && intval($argv[1])) {
72 $manual_id = intval($argv[1]);
// $manual_id comes from intval() above, so interpolating it into the SQL fragment is safe
// as long as it never holds anything but an integer.
76 $sql_extra = (($manual_id) ? " AND `id` = $manual_id " : "");
80 $d = datetime_convert();
83 proc_run('php','include/cronhooks.php');
85 // Only poll from those with suitable relationships,
86 // and which have a polling address and ignore Diaspora since
87 // we are unable to match those posts with a Diaspora GUID and prevent duplicates.
89 $contacts = q("SELECT `id` FROM `contact`
90 WHERE ( `rel` = %d OR `rel` = %d ) AND `poll` != ''
93 AND `self` = 0 AND `blocked` = 0 AND `readonly` = 0 ORDER BY RAND()",
94 intval(CONTACT_IS_SHARING),
95 intval(CONTACT_IS_FRIEND),
96 dbesc(NETWORK_DIASPORA)
// No matching contacts.
99 if(! count($contacts)) {
103 foreach($contacts as $c) {
// Re-read the complete contact row for this id.
105 $res = q("SELECT * FROM `contact` WHERE `id` = %d LIMIT 1",
109 if((! $res) || (! count($res)))
112 foreach($res as $contact) {
// Reset last-update to the zero date; further down a zero date is treated as "30 days ago".
117 $contact['last-update'] = '0000-00-00 00:00:00';
119 if($contact['priority'] || $contact['subhub']) {
124 $t = $contact['last-update'];
126 // We should be getting everything via a hub. But just to be sure, let's check once a day.
127 // (You can make this more or less frequent if desired by setting 'pushpoll_frequency' appropriately)
128 // This also lets us update our subscription to the hub, and add or replace hubs in case it
129 // changed. We will only update hubs once a day, regardless of 'pushpoll_frequency'.
132 if($contact['subhub']) {
// For hub-subscribed contacts the priority is taken from system/pushpoll_frequency, defaulting to 3.
133 $interval = get_config('system','pushpoll_frequency');
134 $contact['priority'] = (($interval !== false) ? intval($interval) : 3);
137 if((datetime_convert('UTC','UTC', 'now') > datetime_convert('UTC','UTC', $t . " + 1 day")) || $force)
142 * Based on $contact['priority'], should we poll this site now? Or later?
// Each test below compares the current UTC time with last-update plus an interval
// (1 month, 1 week, 1 day, 12 hours, 1 hour).
145 switch ($contact['priority']) {
147 if(datetime_convert('UTC','UTC', 'now') > datetime_convert('UTC','UTC', $t . " + 1 month"))
151 if(datetime_convert('UTC','UTC', 'now') > datetime_convert('UTC','UTC', $t . " + 1 week"))
155 if(datetime_convert('UTC','UTC', 'now') > datetime_convert('UTC','UTC', $t . " + 1 day"))
159 if(datetime_convert('UTC','UTC', 'now') > datetime_convert('UTC','UTC', $t . " + 12 hour"))
164 if(datetime_convert('UTC','UTC', 'now') > datetime_convert('UTC','UTC', $t . " + 1 hour"))
// Neither due for an update nor forced.
168 if((! $update) && (! $force))
172 // Check to see if we are running out of memory - if so spawn a new process and kill this one
// Peak real memory usage is compared with memory_limit; above 95% a new poller is spawned
// with the generation counter incremented, up to a maximum of 10 generations.
174 $avail_memory = return_bytes(ini_get('memory_limit'));
175 $memused = memory_get_peak_usage(true);
176 if(intval($avail_memory)) {
177 if(($memused / $avail_memory) > 0.95) {
178 if($generation + 1 > 10) {
179 logger('poller: maximum number of spawns exceeded. Terminating.');
182 logger('poller: memory exceeded. ' . $memused . ' bytes used. Spawning new poll.');
// NOTE(review): the (string) cast binds tighter than '+', so this evaluates as
// ((string) $generation) + 1 and passes a number, not a string - confirm that is intended.
183 proc_run('php', 'include/poller.php', 'restart', (string) $generation + 1);
// Look up the `self` contact row of the user who owns this contact (the importer).
188 $importer_uid = $contact['uid'];
190 $r = q("SELECT * FROM `contact` WHERE `uid` = %d AND `self` = 1 LIMIT 1",
191 intval($importer_uid)
198 logger("poller: poll: IMPORTER: {$importer['name']}, CONTACT: {$contact['name']}");
// A contact with the zero date is polled as if it had last been updated 30 days ago.
200 $last_update = (($contact['last-update'] === '0000-00-00 00:00:00')
201 ? datetime_convert('UTC','UTC','now - 30 days', ATOM_TIME)
202 : datetime_convert('UTC','UTC',$contact['last-update'], ATOM_TIME)
205 if($contact['network'] === NETWORK_DFRN) {
// Prefer dfrn-id over issued-id. For duplex contacts the id sent is prefixed with '0:' when
// a dfrn-id is stored and '1:' when an issued-id is stored; if both are set the '1:' form wins.
207 $idtosend = $orig_id = (($contact['dfrn-id']) ? $contact['dfrn-id'] : $contact['issued-id']);
209 if(intval($contact['duplex']) && $contact['dfrn-id'])
210 $idtosend = '0:' . $orig_id;
211 if(intval($contact['duplex']) && $contact['issued-id'])
212 $idtosend = '1:' . $orig_id;
214 // they have permission to write to us. We already filtered this in the contact query.
// First leg of the handshake: GET the poll URL with our id, protocol version and last update time.
217 $url = $contact['poll'] . '?dfrn_id=' . $idtosend
218 . '&dfrn_version=' . DFRN_PROTOCOL_VERSION
219 . '&type=data&last_update=' . $last_update
222 $handshake_xml = fetch_url($url);
224 logger('poller: handshake with url ' . $url . ' returns xml: ' . $handshake_xml, LOGGER_DATA);
227 if(! $handshake_xml) {
228 logger("poller: $url appears to be dead - marking for death ");
229 // dead connection - might be a transient event, or this might
230 // mean the software was uninstalled or the domain expired.
231 // Will keep trying for one month.
232 mark_for_death($contact);
234 // set the last-update so we don't keep polling
236 $r = q("UPDATE `contact` SET `last-update` = '%s' WHERE `id` = %d LIMIT 1",
237 dbesc(datetime_convert()),
238 intval($contact['id'])
// A reply without an XML declaration is not usable; stamp last-update and move on.
244 if(! strstr($handshake_xml,'<?xml')) {
245 logger('poller: response from ' . $url . ' did not contain XML.');
246 $r = q("UPDATE `contact` SET `last-update` = '%s' WHERE `id` = %d LIMIT 1",
247 dbesc(datetime_convert()),
248 intval($contact['id'])
254 $res = parse_xml_string($handshake_xml);
256 if(intval($res->status) == 1) {
257 logger("poller: $url replied status 1 - marking for death ");
259 // we may not be friends anymore. Will keep trying for one month.
260 // set the last-update so we don't keep polling
262 $r = q("UPDATE `contact` SET `last-update` = '%s' WHERE `id` = %d LIMIT 1",
263 dbesc(datetime_convert()),
264 intval($contact['id'])
267 mark_for_death($contact);
// A non-zero term-date means the contact was previously marked for death; clear that mark.
270 if($contact['term-date'] != '0000-00-00 00:00:00') {
271 logger("poller: $url back from the dead - removing mark for death");
272 unmark_for_death($contact);
// The handshake must report status 0 and carry both a challenge and a dfrn_id.
276 if((intval($res->status) != 0) || (! strlen($res->challenge)) || (! strlen($res->dfrn_id)))
// Both values arrive hex-encoded.
281 $sent_dfrn_id = hex2bin((string) $res->dfrn_id);
282 $challenge = hex2bin((string) $res->challenge);
// Two decryption paths: our private key for duplex contacts that have a stored prvkey,
// the contact's public key as the alternative. The decrypted challenge goes into $postvars.
286 if(($contact['duplex']) && strlen($contact['prvkey'])) {
287 openssl_private_decrypt($sent_dfrn_id,$final_dfrn_id,$contact['prvkey']);
288 openssl_private_decrypt($challenge,$postvars['challenge'],$contact['prvkey']);
291 openssl_public_decrypt($sent_dfrn_id,$final_dfrn_id,$contact['pubkey']);
292 openssl_public_decrypt($challenge,$postvars['challenge'],$contact['pubkey']);
// Keep only the part before the first '.', then drop a leading "<char>:" prefix if present.
// NOTE(review): when no '.' is present strpos() returns false and substr() yields an empty
// string, so the comparison with $orig_id below fails - confirm this is the desired outcome.
295 $final_dfrn_id = substr($final_dfrn_id, 0, strpos($final_dfrn_id, '.'));
297 if(strpos($final_dfrn_id,':') == 1)
298 $final_dfrn_id = substr($final_dfrn_id,2);
300 if($final_dfrn_id != $orig_id) {
301 logger('poller: ID did not decode: ' . $contact['id'] . ' orig: ' . $orig_id . ' final: ' . $final_dfrn_id);
302 // did not decode properly - cannot trust this site
// Second leg: POST the id, protocol version, permissions and decrypted challenge to the poll URL.
306 $postvars['dfrn_id'] = $idtosend;
307 $postvars['dfrn_version'] = DFRN_PROTOCOL_VERSION;
308 $postvars['perm'] = 'rw';
310 $xml = post_url($contact['poll'],$postvars);
312 elseif(($contact['network'] === NETWORK_OSTATUS)
313 || ($contact['network'] === NETWORK_DIASPORA)
314 || ($contact['network'] === NETWORK_FEED) ) {
316 // Upgrading DB fields from an older Friendika version
317 // Will only do this once per notify-enabled OStatus contact
318 // or if relationship changes
// Writable means: a notify address exists and the contact is a follower or a friend.
320 $stat_writeable = ((($contact['notify']) && ($contact['rel'] == CONTACT_IS_FOLLOWER || $contact['rel'] == CONTACT_IS_FRIEND)) ? 1 : 0);
322 if($stat_writeable != $contact['writable']) {
323 q("UPDATE `contact` SET `writable` = %d WHERE `id` = %d LIMIT 1",
324 intval($stat_writeable),
325 intval($contact['id'])
329 // Are we allowed to import from this person?
331 if($contact['rel'] == CONTACT_IS_FOLLOWER || $contact['blocked'] || $contact['readonly'])
334 $xml = fetch_url($contact['poll']);
336 elseif($contact['network'] === NETWORK_MAIL) {
// Mail polling counts as disabled when imap_open() is unavailable or system/imap_disabled is set.
338 $mail_disabled = ((function_exists('imap_open') && (! get_config('system','imap_disabled'))) ? 0 : 1);
// Fetch the user's private key and the first mail account that has a server configured.
343 $x = q("SELECT `prvkey` FROM `user` WHERE `uid` = %d LIMIT 1",
344 intval($importer_uid)
346 $mailconf = q("SELECT * FROM `mailacct` WHERE `server` != '' AND `uid` = %d LIMIT 1",
347 intval($importer_uid)
349 if(count($x) && count($mailconf)) {
350 $mailbox = construct_mailbox_name($mailconf[0]);
// The stored password is hex-encoded and encrypted; decrypt it with the user's private key.
352 openssl_private_decrypt(hex2bin($mailconf[0]['pass']),$password,$x[0]['prvkey']);
353 $mbox = email_connect($mailbox,$mailconf[0]['user'],$password);
356 q("UPDATE `mailacct` SET `last_check` = '%s' WHERE `id` = %d AND `uid` = %d LIMIT 1",
357 dbesc(datetime_convert()),
358 intval($mailconf[0]['id']),
359 intval($importer_uid)
365 $msgs = email_poll($mbox,$contact['addr']);
368 foreach($msgs as $msg_uid) {
370 $meta = email_msg_meta($mbox,$msg_uid);
371 $headers = email_msg_headers($mbox,$msg_uid);
373 // look for a 'references' header and try and match with a parent item we have locally.
375 $raw_refs = ((x($headers,'references')) ? str_replace("\t",'',$headers['references']) : '');
// The message id, without its surrounding angle brackets, becomes the item uri.
376 $datarray['uri'] = trim($meta->message_id,'<>');
379 $refs_arr = explode(' ', $raw_refs);
380 if(count($refs_arr)) {
// Escape each reference, strip angle brackets and spaces, and quote it for the IN ( ... ) list.
// NOTE(review): the loop counter reuses $x, overwriting the user query result stored in $x above.
381 for($x = 0; $x < count($refs_arr); $x ++)
382 $refs_arr[$x] = "'" . str_replace(array('<','>',' '),array('','',''),dbesc($refs_arr[$x])) . "'";
384 $qstr = implode(',',$refs_arr);
385 $r = q("SELECT `uri` , `parent-uri` FROM `item` WHERE `uri` IN ( $qstr ) AND `uid` = %d LIMIT 1",
386 intval($importer_uid)
389 $datarray['parent-uri'] = $r[0]['uri'];
// Without a matching parent the message is its own parent, i.e. a top-level item.
393 if(! x($datarray,'parent-uri'))
394 $datarray['parent-uri'] = $datarray['uri'];
396 // Have we seen it before?
397 $r = q("SELECT * FROM `item` WHERE `uid` = %d AND `uri` = '%s' LIMIT 1",
398 intval($importer_uid),
399 dbesc($datarray['uri'])
// The message metadata flags it as deleted but the local item is not: mark the item deleted.
403 if($meta->deleted && ! $r[0]['deleted']) {
404 q("UPDATE `item` SET `deleted` = 1, `changed` = '%s' WHERE `id` = %d LIMIT 1",
405 dbesc(datetime_convert()),
411 $datarray['title'] = notags(trim($meta->subject));
412 $datarray['created'] = datetime_convert('UTC','UTC',$meta->date);
414 $r = email_get_msg($mbox,$msg_uid);
417 $datarray['body'] = escape_tags($r['body']);
419 // some mailing lists have the original author as 'from' - add this sender info to msg body.
420 // todo: adding a gravatar for the original author would be cool
422 if(! stristr($meta->from,$contact['addr']))
423 $datarray['body'] = t('From: ') . escape_tags($meta->from) . "\n\n" . $datarray['body'];
425 $datarray['uid'] = $importer_uid;
426 $datarray['contact-id'] = $contact['id'];
// Top-level messages are private. Unless the user allows public email replies, every
// message is private and restricted to this contact.
427 if($datarray['parent-uri'] === $datarray['uri'])
428 $datarray['private'] = 1;
429 if(! get_pconfig($importer_uid,'system','allow_public_email_replies')) {
430 $datarray['private'] = 1;
431 $datarray['allow_cid'] = '<' . $contact['id'] . '>';
433 $datarray['author-name'] = $contact['name'];
434 $datarray['author-link'] = 'mailbox';
435 $datarray['author-avatar'] = $contact['photo'];
// Store the item, clear `last-child` across its thread, then set `last-child` on one item by id.
437 $stored_item = item_store($datarray);
438 q("UPDATE `item` SET `last-child` = 0 WHERE `parent-uri` = '%s' AND `uid` = %d",
439 dbesc($datarray['parent-uri']),
440 intval($importer_uid)
442 q("UPDATE `item` SET `last-child` = 1 WHERE `id` = %d LIMIT 1",
451 elseif($contact['network'] === NETWORK_FACEBOOK) {
452 // This is picked up by the Facebook plugin on a cron hook.
457 logger('poller: received xml : ' . $xml, LOGGER_DATA);
// Feed data without an XML declaration is rejected; last-update is still stamped.
459 if(! strstr($xml,'<?xml')) {
460 logger('poller: post_handshake: response from ' . $url . ' did not contain XML.');
461 $r = q("UPDATE `contact` SET `last-update` = '%s' WHERE `id` = %d LIMIT 1",
462 dbesc(datetime_convert()),
463 intval($contact['id'])
469 consume_feed($xml,$importer,$contact,$hub,1, true);
471 // do it twice. Ensures that children of parents which may be later in the stream aren't tossed
473 consume_feed($xml,$importer,$contact,$hub,1);
// Subscribe only when a hub string is set, a hub update is due, and the contact is either
// a friend or an OStatus contact that is not read-only. $hub may list several hubs, comma-separated.
476 if((strlen($hub)) && ($hub_update) && (($contact['rel'] == CONTACT_IS_FRIEND) || (($contact['network'] === NETWORK_OSTATUS) && (! $contact['readonly'])))) {
477 logger('poller: subscribing to hub(s) : ' . $hub . ' contact name : ' . $contact['name'] . ' local user : ' . $importer['name']);
478 $hubs = explode(',', $hub);
480 foreach($hubs as $h) {
484 subscribe_to_hub($h,$importer,$contact);
// Stamp both `last-update` and `success_update` on the contact row.
490 $updated = datetime_convert();
492 $r = q("UPDATE `contact` SET `last-update` = '%s', `success_update` = '%s' WHERE `id` = %d LIMIT 1",
495 intval($contact['id'])
498 // loop - next contact
// Run the poller only when this file is the script that was executed directly.
// get_included_files() lists the entry script first, so array_search() returning
// index 0 (checked strictly with ===) means this file was not merely included.
506 if (array_search(__file__,get_included_files())===0){
507 poller_run($argv,$argc);