3 * @file include/socgraph.php
5 * @todo Move GNU Social URL schemata (http://server.tld/user/number) to http://server.tld/username
6 * @todo Fetch profile data from profile page for Redmatrix users
7 * @todo Detect if it is a forum
10 require_once('include/datetime.php');
11 require_once("include/Scrape.php");
12 require_once("include/html2bbcode.php");
18 * Given a contact-id (minimum), load the PortableContacts friend list for that contact,
19 * and add the entries to the gcontact (Global Contact) table, or update existing entries
20 * if anything (name or photo) has changed.
21 * We use normalised urls for comparison which ignore http vs https and www.domain vs domain
23 * Once the global contact is stored add (if necessary) the contact linkage which associates
24 * the given uid, cid to the global contact entry. There can be many uid/cid combinations
25 * pointing to the same global contact id.
// poco_load: fetch a PortableContacts (poco) feed and hand every entry to poco_check().
//
// Parameters:
//   $cid  - contact id; used to read the poco and uid columns of the contact table
//           when $url or $uid is not supplied.
//   $uid  - owner uid (default 0); when set, /@me/@all is put in front of the query string.
//   $zcid - passed through to poco_check() (default 0).
//   $url  - base poco URL (default null).
//
// Visible flow: append a fixed fields list to the URL, log it, test the HTTP code
// (above 299) and the body (empty), test that the decoded JSON has an entry member,
// then loop over the entries. For each entry it reads displayName, the profile and
// webfinger urls, the profile photo, updated, network, currentLocation, aboutMe
// (converted with html2bbcode), gender, generation and tags, calls poco_check(), and
// updates contact rows matching the normalised profile url with network NETWORK_DFRN
// when location, about, keywords or gender is non-empty. At the end it deletes glink
// rows (filtered by cid, uid and zcid) whose updated value is older than two days.
//
// NOTE(review): the action taken after the two guard conditions is presumably an early
// return - TODO confirm.
// NOTE(review): the loop over the entry urls names its loop variable $url, which is also
// the name of the $url parameter.
// NOTE(review): generation is only taken from the entry when it is greater than 0, and the
// pre-increment also modifies the entry object itself.
// NOTE(review): the tags loop assigns $keywords on every iteration from an implode of the
// current $tag, so only the last element survives and $tag is treated as an array -
// this looks unintended, verify against the feed format.
32 function poco_load($cid,$uid = 0,$zcid = 0,$url = null) {
37 if((! $url) || (! $uid)) {
38 $r = q("select `poco`, `uid` from `contact` where `id` = %d limit 1",
53 $url = $url . (($uid) ? '/@me/@all?fields=displayName,urls,photos,updated,network,aboutMe,currentLocation,tags,gender,generation' : '?fields=displayName,urls,photos,updated,network,aboutMe,currentLocation,tags,gender,generation') ;
55 logger('poco_load: ' . $url, LOGGER_DEBUG);
59 logger('poco_load: returns ' . $s, LOGGER_DATA);
61 logger('poco_load: return code: ' . $a->get_curl_code(), LOGGER_DEBUG);
63 if(($a->get_curl_code() > 299) || (! $s))
68 logger('poco_load: json: ' . print_r($j,true),LOGGER_DATA);
70 if(! isset($j->entry))
74 foreach($j->entry as $entry) {
82 $updated = '0000-00-00 00:00:00';
89 $name = $entry->displayName;
91 if(isset($entry->urls)) {
92 foreach($entry->urls as $url) {
93 if($url->type == 'profile') {
94 $profile_url = $url->value;
97 if($url->type == 'webfinger') {
98 $connect_url = str_replace('acct:' , '', $url->value);
103 if(isset($entry->photos)) {
104 foreach($entry->photos as $photo) {
105 if($photo->type == 'profile') {
106 $profile_photo = $photo->value;
112 if(isset($entry->updated))
113 $updated = date("Y-m-d H:i:s", strtotime($entry->updated));
115 if(isset($entry->network))
116 $network = $entry->network;
118 if(isset($entry->currentLocation))
119 $location = $entry->currentLocation;
121 if(isset($entry->aboutMe))
122 $about = html2bbcode($entry->aboutMe);
124 if(isset($entry->gender))
125 $gender = $entry->gender;
127 if(isset($entry->generation) AND ($entry->generation > 0))
128 $generation = ++$entry->generation;
130 if(isset($entry->tags))
131 foreach($entry->tags as $tag)
132 $keywords = implode(", ", $tag);
134 // If you query a Friendica server for its profiles, the network has to be Friendica
135 /// TODO It could also be a Redmatrix server
137 // $network = NETWORK_DFRN;
139 poco_check($profile_url, $name, $network, $profile_photo, $about, $location, $gender, $keywords, $connect_url, $updated, $generation, $cid, $uid, $zcid);
141 // Update the Friendica contacts. Diaspora is doing it via a message. (See include/diaspora.php)
142 if (($location != "") OR ($about != "") OR ($keywords != "") OR ($gender != ""))
143 q("UPDATE `contact` SET `location` = '%s', `about` = '%s', `keywords` = '%s', `gender` = '%s'
144 WHERE `nurl` = '%s' AND NOT `self` AND `network` = '%s'",
149 dbesc(normalise_link($profile_url)),
150 dbesc(NETWORK_DFRN));
152 logger("poco_load: loaded $total entries",LOGGER_DEBUG);
154 q("DELETE FROM `glink` WHERE `cid` = %d AND `uid` = %d AND `zcid` = %d AND `updated` < UTC_TIMESTAMP - INTERVAL 2 DAY",
// poco_check: validate one profile and create or refresh its gcontact row and, as the
// later glink statements show, the glink row that ties it to a cid/uid/zcid.
//
// Parameters: profile url, display name, network, photo url, about text, location,
// gender, keywords, connect address, updated timestamp and generation describe the
// profile; $cid, $uid and $zcid (all default 0) identify the linking contact.
//
// Visible flow:
//   1. Guards on an empty profile url, a url without scheme, and a fixed list of hosts
//      (facebook, twitter, identi.ca, alpha.app.net). The action of each guard is
//      presumably an early return - TODO confirm.
//   2. Tests for NETWORK_STATUSNET as network and for a locally cached /photo/ avatar
//      (generation other than 1); the action taken in both cases is not visible here.
//   3. Looks up the network in the contact table by normalised url, and by alias when
//      the network is still empty or OStatus.
//   4. Loads an existing gcontact row by normalised url and falls back to its network,
//      updated, created, server_url, nick and addr values.
//   5. When network, name, addr, photo or server url is empty, or the url has the
//      alternate OStatus form, and poco_reachable() succeeds, the profile is probed
//      with probe_url() and the probed values replace the inputs. For an alternate
//      OStatus url the old gcontact and glink rows are deleted and poco_check() is
//      called again with the probed url.
//   6. Tests for an empty name or photo and for networks other than DFRN, OStatus and
//      Diaspora (the action taken is not visible here), then calls poco_check_server().
//   7. Updates the existing gcontact row (when name, photo or updated changed) or
//      inserts a new one, reloads it, then inserts or touches the glink row.
//   8. Deletes gcontact rows with the same normalised url and another id that no glink
//      row references.
//
// NOTE(review): the nick derivation passes the result of explode() directly to end();
// end() takes its argument by reference, so PHP reports that only variables should be
// passed by reference. Assigning the exploded array to a variable first avoids this.
162 function poco_check($profile_url, $name, $network, $profile_photo, $about, $location, $gender, $keywords, $connect_url, $updated, $generation, $cid = 0, $uid = 0, $zcid = 0) {
168 // 1: Profiles on this server
169 // 2: Contacts of profiles on this server
170 // 3: Contacts of contacts of profiles on this server
175 $alternate = poco_alternate_ostatus_url($profile_url);
177 if ($profile_url == "")
180 $urlparts = parse_url($profile_url);
181 if (!isset($urlparts["scheme"]))
184 if (in_array($urlparts["host"], array("www.facebook.com", "facebook.com", "twitter.com",
185 "identi.ca", "alpha.app.net")))
188 $orig_updated = $updated;
190 // Don't store the statusnet connector as network
191 // We can't simply set this to NETWORK_OSTATUS since the connector could have fetched posts from friendica as well
192 if ($network == NETWORK_STATUSNET)
195 // The global contacts should contain the original picture, not the cached one
196 if (($generation != 1) AND stristr(normalise_link($profile_photo), normalise_link($a->get_baseurl()."/photo/")))
199 $r = q("SELECT `network` FROM `contact` WHERE `nurl` = '%s' AND `network` != '' AND `network` != '%s' LIMIT 1",
200 dbesc(normalise_link($profile_url)), dbesc(NETWORK_STATUSNET)
203 $network = $r[0]["network"];
205 if (($network == "") OR ($network == NETWORK_OSTATUS)) {
206 $r = q("SELECT `network`, `url` FROM `contact` WHERE `alias` IN ('%s', '%s') AND `network` != '' AND `network` != '%s' LIMIT 1",
207 dbesc($profile_url), dbesc(normalise_link($profile_url)), dbesc(NETWORK_STATUSNET)
210 $network = $r[0]["network"];
211 //$profile_url = $r[0]["url"];
215 $x = q("SELECT * FROM `gcontact` WHERE `nurl` = '%s' LIMIT 1",
216 dbesc(normalise_link($profile_url))
220 if (($network == "") AND ($x[0]["network"] != NETWORK_STATUSNET))
221 $network = $x[0]["network"];
223 if ($updated == "0000-00-00 00:00:00")
224 $updated = $x[0]["updated"];
226 $created = $x[0]["created"];
227 $server_url = $x[0]["server_url"];
228 $nick = $x[0]["nick"];
229 $addr = $x[0]["addr"];
231 $created = "0000-00-00 00:00:00";
234 $urlparts = parse_url($profile_url);
235 $nick = end(explode("/", $urlparts["path"]));
239 if ((($network == "") OR ($name == "") OR ($addr == "") OR ($profile_photo == "") OR ($server_url == "") OR $alternate)
240 AND poco_reachable($profile_url, $server_url, $network, false)) {
241 $data = probe_url($profile_url);
243 $orig_profile = $profile_url;
245 $network = $data["network"];
246 $name = $data["name"];
247 $nick = $data["nick"];
248 $addr = $data["addr"];
249 $profile_url = $data["url"];
250 $profile_photo = $data["photo"];
251 $server_url = $data["baseurl"];
253 if ($alternate AND ($network == NETWORK_OSTATUS)) {
254 // Delete the old entry - if it exists
255 $r = q("SELECT `id` FROM `gcontact` WHERE `nurl` = '%s'", dbesc(normalise_link($orig_profile)));
257 q("DELETE FROM `gcontact` WHERE `nurl` = '%s'", dbesc(normalise_link($orig_profile)));
258 q("DELETE FROM `glink` WHERE `gcid` = %d", intval($r[0]["id"]));
261 // possibly create a new entry
262 poco_check($profile_url, $name, $network, $profile_photo, $about, $location, $gender, $keywords, $connect_url, $updated, $generation, $cid, $uid, $zcid);
266 if ($alternate AND ($network == NETWORK_OSTATUS))
269 if (count($x) AND ($x[0]["network"] == "") AND ($network != "")) {
270 q("UPDATE `gcontact` SET `network` = '%s' WHERE `nurl` = '%s'",
272 dbesc(normalise_link($profile_url))
276 if (($name == "") OR ($profile_photo == ""))
279 if (!in_array($network, array(NETWORK_DFRN, NETWORK_OSTATUS, NETWORK_DIASPORA)))
282 logger("profile-check generation: ".$generation." Network: ".$network." URL: ".$profile_url." name: ".$name." avatar: ".$profile_photo, LOGGER_DEBUG);
284 poco_check_server($server_url, $network);
289 if (($location == "") AND ($x[0]['location'] != ""))
290 $location = $x[0]['location'];
292 if (($about == "") AND ($x[0]['about'] != ""))
293 $about = $x[0]['about'];
295 if (($gender == "") AND ($x[0]['gender'] != ""))
296 $gender = $x[0]['gender'];
298 if (($keywords == "") AND ($x[0]['keywords'] != ""))
299 $keywords = $x[0]['keywords'];
301 if (($addr == "") AND ($x[0]['addr'] != ""))
302 $addr = $x[0]['addr'];
304 if (($generation == 0) AND ($x[0]['generation'] > 0))
305 $generation = $x[0]['generation'];
307 if($x[0]['name'] != $name || $x[0]['photo'] != $profile_photo || $x[0]['updated'] < $updated) {
308 q("UPDATE `gcontact` SET `name` = '%s', `addr` = '%s', `network` = '%s', `photo` = '%s', `connect` = '%s', `url` = '%s', `server_url` = '%s',
309 `updated` = '%s', `location` = '%s', `about` = '%s', `keywords` = '%s', `gender` = '%s', `generation` = %d
310 WHERE (`generation` >= %d OR `generation` = 0) AND `nurl` = '%s'",
314 dbesc($profile_photo),
325 dbesc(normalise_link($profile_url))
329 q("INSERT INTO `gcontact` (`name`, `nick`, `addr`, `network`, `url`, `nurl`, `photo`, `connect`, `server_url`, `created`, `updated`, `location`, `about`, `keywords`, `gender`, `generation`)
330 VALUES ('%s', '%s', '%s', '%s', '%s', '%s', '%s', '%s', '%s', '%s', '%s', '%s', '%s', '%s', '%s', %d)",
336 dbesc(normalise_link($profile_url)),
337 dbesc($profile_photo),
340 dbesc(datetime_convert()),
348 $x = q("SELECT * FROM `gcontact` WHERE `nurl` = '%s' LIMIT 1",
349 dbesc(normalise_link($profile_url))
358 $r = q("SELECT * FROM `glink` WHERE `cid` = %d AND `uid` = %d AND `gcid` = %d AND `zcid` = %d LIMIT 1",
365 q("INSERT INTO `glink` (`cid`,`uid`,`gcid`,`zcid`, `updated`) VALUES (%d,%d,%d,%d, '%s') ",
370 dbesc(datetime_convert())
373 q("UPDATE `glink` SET `updated` = '%s' WHERE `cid` = %d AND `uid` = %d AND `gcid` = %d AND `zcid` = %d",
374 dbesc(datetime_convert()),
382 // For unknown reasons there are sometimes duplicates
383 q("DELETE FROM `gcontact` WHERE `nurl` = '%s' AND `id` != %d AND
384 NOT EXISTS (SELECT `gcid` FROM `glink` WHERE `gcid` = `gcontact`.`id`)",
385 dbesc(normalise_link($profile_url)),
// poco_reachable: report whether the server behind a profile can be reached.
//
// $profile is the profile url; $server, $network and $force are optional. The server
// is derived from the profile with poco_detect_server() (presumably only when $server
// is empty - TODO confirm), and the result of poco_check_server() is returned.
392 function poco_reachable($profile, $server = "", $network = "", $force = false) {
395 $server = poco_detect_server($profile);
400 return poco_check_server($server, $network, $force);
// poco_detect_server: derive the server base url from a profile url by stripping
// well-known profile path suffixes.
//
// Patterns tried in order, each only while $server_url is still empty:
//   /profile/  -> network NETWORK_DFRN
//   /u/        -> network NETWORK_DIASPORA
//   /channel/  -> network NETWORK_DIASPORA (Red style channel urls)
// A pattern counts as matched when the regex replacement changes the profile string.
// Presumably returns $server_url, which stays empty when nothing matches - TODO confirm,
// the return statement is not visible here.
403 function poco_detect_server($profile) {
405 // Try to detect the server path based upon some known standard paths
408 if ($server_url == "") {
409 $friendica = preg_replace("=(https?://)(.*)/profile/(.*)=ism", "$1$2", $profile);
410 if ($friendica != $profile) {
411 $server_url = $friendica;
412 $network = NETWORK_DFRN;
416 if ($server_url == "") {
417 $diaspora = preg_replace("=(https?://)(.*)/u/(.*)=ism", "$1$2", $profile);
418 if ($diaspora != $profile) {
419 $server_url = $diaspora;
420 $network = NETWORK_DIASPORA;
424 if ($server_url == "") {
425 $red = preg_replace("=(https?://)(.*)/channel/(.*)=ism", "$1$2", $profile);
426 if ($red != $profile) {
428 $network = NETWORK_DIASPORA;
// poco_alternate_ostatus_url: test whether $url has the numeric OStatus profile form
// (http or https, any host and path, then /user/ followed by digits).
//
// Returns the raw preg_match() result: 1 on a match, 0 on no match, false on a regex
// error. The pattern is not anchored, so it matches anywhere inside $url.
435 function poco_alternate_ostatus_url($url) {
436 return(preg_match("=https?://.+/user/\d+=ism", $url, $matches));
// poco_last_updated: refresh the stored gcontact data for one profile and return the
// time of its last update.
//
// Parameters:
//   $profile - profile url; every query matches on its normalised form.
//   $force   - when true, the poco_do_update() throttle for feed polling is skipped and
//              the flag is passed on to poco_check_server().
//
// Visible flow:
//   1. Load the gcontact rows, set created when it is still the zero date, and take the
//      server url from the row or from poco_detect_server().
//   2. When a server url is known, check it with poco_check_server(); on failure write
//      last_failure. The server url is written back, and an empty or feed network is
//      replaced by the network stored in gserver.
//   3. noscrape path (server url and nick known, server has a noscrape url): fetch
//      noscrape url + / + nick, decode the JSON and update name, photo, updated, gender,
//      about, community, keywords and location when they differ; mark last_contact when
//      data was returned; return the updated value from the noscrape data.
//   4. Feed path: unless forced, poco_do_update() decides whether to poll; if not, the
//      stored updated value is returned. Otherwise probe_url() is called. An alternate
//      OStatus url whose canonical url differs is deleted and re-created through
//      poco_check() and poco_last_updated() on the canonical url.
//   5. A probe without poll url, or with network feed or phantom, writes last_failure.
//      Otherwise name, nick, connect, photo and server_url are updated when changed,
//      the feed is fetched (last_failure on fetch error) and parsed as Atom.
//   6. The newest published or updated value over all entries becomes $last_updated;
//      an entry-less but valid feed yields the zero date. updated and last_contact are
//      written, generation 0 becomes 9, and $last_updated is returned.
//
// NOTE(review): both the pdesc and the about value from noscrape are written to the
// about column, so when both are set the later statement wins.
// NOTE(review): the probed addr value is compared with and stored in the connect column.
// NOTE(review): feed timestamps are compared as strings with the less-than operator;
// this only orders correctly when all values share one format and timezone - verify.
439 function poco_last_updated($profile, $force = false) {
441 $gcontacts = q("SELECT * FROM `gcontact` WHERE `nurl` = '%s'",
442 dbesc(normalise_link($profile)));
444 if ($gcontacts[0]["created"] == "0000-00-00 00:00:00")
445 q("UPDATE `gcontact` SET `created` = '%s' WHERE `nurl` = '%s'",
446 dbesc(datetime_convert()), dbesc(normalise_link($profile)));
448 if ($gcontacts[0]["server_url"] != "")
449 $server_url = $gcontacts[0]["server_url"];
451 $server_url = poco_detect_server($profile);
453 if ($server_url != "") {
454 if (!poco_check_server($server_url, $gcontacts[0]["network"], $force)) {
457 q("UPDATE `gcontact` SET `last_failure` = '%s' WHERE `nurl` = '%s'",
458 dbesc(datetime_convert()), dbesc(normalise_link($profile)));
463 q("UPDATE `gcontact` SET `server_url` = '%s' WHERE `nurl` = '%s'",
464 dbesc($server_url), dbesc(normalise_link($profile)));
467 if (in_array($gcontacts[0]["network"], array("", NETWORK_FEED))) {
468 $server = q("SELECT `network` FROM `gserver` WHERE `nurl` = '%s' AND `network` != ''",
469 dbesc(normalise_link($server_url)));
472 q("UPDATE `gcontact` SET `network` = '%s' WHERE `nurl` = '%s'",
473 dbesc($server[0]["network"]), dbesc(normalise_link($profile)));
478 // noscrape is really fast so we don't cache the call.
479 if (($gcontacts[0]["server_url"] != "") AND ($gcontacts[0]["nick"] != "")) {
481 // Use noscrape if possible
482 $server = q("SELECT `noscrape` FROM `gserver` WHERE `nurl` = '%s' AND `noscrape` != ''", dbesc(normalise_link($gcontacts[0]["server_url"])));
485 $noscraperet = z_fetch_url($server[0]["noscrape"]."/".$gcontacts[0]["nick"]);
487 if ($noscraperet["success"] AND ($noscraperet["body"] != "")) {
489 $noscrape = json_decode($noscraperet["body"], true);
491 if (($noscrape["fn"] != "") AND ($noscrape["fn"] != $gcontacts[0]["name"]))
492 q("UPDATE `gcontact` SET `name` = '%s' WHERE `nurl` = '%s'",
493 dbesc($noscrape["fn"]), dbesc(normalise_link($profile)));
495 if (($noscrape["photo"] != "") AND ($noscrape["photo"] != $gcontacts[0]["photo"]))
496 q("UPDATE `gcontact` SET `photo` = '%s' WHERE `nurl` = '%s'",
497 dbesc($noscrape["photo"]), dbesc(normalise_link($profile)));
499 if (($noscrape["updated"] != "") AND ($noscrape["updated"] != $gcontacts[0]["updated"]))
500 q("UPDATE `gcontact` SET `updated` = '%s' WHERE `nurl` = '%s'",
501 dbesc($noscrape["updated"]), dbesc(normalise_link($profile)));
503 if (($noscrape["gender"] != "") AND ($noscrape["gender"] != $gcontacts[0]["gender"]))
504 q("UPDATE `gcontact` SET `gender` = '%s' WHERE `nurl` = '%s'",
505 dbesc($noscrape["gender"]), dbesc(normalise_link($profile)));
507 if (($noscrape["pdesc"] != "") AND ($noscrape["pdesc"] != $gcontacts[0]["about"]))
508 q("UPDATE `gcontact` SET `about` = '%s' WHERE `nurl` = '%s'",
509 dbesc($noscrape["pdesc"]), dbesc(normalise_link($profile)));
511 if (($noscrape["about"] != "") AND ($noscrape["about"] != $gcontacts[0]["about"]))
512 q("UPDATE `gcontact` SET `about` = '%s' WHERE `nurl` = '%s'",
513 dbesc($noscrape["about"]), dbesc(normalise_link($profile)));
515 if (isset($noscrape["comm"]) AND ($noscrape["comm"] != $gcontacts[0]["community"]))
516 q("UPDATE `gcontact` SET `community` = %d WHERE `nurl` = '%s'",
517 intval($noscrape["comm"]), dbesc(normalise_link($profile)));
519 if (isset($noscrape["tags"]))
520 $keywords = implode(" ", $noscrape["tags"]);
524 if (($keywords != "") AND ($keywords != $gcontacts[0]["keywords"]))
525 q("UPDATE `gcontact` SET `keywords` = '%s' WHERE `nurl` = '%s'",
526 dbesc($keywords), dbesc(normalise_link($profile)));
528 $location = $noscrape["locality"];
530 if ($noscrape["region"] != "") {
534 $location .= $noscrape["region"];
537 if ($noscrape["country-name"] != "") {
541 $location .= $noscrape["country-name"];
544 if (($location != "") AND ($location != $gcontacts[0]["location"]))
545 q("UPDATE `gcontact` SET `location` = '%s' WHERE `nurl` = '%s'",
546 dbesc($location), dbesc(normalise_link($profile)));
548 // If we got data from noscrape then mark the contact as reachable
549 if (is_array($noscrape) AND count($noscrape))
550 q("UPDATE `gcontact` SET `last_contact` = '%s' WHERE `nurl` = '%s'",
551 dbesc(datetime_convert()), dbesc(normalise_link($profile)));
553 return $noscrape["updated"];
558 // If we only can poll the feed, then we only do this once a while
559 if (!$force AND !poco_do_update($gcontacts[0]["created"], $gcontacts[0]["updated"], $gcontacts[0]["last_failure"], $gcontacts[0]["last_contact"]))
560 return $gcontacts[0]["updated"];
562 $data = probe_url($profile);
564 // Is the profile link the alternate OStatus link notation? (http://domain.tld/user/4711)
565 // Then check the other link and delete this one
566 if (($data["network"] == NETWORK_OSTATUS) AND poco_alternate_ostatus_url($profile) AND
567 (normalise_link($profile) == normalise_link($data["alias"])) AND
568 (normalise_link($profile) != normalise_link($data["url"]))) {
570 // Delete the old entry
571 q("DELETE FROM `gcontact` WHERE `nurl` = '%s'", dbesc(normalise_link($profile)));
572 q("DELETE FROM `glink` WHERE `gcid` = %d", intval($gcontacts[0]["id"]));
574 poco_check($data["url"], $data["name"], $data["network"], $data["photo"], $gcontacts[0]["about"], $gcontacts[0]["location"],
575 $gcontacts[0]["gender"], $gcontacts[0]["keywords"], $data["addr"], $gcontacts[0]["updated"], $gcontacts[0]["generation"]);
577 poco_last_updated($data["url"], $force);
582 if (($data["poll"] == "") OR (in_array($data["network"], array(NETWORK_FEED, NETWORK_PHANTOM)))) {
583 q("UPDATE `gcontact` SET `last_failure` = '%s' WHERE `nurl` = '%s'",
584 dbesc(datetime_convert()), dbesc(normalise_link($profile)));
588 if (($data["name"] != "") AND ($data["name"] != $gcontacts[0]["name"]))
589 q("UPDATE `gcontact` SET `name` = '%s' WHERE `nurl` = '%s'",
590 dbesc($data["name"]), dbesc(normalise_link($profile)));
592 if (($data["nick"] != "") AND ($data["nick"] != $gcontacts[0]["nick"]))
593 q("UPDATE `gcontact` SET `nick` = '%s' WHERE `nurl` = '%s'",
594 dbesc($data["nick"]), dbesc(normalise_link($profile)));
596 if (($data["addr"] != "") AND ($data["addr"] != $gcontacts[0]["connect"]))
597 q("UPDATE `gcontact` SET `connect` = '%s' WHERE `nurl` = '%s'",
598 dbesc($data["addr"]), dbesc(normalise_link($profile)));
600 if (($data["photo"] != "") AND ($data["photo"] != $gcontacts[0]["photo"]))
601 q("UPDATE `gcontact` SET `photo` = '%s' WHERE `nurl` = '%s'",
602 dbesc($data["photo"]), dbesc(normalise_link($profile)));
604 if (($data["baseurl"] != "") AND ($data["baseurl"] != $gcontacts[0]["server_url"]))
605 q("UPDATE `gcontact` SET `server_url` = '%s' WHERE `nurl` = '%s'",
606 dbesc($data["baseurl"]), dbesc(normalise_link($profile)));
608 $feedret = z_fetch_url($data["poll"]);
610 if (!$feedret["success"]) {
611 q("UPDATE `gcontact` SET `last_failure` = '%s' WHERE `nurl` = '%s'",
612 dbesc(datetime_convert()), dbesc(normalise_link($profile)));
616 $doc = new DOMDocument();
617 @$doc->loadXML($feedret["body"]);
619 $xpath = new DomXPath($doc);
620 $xpath->registerNamespace('atom', "http://www.w3.org/2005/Atom");
622 $entries = $xpath->query('/atom:feed/atom:entry');
626 foreach ($entries AS $entry) {
627 $published = $xpath->query('atom:published/text()', $entry)->item(0)->nodeValue;
628 $updated = $xpath->query('atom:updated/text()', $entry)->item(0)->nodeValue;
630 if ($last_updated < $published)
631 $last_updated = $published;
633 if ($last_updated < $updated)
634 $last_updated = $updated;
637 // Maybe there aren't any entries. Then check if it is a valid feed
638 if ($last_updated == "")
639 if ($xpath->query('/atom:feed')->length > 0)
640 $last_updated = "0000-00-00 00:00:00";
642 q("UPDATE `gcontact` SET `updated` = '%s', `last_contact` = '%s' WHERE `nurl` = '%s'",
643 dbesc($last_updated), dbesc(datetime_convert()), dbesc(normalise_link($profile)));
645 if (($gcontacts[0]["generation"] == 0))
646 q("UPDATE `gcontact` SET `generation` = 9 WHERE `nurl` = '%s'",
647 dbesc(normalise_link($profile)));
649 return($last_updated);
// poco_do_update: throttle decision - should a contact or server be polled again now?
//
// All four parameters are date strings. The contact time is the later of $updated and
// $last_contact (picked by string comparison, then converted with strtotime). A created
// time that converts to zero or less is replaced by the current time.
//
// Visible rules, evaluated in this order:
//   - last contact less than 24 hours ago
//   - last failure less than 24 hours ago
//   - last contact and creation both more than a week ago, last failure within a week
//   - last contact and creation both more than 30 days ago, last failure within 30 days
// Each rule presumably returns false (do not update) and the function presumably
// returns true otherwise - TODO confirm, the return statements are not visible here.
652 function poco_do_update($created, $updated, $last_failure, $last_contact) {
653 $now = strtotime(datetime_convert());
655 if ($updated > $last_contact)
656 $contact_time = strtotime($updated);
658 $contact_time = strtotime($last_contact);
660 $failure_time = strtotime($last_failure);
661 $created_time = strtotime($created);
663 // If there is no "created" time then use the current time
664 if ($created_time <= 0)
665 $created_time = $now;
667 // If the last contact was less than 24 hours then don't update
668 if (($now - $contact_time) < (60 * 60 * 24))
671 // If the last failure was less than 24 hours then don't update
672 if (($now - $failure_time) < (60 * 60 * 24))
675 // If the last contact was less than a week ago and the last failure is older than a week then don't update
676 //if ((($now - $contact_time) < (60 * 60 * 24 * 7)) AND ($contact_time > $failure_time))
679 // If the last contact time was more than a week ago and the contact was created more than a week ago, then only try once a week
680 if ((($now - $contact_time) > (60 * 60 * 24 * 7)) AND (($now - $created_time) > (60 * 60 * 24 * 7)) AND (($now - $failure_time) < (60 * 60 * 24 * 7)))
683 // If the last contact time was more than a month ago and the contact was created more than a month ago, then only try once a month
684 if ((($now - $contact_time) > (60 * 60 * 24 * 30)) AND (($now - $created_time) > (60 * 60 * 24 * 30)) AND (($now - $failure_time) < (60 * 60 * 24 * 30)))
// poco_to_boolean: normalise a loosely typed flag value.
//
// The first test accepts the string true or the number 1, the second the string false
// or the number 0; both use loose comparison. The values returned by each branch and
// for unmatched input are not visible here - presumably true, false and the unchanged
// value respectively, TODO confirm.
690 function poco_to_boolean($val) {
691 if (($val == "true") OR ($val == 1))
693 if (($val == "false") OR ($val == 0))
// poco_check_server: probe a remote server, detect its platform, and store the result
// in the gserver table.
//
// Parameters:
//   $server_url - base url of the server; an empty value is guarded against first.
//   $network    - network hint from the caller (default empty).
//   $force      - when true, the poco_do_update() throttle is bypassed.
//
// Visible flow:
//   1. Load the gserver row by normalised url. For a known server the stored values are
//      used, and unless forced, poco_do_update() may short-circuit with the cached
//      verdict: last_contact greater than or equal to last_failure.
//   2. Otherwise defaults are set and discovery starts. The url is switched to https and
//      /.well-known/host-meta is fetched; on failure the same is tried over http.
//   3. If host-meta still fails and the HTTP code is not 403, last_failure is set. The
//      elseif branch marks last_contact for Diaspora.
//   4. Platform detection, later probes overwriting earlier ones: X-Diaspora-Version
//      response header, /api/statusnet/version.json, /api/gnusocial/version.json,
//      /api/statusnet/config.json (hubzilla, redmatrix, friendica sections plus the
//      registration policy), /statistics.json, then /friendica/json with /friendika/json
//      as fallback, and finally /poco.
//   5. The gserver row is updated or inserted and the end of discovery is logged.
//
// The final return value is not visible here; callers in this file treat the result as
// a boolean reachability verdict.
//
// NOTE(review): the noscrape section tests $failure, but no assignment to $failure is
// visible in this listing - confirm it is always initialised.
// NOTE(review): the INSERT names 13 columns and has 13 placeholders, while the visible
// argument list ends with one more datetime_convert() after last_failure; that trailing
// argument looks superfluous - verify against the full argument list.
// NOTE(review): the first host-meta check silences sizeof() with the at-sign, the
// second one does not.
699 function poco_check_server($server_url, $network = "", $force = false) {
701 if ($server_url == "")
704 $servers = q("SELECT * FROM `gserver` WHERE `nurl` = '%s'", dbesc(normalise_link($server_url)));
707 if ($servers[0]["created"] == "0000-00-00 00:00:00")
708 q("UPDATE `gserver` SET `created` = '%s' WHERE `nurl` = '%s'",
709 dbesc(datetime_convert()), dbesc(normalise_link($server_url)));
711 $poco = $servers[0]["poco"];
712 $noscrape = $servers[0]["noscrape"];
715 $network = $servers[0]["network"];
717 $last_contact = $servers[0]["last_contact"];
718 $last_failure = $servers[0]["last_failure"];
719 $version = $servers[0]["version"];
720 $platform = $servers[0]["platform"];
721 $site_name = $servers[0]["site_name"];
722 $info = $servers[0]["info"];
723 $register_policy = $servers[0]["register_policy"];
725 if (!$force AND !poco_do_update($servers[0]["created"], "", $last_failure, $last_contact)) {
726 logger("Use cached data for server ".$server_url, LOGGER_DEBUG);
727 return ($last_contact >= $last_failure);
736 $register_policy = -1;
738 $last_contact = "0000-00-00 00:00:00";
739 $last_failure = "0000-00-00 00:00:00";
741 logger("Server ".$server_url." is outdated or unknown. Start discovery. Force: ".$force." Created: ".$servers[0]["created"]." Failure: ".$last_failure." Contact: ".$last_contact, LOGGER_DEBUG);
744 $orig_last_failure = $last_failure;
746 // Check if the page is accessible via SSL.
747 $server_url = str_replace("http://", "https://", $server_url);
748 $serverret = z_fetch_url($server_url."/.well-known/host-meta");
750 // Maybe the page is unencrypted only?
751 $xmlobj = @simplexml_load_string($serverret["body"],'SimpleXMLElement',0, "http://docs.oasis-open.org/ns/xri/xrd-1.0");
752 if (!$serverret["success"] OR ($serverret["body"] == "") OR (@sizeof($xmlobj) == 0) OR !is_object($xmlobj)) {
753 $server_url = str_replace("https://", "http://", $server_url);
754 $serverret = z_fetch_url($server_url."/.well-known/host-meta");
756 $xmlobj = @simplexml_load_string($serverret["body"],'SimpleXMLElement',0, "http://docs.oasis-open.org/ns/xri/xrd-1.0");
759 if (!$serverret["success"] OR ($serverret["body"] == "") OR (sizeof($xmlobj) == 0) OR !is_object($xmlobj)) {
760 // Workaround for bad configured servers (known nginx problem)
761 if ($serverret["debug"]["http_code"] != "403") {
762 $last_failure = datetime_convert();
765 } elseif ($network == NETWORK_DIASPORA)
766 $last_contact = datetime_convert();
770 $serverret = z_fetch_url($server_url);
772 $lines = explode("\n",$serverret["header"]);
774 foreach($lines as $line) {
776 if(stristr($line,'X-Diaspora-Version:')) {
777 $platform = "Diaspora";
778 $version = trim(str_replace("X-Diaspora-Version:", "", $line));
779 $version = trim(str_replace("x-diaspora-version:", "", $version));
780 $network = NETWORK_DIASPORA;
786 // Test for Statusnet
787 // Will also return data for Friendica and GNU Social - but it will be overwritten later
788 // The "not implemented" is a special treatment for really, really old Friendica versions
789 $serverret = z_fetch_url($server_url."/api/statusnet/version.json");
790 if ($serverret["success"] AND ($serverret["body"] != '{"error":"not implemented"}') AND ($serverret["body"] != '') AND (strlen($serverret["body"]) < 250)) {
791 $platform = "StatusNet";
792 $version = trim($serverret["body"], '"');
793 $network = NETWORK_OSTATUS;
796 // Test for GNU Social
797 $serverret = z_fetch_url($server_url."/api/gnusocial/version.json");
798 if ($serverret["success"] AND ($serverret["body"] != '{"error":"not implemented"}') AND ($serverret["body"] != '') AND (strlen($serverret["body"]) < 250)) {
799 $platform = "GNU Social";
800 $version = trim($serverret["body"], '"');
801 $network = NETWORK_OSTATUS;
804 $serverret = z_fetch_url($server_url."/api/statusnet/config.json");
805 if ($serverret["success"]) {
806 $data = json_decode($serverret["body"]);
808 if (isset($data->site->server)) {
809 $last_contact = datetime_convert();
811 if (isset($data->site->hubzilla)) {
812 $platform = $data->site->hubzilla->PLATFORM_NAME;
813 $version = $data->site->hubzilla->RED_VERSION;
814 $network = NETWORK_DIASPORA;
816 if (isset($data->site->redmatrix)) {
817 if (isset($data->site->redmatrix->PLATFORM_NAME))
818 $platform = $data->site->redmatrix->PLATFORM_NAME;
819 elseif (isset($data->site->redmatrix->RED_PLATFORM))
820 $platform = $data->site->redmatrix->RED_PLATFORM;
822 $version = $data->site->redmatrix->RED_VERSION;
823 $network = NETWORK_DIASPORA;
825 if (isset($data->site->friendica)) {
826 $platform = $data->site->friendica->FRIENDICA_PLATFORM;
827 $version = $data->site->friendica->FRIENDICA_VERSION;
828 $network = NETWORK_DFRN;
831 $site_name = $data->site->name;
833 $data->site->closed = poco_to_boolean($data->site->closed);
834 $data->site->private = poco_to_boolean($data->site->private);
835 $data->site->inviteonly = poco_to_boolean($data->site->inviteonly);
837 if (!$data->site->closed AND !$data->site->private and $data->site->inviteonly)
838 $register_policy = REGISTER_APPROVE;
839 elseif (!$data->site->closed AND !$data->site->private)
840 $register_policy = REGISTER_OPEN;
842 $register_policy = REGISTER_CLOSED;
847 // Query statistics.json. Optional package for Diaspora, Friendica and Redmatrix
849 $serverret = z_fetch_url($server_url."/statistics.json");
850 if ($serverret["success"]) {
851 $data = json_decode($serverret["body"]);
853 $version = $data->version;
855 $site_name = $data->name;
857 if (isset($data->network) AND ($platform == ""))
858 $platform = $data->network;
860 if ($platform == "Diaspora")
861 $network = NETWORK_DIASPORA;
863 if ($data->registrations_open)
864 $register_policy = REGISTER_OPEN;
866 $register_policy = REGISTER_CLOSED;
868 if (isset($data->version))
869 $last_contact = datetime_convert();
873 // Check for noscrape
874 // Friendica servers could be detected as OStatus servers
875 if (!$failure AND in_array($network, array(NETWORK_DFRN, NETWORK_OSTATUS))) {
876 $serverret = z_fetch_url($server_url."/friendica/json");
878 if (!$serverret["success"])
879 $serverret = z_fetch_url($server_url."/friendika/json");
881 if ($serverret["success"]) {
882 $data = json_decode($serverret["body"]);
884 if (isset($data->version)) {
885 $last_contact = datetime_convert();
886 $network = NETWORK_DFRN;
888 $noscrape = $data->no_scrape_url;
889 $version = $data->version;
890 $site_name = $data->site_name;
892 $register_policy_str = $data->register_policy;
893 $platform = $data->platform;
895 switch ($register_policy_str) {
896 case "REGISTER_CLOSED":
897 $register_policy = REGISTER_CLOSED;
899 case "REGISTER_APPROVE":
900 $register_policy = REGISTER_APPROVE;
902 case "REGISTER_OPEN":
903 $register_policy = REGISTER_OPEN;
912 $serverret = z_fetch_url($server_url."/poco");
913 if ($serverret["success"]) {
914 $data = json_decode($serverret["body"]);
915 if (isset($data->totalResults)) {
916 $poco = $server_url."/poco";
917 $last_contact = datetime_convert();
922 // Check again if the server exists
923 $servers = q("SELECT `nurl` FROM `gserver` WHERE `nurl` = '%s'", dbesc(normalise_link($server_url)));
926 q("UPDATE `gserver` SET `url` = '%s', `version` = '%s', `site_name` = '%s', `info` = '%s', `register_policy` = %d, `poco` = '%s', `noscrape` = '%s',
927 `network` = '%s', `platform` = '%s', `last_contact` = '%s', `last_failure` = '%s' WHERE `nurl` = '%s'",
932 intval($register_policy),
937 dbesc($last_contact),
938 dbesc($last_failure),
939 dbesc(normalise_link($server_url))
942 q("INSERT INTO `gserver` (`url`, `nurl`, `version`, `site_name`, `info`, `register_policy`, `poco`, `noscrape`, `network`, `platform`, `created`, `last_contact`, `last_failure`)
943 VALUES ('%s', '%s', '%s', '%s', '%s', %d, '%s', '%s', '%s', '%s', '%s', '%s', '%s')",
945 dbesc(normalise_link($server_url)),
949 intval($register_policy),
954 dbesc(datetime_convert()),
955 dbesc($last_contact),
956 dbesc($last_failure),
957 dbesc(datetime_convert())
960 logger("End discovery for server ".$server_url, LOGGER_DEBUG);
// poco_contact_from_body: scan an item body for [share] blocks and register the shared
// author of each one as a global contact.
//
// preg_replace_callback() is used purely as an iterator here: the statement does not
// assign its result, and every match (attribute text of the share tag in group 1) is
// handed to sub_poco_from_share() together with $created, $cid and $uid.
965 function poco_contact_from_body($body, $created, $cid, $uid) {
966 preg_replace_callback("/\[share(.*?)\].*?\[\/share\]/ism",
967 function ($match) use ($created, $cid, $uid){
968 return(sub_poco_from_share($match, $created, $cid, $uid));
// sub_poco_from_share: callback for poco_contact_from_body(); extract the profile url
// from the attributes of one share tag and pass it to poco_check().
//
// $share is the regex match array; index 1 holds the attribute text. The profile
// attribute is looked up in its single-quoted form first and then in its double-quoted
// form, so the double-quoted value wins when both are present. poco_check() is called
// with only the profile url, the $created timestamp, generation 3, $cid and $uid; all
// other fields are passed as empty strings.
// NOTE(review): any guard between the extraction and the poco_check() call (for
// example on an empty profile) is not visible here.
972 function sub_poco_from_share($share, $created, $cid, $uid) {
974 preg_match("/profile='(.*?)'/ism", $share[1], $matches);
975 if ($matches[1] != "")
976 $profile = $matches[1];
978 preg_match('/profile="(.*?)"/ism', $share[1], $matches);
979 if ($matches[1] != "")
980 $profile = $matches[1];
985 logger("prepare poco_check for profile ".$profile, LOGGER_DEBUG);
986 poco_check($profile, "", "", "", "", "", "", "", "", $created, 3, $cid, $uid);
// poco_store: register the author of a stored item as a global contact.
//
// $item is an item array; the keys read here are private, network, uid, uri,
// parent-uri, author-link, author-name, author-avatar, received, contact-id and body.
//
// Visible flow:
//   1. Tests for private items and for networks other than DFRN, Diaspora, OStatus,
//      StatusNet or empty. The action taken is presumably an early return - TODO confirm.
//   2. Only global copies (uid 0) or comments whose parent exists as a global copy are
//      processed further.
//   3. The generation is derived from the author: a self contact on this server is
//      logged as generation 1 with network DFRN, a contact of a local user as
//      generation 2 (taking network and url from that contact row), anything else as
//      generation 3.
//   4. poco_check() is called for the author, then poco_contact_from_body() scans the
//      body for shared items.
//
// NOTE(review): the parent lookup passes the parent-uri value to q() without dbesc(),
// unlike every other string argument in this file. Unless q() escapes its arguments
// itself, this value should be wrapped in dbesc() - verify.
989 function poco_store($item) {
992 if ($item['private'])
995 // Or is it from a network where we don't store the global contacts?
996 if (!in_array($item["network"], array(NETWORK_DFRN, NETWORK_DIASPORA, NETWORK_OSTATUS, NETWORK_STATUSNET, "")))
999 // Is it a global copy?
1000 $store_gcontact = ($item["uid"] == 0);
1002 // Is it a comment on a global copy?
1003 if (!$store_gcontact AND ($item["uri"] != $item["parent-uri"])) {
1004 $q = q("SELECT `id` FROM `item` WHERE `uri`='%s' AND `uid` = 0", $item["parent-uri"]);
1005 $store_gcontact = count($q);
1008 if (!$store_gcontact)
1011 // "3" means: We don't know this contact directly (Maybe a reshared item)
1014 $profile_url = $item["author-link"];
1016 // Is it a user from our server?
1017 $q = q("SELECT `id` FROM `contact` WHERE `self` AND `nurl` = '%s' LIMIT 1",
1018 dbesc(normalise_link($item["author-link"])));
1020 logger("Our user (generation 1): ".$item["author-link"], LOGGER_DEBUG);
1022 $network = NETWORK_DFRN;
1023 } else { // Is it a contact from a user on our server?
1024 $q = q("SELECT `network`, `url` FROM `contact` WHERE `uid` != 0 AND `network` != ''
1025 AND (`nurl` = '%s' OR `alias` IN ('%s', '%s')) AND `network` != '%s' LIMIT 1",
1026 dbesc(normalise_link($item["author-link"])),
1027 dbesc(normalise_link($item["author-link"])),
1028 dbesc($item["author-link"]),
1029 dbesc(NETWORK_STATUSNET));
1032 $network = $q[0]["network"];
1033 $profile_url = $q[0]["url"];
1034 logger("Known contact (generation 2): ".$profile_url, LOGGER_DEBUG);
1038 if ($generation == 3)
1039 logger("Unknown contact (generation 3): ".$item["author-link"], LOGGER_DEBUG);
1041 poco_check($profile_url, $item["author-name"], $network, $item["author-avatar"], "", "", "", "", "", $item["received"], $generation, $item["contact-id"], $item["uid"]);
1043 // Maybe its a body with a shared item? Then extract a global contact from it.
1044 poco_contact_from_body($item["body"], $item["received"], $item["contact-id"], $item["uid"]);
// count_common_friends: count the global contacts linked to contact $cid of user $uid
// that are also contacts of a user.
//
// Counted are glink rows (filtered by cid and uid) whose gcontact is not marked as
// failing (last_contact or updated is not older than last_failure) and whose
// normalised url appears among the non-self, non-blocked, non-hidden contacts selected
// by the subquery, excluding one contact id. Returns the total column of the first
// result row.
// NOTE(review): the values bound to the subquery placeholders are not visible here -
// presumably $uid and $cid, TODO confirm.
1047 function count_common_friends($uid,$cid) {
1049 $r = q("SELECT count(*) as `total`
1050 FROM `glink` INNER JOIN `gcontact` on `glink`.`gcid` = `gcontact`.`id`
1051 WHERE `glink`.`cid` = %d AND `glink`.`uid` = %d AND
1052 ((`gcontact`.`last_contact` >= `gcontact`.`last_failure`) OR (`gcontact`.`updated` >= `gcontact`.`last_failure`))
1053 AND `gcontact`.`nurl` IN (select nurl from contact where uid = %d and self = 0 and blocked = 0 and hidden = 0 and id != %d ) ",
1060 // logger("count_common_friends: $uid $cid {$r[0]['total']}");
1062 return $r[0]['total'];
// common_friends: list the global contacts that user $uid has in common with contact
// $cid.
//
// Selects all gcontact columns plus the id of the matching local contact (as cid),
// joining glink, gcontact and contact on the normalised url. Only non-self,
// non-blocked, non-hidden contacts are joined, one contact id is excluded, and failing
// gcontacts are filtered out. The result is ordered randomly or by name (presumably
// depending on $shuffle - the condition is not visible here) and paged with $start and
// $limit.
1068 function common_friends($uid,$cid,$start = 0,$limit=9999,$shuffle = false) {
1071 $sql_extra = " order by rand() ";
1073 $sql_extra = " order by `gcontact`.`name` asc ";
1075 $r = q("SELECT `gcontact`.*, `contact`.`id` AS `cid`
1077 INNER JOIN `gcontact` ON `glink`.`gcid` = `gcontact`.`id`
1078 INNER JOIN `contact` ON `gcontact`.`nurl` = `contact`.`nurl`
1079 WHERE `glink`.`cid` = %d and `glink`.`uid` = %d
1080 AND `contact`.`uid` = %d AND `contact`.`self` = 0 AND `contact`.`blocked` = 0
1081 AND `contact`.`hidden` = 0 AND `contact`.`id` != %d
1082 AND ((`gcontact`.`last_contact` >= `gcontact`.`last_failure`) OR (`gcontact`.`updated` >= `gcontact`.`last_failure`))
1083 $sql_extra LIMIT %d, %d",
/**
 * Count common friends for a link identified by `zcid` instead of `cid`/`uid`.
 *
 * Counts the `glink` rows with the given `zcid` whose global contact `nurl` also occurs
 * in `contact` for the given uid, ignoring rows flagged self, blocked or hidden.
 * Unlike count_common_friends(), this query has no `last_failure` filter and does not
 * exclude a particular contact id.
 *
 * NOTE(review): the values bound to the two %d placeholders and any guard for an empty
 * result are not visible in this excerpt - confirm against the full file.
 *
 * @param $uid  user id
 * @param $zcid value compared against `glink`.`zcid`
 * @return the `total` column of the first result row
 */
1097 function count_common_friends_zcid($uid,$zcid) {
1099 $r = q("SELECT count(*) as `total`
1100 FROM `glink` INNER JOIN `gcontact` on `glink`.`gcid` = `gcontact`.`id`
1101 where `glink`.`zcid` = %d
1102 and `gcontact`.`nurl` in (select nurl from contact where uid = %d and self = 0 and blocked = 0 and hidden = 0 ) ",
1108 return $r[0]['total'];
/**
 * Fetch the common friends for a link identified by `zcid`.
 *
 * Selects every `gcontact` column for the `glink` rows with the given `zcid` whose
 * `nurl` also occurs in `contact` for the given uid (rows flagged self, blocked or
 * hidden are ignored). Two ORDER BY clauses are prepared: random order, or
 * `gcontact`.`name` ascending.
 *
 * NOTE(review): the condition that picks the ordering (presumably $shuffle), the values
 * bound to the %d placeholders and the return statement are not visible in this
 * excerpt - confirm against the full file.
 *
 * @param $uid     user id
 * @param $zcid    value compared against `glink`.`zcid`
 * @param $start   defaults to 0; presumably the LIMIT offset - confirm
 * @param $limit   defaults to 9999; presumably the LIMIT row count - confirm
 * @param $shuffle defaults to false; presumably enables the random ordering - confirm
 */
1113 function common_friends_zcid($uid,$zcid,$start = 0, $limit = 9999,$shuffle = false) {
1116 $sql_extra = " order by rand() ";
1118 $sql_extra = " order by `gcontact`.`name` asc ";
// $sql_extra is interpolated into the statement text just before the LIMIT clause.
1120 $r = q("SELECT `gcontact`.*
1121 FROM `glink` INNER JOIN `gcontact` on `glink`.`gcid` = `gcontact`.`id`
1122 where `glink`.`zcid` = %d
1123 and `gcontact`.`nurl` in (select nurl from contact where uid = %d and self = 0 and blocked = 0 and hidden = 0 )
1124 $sql_extra limit %d, %d",
/**
 * Count all global contacts linked to a given contact of a given user.
 *
 * Counts the `glink` rows matching the `cid` and `uid` placeholders whose global
 * contact has `last_contact` or `updated` at least as recent as `last_failure`.
 *
 * NOTE(review): the values bound to the two %d placeholders and any guard for an empty
 * result are not visible in this excerpt - confirm against the full file.
 *
 * @param $uid user id
 * @param $cid contact id
 * @return the `total` column of the first result row
 */
1136 function count_all_friends($uid,$cid) {
1138 $r = q("SELECT count(*) as `total`
1139 FROM `glink` INNER JOIN `gcontact` on `glink`.`gcid` = `gcontact`.`id`
1140 where `glink`.`cid` = %d and `glink`.`uid` = %d AND
1141 ((`gcontact`.`last_contact` >= `gcontact`.`last_failure`) OR (`gcontact`.`updated` >= `gcontact`.`last_failure`))",
1147 return $r[0]['total'];
/**
 * Fetch one page of the global contacts linked to a given contact of a given user.
 *
 * Selects every `gcontact` column plus `contact`.`id` aliased as `cid`. The `contact`
 * table is attached with a LEFT JOIN on `nurl` and uid, so `cid` is NULL for global
 * contacts that have no matching local contact. Rows are restricted to global contacts
 * whose `last_contact` or `updated` is at least as recent as `last_failure`, ordered by
 * `gcontact`.`name` ascending and paged with LIMIT.
 *
 * NOTE(review): the values bound to the %d placeholders and the return statement are
 * not visible in this excerpt - confirm against the full file.
 *
 * @param $uid   user id
 * @param $cid   contact id
 * @param $start defaults to 0; presumably the LIMIT offset - confirm
 * @param $limit defaults to 80; presumably the LIMIT row count - confirm
 */
1153 function all_friends($uid,$cid,$start = 0, $limit = 80) {
1155 $r = q("SELECT `gcontact`.*, `contact`.`id` AS `cid`
1157 INNER JOIN `gcontact` on `glink`.`gcid` = `gcontact`.`id`
1158 LEFT JOIN `contact` ON `contact`.`nurl` = `gcontact`.`nurl` AND `contact`.`uid` = %d
1159 WHERE `glink`.`cid` = %d AND `glink`.`uid` = %d AND
1160 ((`gcontact`.`last_contact` >= `gcontact`.`last_failure`) OR (`gcontact`.`updated` >= `gcontact`.`last_failure`))
1161 ORDER BY `gcontact`.`name` ASC LIMIT %d, %d ",
/**
 * Build a list of contact suggestions for a user from the global contact table.
 *
 * Visible steps:
 *  1. Collect the networks to search: always NETWORK_DFRN, plus NETWORK_DIASPORA when
 *     `system.diaspora_enabled` is set and NETWORK_OSTATUS unless
 *     `system.ostatus_disabled` is set. The list is turned into a quoted,
 *     comma-separated string for an SQL IN (...) clause.
 *  2. First query: global contacts reachable through `glink` rows matching the uid
 *     placeholder, skipping those whose `nurl` or `name` already exists among the
 *     user's contacts and those listed in `gcign`. Grouped per global contact, ordered
 *     by `updated` and then by the number of links (`total`), both descending.
 *  3. Second query: global contacts linked by `glink` rows with uid, cid and zcid all
 *     0, using the same exclusions, in random order.
 *  4. Merge both results into $list keyed by `nurl`. The rows of the second query are
 *     inserted first, so rows of the first query overwrite duplicates.
 *
 * Both queries also require a non-zero `updated` timestamp, `last_contact` at least as
 * recent as `last_failure`, and a network from the list built in step 1.
 *
 * NOTE(review): several short lines are not visible in this excerpt: the values bound
 * to the placeholders, what happens when the size check after the first query
 * succeeds (presumably an early return of $r), the body of the final while loop
 * (presumably it trims $list down to $limit) and the return statement. Confirm against
 * the full file.
 *
 * @param $uid   user id
 * @param $start defaults to 0; presumably the LIMIT offset - confirm
 * @param $limit defaults to 80; used in the size checks below
 */
1174 function suggestion_query($uid, $start = 0, $limit = 80) {
1179 $network = array(NETWORK_DFRN);
1181 if (get_config('system','diaspora_enabled'))
1182 $network[] = NETWORK_DIASPORA;
1184 if (!get_config('system','ostatus_disabled'))
1185 $network[] = NETWORK_OSTATUS;
// Join with "', '" and wrap in single quotes so the result reads 'a', 'b', 'c'.
1187 $sql_network = implode("', '", $network);
1188 //$sql_network = "'".$sql_network."', ''";
1189 $sql_network = "'".$sql_network."'";
1191 $r = q("SELECT count(glink.gcid) as `total`, gcontact.* from gcontact
1192 INNER JOIN `glink` ON `glink`.`gcid` = `gcontact`.`id`
1193 where uid = %d and not gcontact.nurl in ( select nurl from contact where uid = %d )
1194 AND NOT `gcontact`.`name` IN (SELECT `name` FROM `contact` WHERE `uid` = %d)
1195 AND NOT `gcontact`.`id` IN (SELECT `gcid` FROM `gcign` WHERE `uid` = %d)
1196 AND `gcontact`.`updated` != '0000-00-00 00:00:00'
1197 AND `gcontact`.`last_contact` >= `gcontact`.`last_failure`
1198 AND `gcontact`.`network` IN (%s)
1199 GROUP BY `glink`.`gcid` ORDER BY `gcontact`.`updated` DESC,`total` DESC LIMIT %d, %d",
// True when the first query returned at least ($limit - 1) rows.
1209 if(count($r) && count($r) >= ($limit -1))
1212 $r2 = q("SELECT gcontact.* FROM gcontact
1213 INNER JOIN `glink` ON `glink`.`gcid` = `gcontact`.`id`
1214 WHERE `glink`.`uid` = 0 AND `glink`.`cid` = 0 AND `glink`.`zcid` = 0 AND NOT `gcontact`.`nurl` IN (SELECT `nurl` FROM `contact` WHERE `uid` = %d)
1215 AND NOT `gcontact`.`name` IN (SELECT `name` FROM `contact` WHERE `uid` = %d)
1216 AND NOT `gcontact`.`id` IN (SELECT `gcid` FROM `gcign` WHERE `uid` = %d)
1217 AND `gcontact`.`updated` != '0000-00-00 00:00:00'
1218 AND `gcontact`.`last_contact` >= `gcontact`.`last_failure`
1219 AND `gcontact`.`network` IN (%s)
1220 ORDER BY rand() LIMIT %d, %d",
// Key by nurl to de-duplicate; entries from $r are written last and therefore win.
1230 foreach ($r2 AS $suggestion)
1231 $list[$suggestion["nurl"]] = $suggestion;
1233 foreach ($r AS $suggestion)
1234 $list[$suggestion["nurl"]] = $suggestion;
1236 while (sizeof($list) > ($limit))
/**
 * Refresh the global contact data that contact suggestions are built from.
 *
 * Visible steps:
 *  1. Load the PortableContacts list of the local server (base URL + '/poco') and
 *     remember that URL in $done.
 *  2. When `system.directory` is configured, fetch "/pubsites" from get_server(),
 *     decode it as JSON and, for every entry, run poco_check_server() on its URL and
 *     load its '/poco' endpoint unless that URL is already in $done.
 *  3. Select the distinct `poco` URLs of all contacts on NETWORK_DFRN or
 *     NETWORK_DIASPORA, cut each URL at its last '/' and load the resulting base URL
 *     unless it is already in $done.
 *
 * NOTE(review): short lines are not visible in this excerpt, among them the
 * assignment of $a, the initialisation of $done and any checks on the fetched or
 * decoded data. In the visible lines only the local '/poco' URL is ever appended to
 * $done. Confirm against the full file.
 */
1242 function update_suggestions() {
1248 /// TODO Check if it is really necessary to poll the own server
1249 poco_load(0,0,0,$a->get_baseurl() . '/poco');
1251 $done[] = $a->get_baseurl() . '/poco';
1253 if(strlen(get_config('system','directory'))) {
1254 $x = fetch_url(get_server()."/pubsites");
1256 $j = json_decode($x);
1258 foreach($j->entries as $entry) {
1260 poco_check_server($entry->url);
1262 $url = $entry->url . '/poco';
1263 if(! in_array($url,$done))
1264 poco_load(0,0,0,$entry->url . '/poco');
1270 // Query your contacts from Friendica and Redmatrix/Hubzilla for their contacts
1271 $r = q("SELECT DISTINCT(`poco`) AS `poco` FROM `contact` WHERE `network` IN ('%s', '%s')",
1272 dbesc(NETWORK_DFRN), dbesc(NETWORK_DIASPORA)
1276 foreach($r as $rr) {
// Strip everything from the last '/' onwards to get the base of the poco URL.
1277 $base = substr($rr['poco'],0,strrpos($rr['poco'],'/'));
1278 if(! in_array($base,$done))
1279 poco_load(0,0,0,$base);
/**
 * Discover servers through the pod list published by the-federation.info.
 *
 * Reads the timestamp stored in the `poco` / `last_federation_discovery` config entry
 * and derives $next as that timestamp plus 24 hours. Then downloads pods.json, decodes
 * it, calls poco_check_server() with "https://" + host for every element of `pods`,
 * and finally stores the current time back into the config entry.
 *
 * NOTE(review): the lines that use $next (presumably an early return while the 24 hour
 * interval has not elapsed) and any check for a failed download are not visible in
 * this excerpt - confirm against the full file.
 */
1284 function poco_discover_federation() {
1285 $last = get_config('poco','last_federation_discovery');
// Earliest time of the next run: one day (24 * 60 * 60 seconds) after the last one.
1288 $next = $last + (24 * 60 * 60);
1293 $serverdata = fetch_url("http://the-federation.info/pods.json");
1298 $servers = json_decode($serverdata);
1300 foreach($servers->pods AS $server)
1301 poco_check_server("https://".$server->host);
1303 set_config('poco','last_federation_discovery', time());
/**
 * Query known servers for their PortableContacts data and store the results.
 *
 * Visible steps:
 *  1. Refresh the server list via poco_discover_federation().
 *  2. Read `system.poco_requery_days` and compute $last_update as "now minus that many
 *     days".
 *  3. Select, in random order, the `gserver` rows that have a non-empty `poco` URL,
 *     `last_contact` >= `last_failure` and `last_poco_query` older than $last_update.
 *  4. For each server:
 *      - re-check it with poco_check_server(); on failure only stamp `last_poco_query`,
 *      - fetch its user list and pass it to poco_discover_server() with default
 *        generation 2,
 *      - when `system.poco_discovery` > 1, also fetch the "@global" list restricted by
 *        updatedSince (derived from `system.poco_discovery_since`, in days),
 *      - when that did not succeed and `system.poco_discovery` > 2, fall back to
 *        poco_discover_server_users(),
 *      - stamp `last_poco_query` with datetime_convert().
 *     When the user list cannot be fetched, poco_check_server() is called again with
 *     a third argument of true and `last_poco_query` is stamped as well.
 *
 * NOTE(review): short lines are not visible in this excerpt, so the exact branch
 * structure (else / continue / break), the fallback values used when a config value
 * is 0, and the initial values of $success and $no_of_queries must be confirmed
 * against the full file.
 *
 * @param $complete defaults to false; when false the "--$no_of_queries == 0" test
 *                  below applies (its consequence is not visible here - presumably
 *                  it ends the loop)
 */
1307 function poco_discover($complete = false) {
1309 // Update the server list
1310 poco_discover_federation();
1314 $requery_days = intval(get_config("system", "poco_requery_days"));
1316 if ($requery_days == 0)
// Servers whose last poco query is older than this timestamp are queried again.
1319 $last_update = date("c", time() - (60 * 60 * 24 * $requery_days));
1321 $r = q("SELECT `poco`, `nurl`, `url`, `network` FROM `gserver` WHERE `last_contact` >= `last_failure` AND `poco` != '' AND `last_poco_query` < '%s' ORDER BY RAND()", dbesc($last_update));
1323 foreach ($r AS $server) {
1325 if (!poco_check_server($server["url"], $server["network"])) {
1326 // The server is not reachable? Okay, then we will try it later
1327 q("UPDATE `gserver` SET `last_poco_query` = '%s' WHERE `nurl` = '%s'", dbesc(datetime_convert()), dbesc($server["nurl"]));
1331 // Fetch all users from the other server
1332 $url = $server["poco"]."/?fields=displayName,urls,photos,updated,network,aboutMe,currentLocation,tags,gender,generation";
1334 logger("Fetch all users from the server ".$server["nurl"], LOGGER_DEBUG);
1336 $retdata = z_fetch_url($url);
1337 if ($retdata["success"]) {
1338 $data = json_decode($retdata["body"]);
1340 poco_discover_server($data, 2);
1342 if (get_config('system','poco_discovery') > 1) {
1344 $timeframe = get_config('system','poco_discovery_since');
1345 if ($timeframe == 0)
// NOTE(review): this value contains a space and is concatenated into the URL below
// without urlencode() - check whether the remote side accepts it in that form.
1348 $updatedSince = date("Y-m-d H:i:s", time() - $timeframe * 86400);
1350 // Fetch all global contacts from the other server (Not working with Redmatrix and Friendica versions before 3.3)
1351 $url = $server["poco"]."/@global?updatedSince=".$updatedSince."&fields=displayName,urls,photos,updated,network,aboutMe,currentLocation,tags,gender,generation";
1355 $retdata = z_fetch_url($url);
1356 if ($retdata["success"]) {
1357 logger("Fetch all global contacts from the server ".$server["nurl"], LOGGER_DEBUG);
1358 $success = poco_discover_server(json_decode($retdata["body"]));
// Fallback: walk the users from the first response ($data) and fetch each one's contacts.
1361 if (!$success AND (get_config('system','poco_discovery') > 2)) {
1362 logger("Fetch contacts from users of the server ".$server["nurl"], LOGGER_DEBUG);
1363 poco_discover_server_users($data, $server);
1367 q("UPDATE `gserver` SET `last_poco_query` = '%s' WHERE `nurl` = '%s'", dbesc(datetime_convert()), dbesc($server["nurl"]));
1368 if (!$complete AND (--$no_of_queries == 0))
1371 // If the server hadn't replied correctly, then force a sanity check
1372 poco_check_server($server["url"], $server["network"], true);
1374 // If we couldn't reach the server, we will try it some time later
1375 q("UPDATE `gserver` SET `last_poco_query` = '%s' WHERE `nurl` = '%s'", dbesc(datetime_convert()), dbesc($server["nurl"]));
/**
 * Fetch the contact lists of the individual users found in a server's poco response.
 *
 * For every element of $data->entry the URL of type 'profile' is taken from its `urls`
 * list and the last segment of that URL's path is used as the user name. For a
 * non-empty user name the contact list at <server poco URL>/<username>/ is fetched
 * and, on success, passed to poco_discover_server() with default generation 3.
 *
 * NOTE(review): what happens when $data->entry is missing (presumably an early return)
 * and whether $username is reset for every entry are not visible in this excerpt -
 * confirm against the full file.
 *
 * @param $data   decoded poco response; only its `entry` member is read here
 * @param $server server row; the keys "poco" and "nurl" are read here
 */
1380 function poco_discover_server_users($data, $server) {
1382 if (!isset($data->entry))
1385 foreach ($data->entry AS $entry) {
1387 if (isset($entry->urls)) {
1388 foreach($entry->urls as $url)
1389 if($url->type == 'profile') {
1390 $profile_url = $url->value;
1391 $urlparts = parse_url($profile_url);
// NOTE(review): end() takes its argument by reference; passing the result of
// explode() directly triggers "Only variables should be passed by reference".
1392 $username = end(explode("/", $urlparts["path"]));
1395 if ($username != "") {
1396 logger("Fetch contacts for the user ".$username." from the server ".$server["nurl"], LOGGER_DEBUG);
1398 // Fetch all contacts from a given user from the other server
1399 $url = $server["poco"]."/".$username."/?fields=displayName,urls,photos,updated,network,aboutMe,currentLocation,tags,gender,generation";
1401 $retdata = z_fetch_url($url);
1402 if ($retdata["success"])
1403 poco_discover_server(json_decode($retdata["body"]), 3);
/**
 * Store the profiles contained in a decoded poco response as global contacts.
 *
 * For every element of $data->entry the visible code extracts the display name, the
 * profile URL (urls entry of type 'profile'), the connect address (urls entry of type
 * 'webfinger' with the 'acct:' prefix removed), the profile photo, the update time
 * (normalised to "Y-m-d H:i:s"), network, location, about text (converted with
 * html2bbcode()), gender, generation and keywords. Entries whose resulting generation
 * is greater than 0 are handed to poco_check() with 0 for its last three arguments.
 *
 * Generation: starts at $default_generation; when the entry carries a generation
 * greater than 0, that value is incremented and used instead.
 *
 * NOTE(review): short lines are not visible in this excerpt, including the
 * initialisation of several per-entry variables, the handling of an empty or missing
 * entry list, and the end of the function with its return statement. The caller in
 * poco_discover() treats the return value as a success flag. Confirm against the
 * full file.
 *
 * @param $data               decoded poco response; only its `entry` member is read here
 * @param $default_generation defaults to 0; generation used for entries that carry none
 */
1408 function poco_discover_server($data, $default_generation = 0) {
1410 if (!isset($data->entry) OR !count($data->entry))
1415 foreach ($data->entry AS $entry) {
1417 $profile_photo = '';
1421 $updated = '0000-00-00 00:00:00';
1426 $generation = $default_generation;
1428 $name = $entry->displayName;
1430 if(isset($entry->urls)) {
1431 foreach($entry->urls as $url) {
1432 if($url->type == 'profile') {
1433 $profile_url = $url->value;
1436 if($url->type == 'webfinger') {
1437 $connect_url = str_replace('acct:' , '', $url->value);
1443 if(isset($entry->photos)) {
1444 foreach($entry->photos as $photo) {
1445 if($photo->type == 'profile') {
1446 $profile_photo = $photo->value;
1452 if(isset($entry->updated))
1453 $updated = date("Y-m-d H:i:s", strtotime($entry->updated));
1455 if(isset($entry->network))
1456 $network = $entry->network;
1458 if(isset($entry->currentLocation))
1459 $location = $entry->currentLocation;
1461 if(isset($entry->aboutMe))
1462 $about = html2bbcode($entry->aboutMe);
1464 if(isset($entry->gender))
1465 $gender = $entry->gender;
// The pre-increment also modifies $entry->generation itself.
1467 if(isset($entry->generation) AND ($entry->generation > 0))
1468 $generation = ++$entry->generation;
// NOTE(review): $keywords is overwritten on every iteration, so only the last element
// of $entry->tags survives, and implode() requires that element to be an array.
1470 if(isset($entry->tags))
1471 foreach($entry->tags as $tag)
1472 $keywords = implode(", ", $tag);
1474 if ($generation > 0) {
1477 logger("Store profile ".$profile_url, LOGGER_DEBUG);
1478 poco_check($profile_url, $name, $network, $profile_photo, $about, $location, $gender, $keywords, $connect_url, $updated, $generation, 0, 0, 0);
1479 logger("Done for profile ".$profile_url, LOGGER_DEBUG);