]> git.mxchange.org Git - friendica.git/blobdiff - include/discover_poco.php
Merge pull request #2682 from annando/1607-api-generic-xml
[friendica.git] / include / discover_poco.php
index c69e27fef1712d9d6edc157edcbe3d0d2845e48c..0b468faea189e522505ed5c686facd22be905406 100644 (file)
@@ -13,58 +13,202 @@ function discover_poco_run(&$argv, &$argc){
 
        if(is_null($db)) {
            @include(".htconfig.php");
-       require_once("include/dba.php");
+       require_once("include/dba.php");
            $db = new dba($db_host, $db_user, $db_pass, $db_data);
-       unset($db_host, $db_user, $db_pass, $db_data);
-       };
+       unset($db_host, $db_user, $db_pass, $db_data);
+       };
 
        require_once('include/session.php');
        require_once('include/datetime.php');
-       require_once('include/pidfile.php');
 
        load_config('config');
        load_config('system');
 
-       $maxsysload = intval(get_config('system','maxloadavg'));
-       if($maxsysload < 1)
-               $maxsysload = 50;
-       if(function_exists('sys_getloadavg')) {
-               $load = sys_getloadavg();
-               if(intval($load[0]) > $maxsysload) {
-                       logger('system: load ' . $load[0] . ' too high. discover_poco deferred to next scheduled run.');
+       // Don't check this stuff if the function is called by the poller
+       if (App::callstack() != "poller_run")
+               if (App::maxload_reached())
                        return;
+
+       if(($argc > 2) && ($argv[1] == "dirsearch")) {
+               $search = urldecode($argv[2]);
+               $mode = 1;
+       } elseif(($argc == 2) && ($argv[1] == "checkcontact")) {
+               $mode = 2;
+       } elseif(($argc == 2) && ($argv[1] == "suggestions")) {
+               $mode = 3;
+       } elseif ($argc == 1) {
+               $search = "";
+               $mode = 0;
+       } else
+               die("Unknown or missing parameter ".$argv[1]."\n");
+
+       // Don't check this stuff if the function is called by the poller
+       if (App::callstack() != "poller_run")
+               if (App::is_already_running('discover_poco'.$mode.urlencode($search), 'include/discover_poco.php', 1140))
+                       return;
+
+       $a->set_baseurl(get_config('system','url'));
+
+       load_hooks();
+
+       logger('start '.$search);
+
+       if ($mode==3)
+               update_suggestions();
+       elseif (($mode == 2) AND get_config('system','poco_completion'))
+               discover_users();
+       elseif (($mode == 1) AND ($search != "") and get_config('system','poco_local_search')) {
+               discover_directory($search);
+               gs_search_user($search);
+       } elseif (($mode == 0) AND ($search == "") and (get_config('system','poco_discovery') > 0)) {
+               // Query Friendica and Hubzilla servers for their users
+               poco_discover();
+
+               // Query GNU Social servers for their users ("statistics" addon has to be enabled on the GS server)
+               if (!get_config('system','ostatus_disabled'))
+                       gs_discover();
+       }
+
+       logger('end '.$search);
+
+       return;
+}
+
+function discover_users() {
+       logger("Discover users", LOGGER_DEBUG);
+
+       $users = q("SELECT `url`, `created`, `updated`, `last_failure`, `last_contact`, `server_url` FROM `gcontact`
+                       WHERE `last_contact` < UTC_TIMESTAMP - INTERVAL 1 MONTH AND
+                               `last_failure` < UTC_TIMESTAMP - INTERVAL 1 MONTH AND
+                               `network` IN ('%s', '%s', '%s', '%s', '') ORDER BY rand()",
+                       dbesc(NETWORK_DFRN), dbesc(NETWORK_DIASPORA),
+                       dbesc(NETWORK_OSTATUS), dbesc(NETWORK_FEED));
+
+       if (!$users)
+               return;
+
+       $checked = 0;
+
+       foreach ($users AS $user) {
+
+               $urlparts = parse_url($user["url"]);
+               if (!isset($urlparts["scheme"])) {
+                       q("UPDATE `gcontact` SET `network` = '%s' WHERE `nurl` = '%s'",
+                               dbesc(NETWORK_PHANTOM), dbesc(normalise_link($user["url"])));
+                       continue;
+                }
+
+               if (in_array($urlparts["host"], array("www.facebook.com", "facebook.com", "twitter.com",
+                                                       "identi.ca", "alpha.app.net"))) {
+                       $networks = array("www.facebook.com" => NETWORK_FACEBOOK,
+                                       "facebook.com" => NETWORK_FACEBOOK,
+                                       "twitter.com" => NETWORK_TWITTER,
+                                       "identi.ca" => NETWORK_PUMPIO,
+                                       "alpha.app.net" => NETWORK_APPNET);
+
+                       q("UPDATE `gcontact` SET `network` = '%s' WHERE `nurl` = '%s'",
+                               dbesc($networks[$urlparts["host"]]), dbesc(normalise_link($user["url"])));
+                       continue;
                }
+
+               if ($user["server_url"] != "")
+                       $server_url = $user["server_url"];
+               else
+                       $server_url = poco_detect_server($user["url"]);
+
+               if (($server_url == "") OR poco_check_server($server_url, $gcontacts[0]["network"])) {
+                       logger('Check user '.$user["url"]);
+                       poco_last_updated($user["url"], true);
+
+                       if (++$checked > 100)
+                               return;
+               } else
+                       q("UPDATE `gcontact` SET `last_failure` = '%s' WHERE `nurl` = '%s'",
+                               dbesc(datetime_convert()), dbesc(normalise_link($user["url"])));
        }
+}
+
+function discover_directory($search) {
 
-       $lockpath = get_lockpath();
-       if ($lockpath != '') {
-               $pidfile = new pidfile($lockpath, 'discover_poco');
-               if($pidfile->is_already_running()) {
-                       logger("discover_poco: Already running");
-                       if ($pidfile->running_time() > 19*60) {
-                                $pidfile->kill();
-                                logger("discover_poco: killed stale process");
-                               // Calling a new instance
-                               proc_run('php','include/discover_poco.php');
-                        }
-                       exit;
+       $data = Cache::get("dirsearch:".$search);
+       if (!is_null($data)){
+               // Only search for the same item every 24 hours
+               if (time() < $data + (60 * 60 * 24)) {
+                       logger("Already searched for ".$search." in the last 24 hours", LOGGER_DEBUG);
+                       return;
                }
        }
 
-       $a->set_baseurl(get_config('system','url'));
+       $x = fetch_url(get_server()."/lsearch?p=1&n=500&search=".urlencode($search));
+       $j = json_decode($x);
+
+       if(count($j->results))
+               foreach($j->results as $jj) {
+                       // Check if the contact already exists
+                       $exists = q("SELECT `id`, `last_contact`, `last_failure`, `updated` FROM `gcontact` WHERE `nurl` = '%s'", normalise_link($jj->url));
+                       if ($exists) {
+                               logger("Profile ".$jj->url." already exists (".$search.")", LOGGER_DEBUG);
+
+                               if (($exists[0]["last_contact"] < $exists[0]["last_failure"]) AND
+                                       ($exists[0]["updated"] < $exists[0]["last_failure"]))
+                                       continue;
+
+                               // Update the contact
+                               poco_last_updated($jj->url);
+                               continue;
+                       }
+
+                       // Harcoded paths aren't so good. But in this case it is okay.
+                       // First: We only will get Friendica contacts (which always are using this url schema)
+                       // Second: There will be no further problems if we are doing a mistake
+                       $server_url = preg_replace("=(https?://)(.*)/profile/(.*)=ism", "$1$2", $jj->url);
+                       if ($server_url != $jj->url)
+                               if (!poco_check_server($server_url)) {
+                                       logger("Friendica server ".$server_url." doesn't answer.", LOGGER_DEBUG);
+                                       continue;
+                               }
+                                       logger("Friendica server ".$server_url." seems to be okay.", LOGGER_DEBUG);
+
+                       logger("Check if profile ".$jj->url." is reachable (".$search.")", LOGGER_DEBUG);
+                       $data = probe_url($jj->url);
+                       if ($data["network"] == NETWORK_DFRN) {
+                               logger("Add profile ".$jj->url." to local directory (".$search.")", LOGGER_DEBUG);
+                               poco_check($data["url"], $data["name"], $data["network"], $data["photo"], "", "", "", $jj->tags, $data["addr"], "", 0);
+                       }
+               }
+       Cache::set("dirsearch:".$search, time(), CACHE_DAY);
+}
 
-       load_hooks();
+/**
+ * @brief Search for GNU Social user with gstools.org
+ *
+ * @param str $search User name
+ */
+function gs_search_user($search) {
 
-       logger('start');
+       $a = get_app();
 
-       if (get_config('system','poco_discovery') > 0)
-               poco_discover();
+       $url = "http://gstools.org/api/users_search/".urlencode($search);
 
-       logger('end');
+       $result = z_fetch_url($url);
+       if (!$result["success"])
+               return false;
 
-       return;
+       $contacts = json_decode($result["body"]);
+
+       if ($contacts->status == 'ERROR')
+               return false;
+
+       foreach($contacts->data AS $user) {
+               $contact = probe_url($user->site_address."/".$user->name);
+               if ($contact["network"] != NETWORK_PHANTOM) {
+                       $contact["about"] = $user->description;
+                       update_gcontact($contact);
+               }
+       }
 }
 
+
 if (array_search(__file__,get_included_files())===0){
   discover_poco_run($_SERVER["argv"],$_SERVER["argc"]);
   killme();