]> git.mxchange.org Git - friendica.git/blobdiff - include/Probe.php
Workaround for vanished database connections while authentication
[friendica.git] / include / Probe.php
index 8a606ecaef5f43309b752acc1a4e965de7ffe728..14e8d5bcad8ab2593547a100bb12c3fa09a365bf 100644 (file)
@@ -1,13 +1,7 @@
 <?php
 /**
- * @brief This class contain functions for probing URL
- *
- * To-Do:
- *
- * - OStatus links with index.php
- * - OStatus alias link
- * - Non absolute URL in feeds?
- * - Workaround for misconfigured Friendica servers?
+ * @file include/Probe.php
+ * @brief Functions for probing URL
  *
  */
 
@@ -18,6 +12,10 @@ require_once("include/feed.php");
 require_once('include/email.php');
 require_once('include/network.php');
 
+/**
+ * @brief This class contain functions for probing URL
+ *
+ */
 class Probe {
 
        /**
@@ -77,6 +75,7 @@ class Probe {
                        return false;
 
                $xrd_data = array();
+
                foreach ($links["xrd"]["link"] AS $value => $link) {
                        if (isset($link["@attributes"]))
                                $attributes = $link["@attributes"];
@@ -98,7 +97,113 @@ class Probe {
        }
 
        /**
-        * @brief Fetch information about a given uri
+        * @brief Perform Webfinger lookup and return DFRN data
+        *
+        * Given an email style address, perform webfinger lookup and
+        * return the resulting DFRN profile URL, or if no DFRN profile URL
+        * is located, returns an OStatus subscription template (prefixed
+        * with the string 'stat:' to identify it as on OStatus template).
+        * If this isn't an email style address just return $webbie.
+        * Return an empty string if email-style addresses but webfinger fails,
+        * or if the resultant personal XRD doesn't contain a supported
+        * subscription/friend-request attribute.
+        *
+        * amended 7/9/2011 to return an hcard which could save potentially loading
+        * a lengthy content page to scrape dfrn attributes
+        *
+        * @param string $webbie Address that should be probed
+        * @param string $hcard Link to the hcard - is returned by reference
+        *
+        * @return string profile link
+        */
+
+       public static function webfinger_dfrn($webbie, &$hcard) {
+
+               $profile_link = '';
+
+               $links = self::lrdd($webbie);
+               logger('webfinger_dfrn: '.$webbie.':'.print_r($links,true), LOGGER_DATA);
+               if (count($links)) {
+                       foreach ($links as $link) {
+                               if ($link['@attributes']['rel'] === NAMESPACE_DFRN)
+                                       $profile_link = $link['@attributes']['href'];
+                               if (($link['@attributes']['rel'] === NAMESPACE_OSTATUSSUB) AND ($profile_link == ""))
+                                       $profile_link = 'stat:'.$link['@attributes']['template'];
+                               if ($link['@attributes']['rel'] === 'http://microformats.org/profile/hcard')
+                                       $hcard = $link['@attributes']['href'];
+                       }
+               }
+               return $profile_link;
+       }
+
+       /**
+        * @brief Check an URI for LRDD data
+        *
+        * this is a replacement for the "lrdd" function in include/network.php.
+        * It isn't used in this class and has some redundancies in the code.
+        * When time comes we can check the existing calls for "lrdd" if we can rework them.
+        *
+        * @param string $uri Address that should be probed
+        *
+        * @return array uri data
+        */
+       public static function lrdd($uri) {
+
+               $lrdd = self::xrd($uri);
+
+               if (!$lrdd) {
+                       $parts = @parse_url($uri);
+                       if (!$parts)
+                               return array();
+
+                       $host = $parts["host"];
+
+                       $path_parts = explode("/", trim($parts["path"], "/"));
+
+                       do {
+                               $lrdd = self::xrd($host);
+                               $host .= "/".array_shift($path_parts);
+                       } while (!$lrdd AND (sizeof($path_parts) > 0));
+               }
+
+               if (!$lrdd)
+                       return array();
+
+               foreach ($lrdd AS $key => $link) {
+                       if ($webfinger)
+                               continue;
+
+                       if (!in_array($key, array("lrdd", "lrdd-xml", "lrdd-json")))
+                               continue;
+
+                       $path = str_replace('{uri}', urlencode($uri), $link);
+                       $webfinger = self::webfinger($path);
+
+                       if (!$webfinger AND (strstr($uri, "@"))) {
+                               $path = str_replace('{uri}', urlencode("acct:".$uri), $link);
+                               $webfinger = self::webfinger($path);
+                       }
+               }
+
+               if (!is_array($webfinger["links"]))
+                       return false;
+
+               $data = array();
+
+               foreach ($webfinger["links"] AS $link)
+                       $data[] = array("@attributes" => $link);
+
+               if (is_array($webfinger["aliases"]))
+                       foreach ($webfinger["aliases"] AS $alias)
+                               $data[] = array("@attributes" =>
+                                                       array("rel" => "alias",
+                                                               "href" => $alias));
+
+               return $data;
+       }
+
+       /**
+        * @brief Fetch information (protocol endpoints and user information) about a given uri
         *
         * @param string $uri Address that should be probed
         * @param string $network Test for this specific network
@@ -112,7 +217,6 @@ class Probe {
                if ($cache) {
                        $result = Cache::get("probe_url:".$network.":".$uri);
                        if (!is_null($result)) {
-                               $result = unserialize($result);
                                return $result;
                        }
                }
@@ -130,10 +234,15 @@ class Probe {
                else
                        $data["photo"] = App::get_baseurl().'/images/person-175.jpg';
 
-               if (!isset($data["name"]))
-                       $data["name"] = $data["url"];
+               if (!isset($data["name"]) OR ($data["name"] == "")) {
+                       if (isset($data["nick"]))
+                               $data["name"] = $data["nick"];
 
-               if (!isset($data["nick"])) {
+                       if ($data["name"] == "")
+                               $data["name"] = $data["url"];
+               }
+
+               if (!isset($data["nick"]) OR ($data["nick"] == "")) {
                        $data["nick"] = strtolower($data["name"]);
 
                        if (strpos($data['nick'], ' '))
@@ -147,7 +256,7 @@ class Probe {
 
                // Only store into the cache if the value seems to be valid
                if (!in_array($data['network'], array(NETWORK_PHANTOM, NETWORK_MAIL))) {
-                       Cache::set("probe_url:".$network.":".$uri,serialize($data), CACHE_DAY);
+                       Cache::set("probe_url:".$network.":".$uri, $data, CACHE_DAY);
 
                        /// @todo temporary fix - we need a real contact update function that updates only changing fields
                        /// The biggest problem is the avatar picture that could have a reduced image size.
@@ -172,7 +281,9 @@ class Probe {
        }
 
        /**
-        * @brief Detect information about a given uri
+        * @brief Fetch information (protocol endpoints and user information) about a given uri
+        *
+        * This function is only called by the "uri" function that adds caching and rearranging of data.
         *
         * @param string $uri Address that should be probed
         * @param string $network Test for this specific network
@@ -182,7 +293,7 @@ class Probe {
         */
        private function detect($uri, $network, $uid) {
                if (strstr($uri, '@')) {
-                       // If the URI starts with "mailto:" then jum directly to the mail detection
+                       // If the URI starts with "mailto:" then jump directly to the mail detection
                        if (strpos($url,'mailto:') !== false) {
                                $uri = str_replace('mailto:', '', $url);
                                return self::mail($uri, $uid);
@@ -201,6 +312,7 @@ class Probe {
                                return array("network" => NETWORK_TWITTER);
 
                        $lrdd = self::xrd($host);
+
                        if (!$lrdd)
                                return self::mail($uri, $uid);
 
@@ -247,6 +359,12 @@ class Probe {
                        $path = str_replace('{uri}', urlencode($addr), $link);
                        $webfinger = self::webfinger($path);
 
+                       // Mastodon needs to have it with "acct:"
+                       if (!$webfinger) {
+                               $path = str_replace('{uri}', urlencode("acct:".$addr), $link);
+                               $webfinger = self::webfinger($path);
+                       }
+
                        // If webfinger wasn't successful then try it with the URL - possibly in the format https://...
                        if (!$webfinger AND ($uri != $addr)) {
                                $path = str_replace('{uri}', urlencode($uri), $link);
@@ -299,7 +417,9 @@ class Probe {
        }
 
        /**
-        * @brief Do a webfinger request
+        * @brief Perform a webfinger request.
+        *
+        * For details see RFC 7033: <https://tools.ietf.org/html/rfc7033>
         *
         * @param string $url Address that should be probed
         *
@@ -351,7 +471,10 @@ class Probe {
        }
 
        /**
-        * @brief Poll the noscrape page (Friendica specific)
+        * @brief Poll the Friendica specific noscrape page.
+        *
+        * "noscrape" is a faster alternative to fetch the data from the hcard.
+        * This functionality was originally created for the directory.
         *
         * @param string $noscrape Link to the noscrape page
         * @param array $data The already fetched data
@@ -436,7 +559,7 @@ class Probe {
        }
 
        /**
-        * @brief Fetch data from a DFRN profile page
+        * @brief Fetch data from a DFRN profile page and via "noscrape"
         *
         * @param string $profile Link to the profile page
         *
@@ -446,6 +569,8 @@ class Probe {
 
                $data = array();
 
+               logger("Check profile ".$profile, LOGGER_DEBUG);
+
                // Fetch data via noscrape - this is faster
                $noscrape = str_replace(array("/hcard/", "/profile/"), "/noscrape/", $profile);
                $data = self::poll_noscrape($noscrape, $data);
@@ -468,6 +593,8 @@ class Probe {
                $prof_data["fn"] = $data["name"];
                $prof_data["key"] = $data["pubkey"];
 
+               logger("Result for profile ".$profile.": ".print_r($prof_data, true), LOGGER_DEBUG);
+
                return $prof_data;
        }
 
@@ -537,8 +664,12 @@ class Probe {
         */
        private function poll_hcard($hcard, $data, $dfrn = false) {
 
+               $content = fetch_url($hcard);
+               if (!$content)
+                       return false;
+
                $doc = new DOMDocument();
-               if (!@$doc->loadHTMLFile($hcard))
+               if (!@$doc->loadHTML($content))
                        return false;
 
                $xpath = new DomXPath($doc);
@@ -547,40 +678,39 @@ class Probe {
                if (!is_object($vcards))
                        return false;
 
-               if ($vcards->length == 0)
-                       return false;
+               if ($vcards->length > 0) {
+                       $vcard = $vcards->item(0);
 
-               $vcard = $vcards->item(0);
+                       // We have to discard the guid from the hcard in favour of the guid from lrdd
+                       // Reason: Hubzilla doesn't use the value "uid" in the hcard like Diaspora does.
+                       $search = $xpath->query("//*[contains(concat(' ', @class, ' '), ' uid ')]", $vcard); // */
+                       if (($search->length > 0) AND ($data["guid"] == ""))
+                               $data["guid"] = $search->item(0)->nodeValue;
 
-               // We have to discard the guid from the hcard in favour of the guid from lrdd
-               // Reason: Hubzilla doesn't use the value "uid" in the hcard like Diaspora does.
-               $search = $xpath->query("//*[contains(concat(' ', @class, ' '), ' uid ')]", $vcard); // */
-               if (($search->length > 0) AND ($data["guid"] == ""))
-                       $data["guid"] = $search->item(0)->nodeValue;
+                       $search = $xpath->query("//*[contains(concat(' ', @class, ' '), ' nickname ')]", $vcard); // */
+                       if ($search->length > 0)
+                               $data["nick"] = $search->item(0)->nodeValue;
 
-               $search = $xpath->query("//*[contains(concat(' ', @class, ' '), ' nickname ')]", $vcard); // */
-               if ($search->length > 0)
-                       $data["nick"] = $search->item(0)->nodeValue;
+                       $search = $xpath->query("//*[contains(concat(' ', @class, ' '), ' fn ')]", $vcard); // */
+                       if ($search->length > 0)
+                               $data["name"] = $search->item(0)->nodeValue;
 
-               $search = $xpath->query("//*[contains(concat(' ', @class, ' '), ' fn ')]", $vcard); // */
-               if ($search->length > 0)
-                       $data["name"] = $search->item(0)->nodeValue;
+                       $search = $xpath->query("//*[contains(concat(' ', @class, ' '), ' searchable ')]", $vcard); // */
+                       if ($search->length > 0)
+                               $data["searchable"] = $search->item(0)->nodeValue;
 
-               $search = $xpath->query("//*[contains(concat(' ', @class, ' '), ' searchable ')]", $vcard); // */
-               if ($search->length > 0)
-                       $data["searchable"] = $search->item(0)->nodeValue;
+                       $search = $xpath->query("//*[contains(concat(' ', @class, ' '), ' key ')]", $vcard); // */
+                       if ($search->length > 0) {
+                               $data["pubkey"] = $search->item(0)->nodeValue;
+                               if (strstr($data["pubkey"], 'RSA '))
+                                       $data["pubkey"] = rsatopem($data["pubkey"]);
+                       }
 
-               $search = $xpath->query("//*[contains(concat(' ', @class, ' '), ' key ')]", $vcard); // */
-               if ($search->length > 0) {
-                       $data["pubkey"] = $search->item(0)->nodeValue;
-                       if (strstr($data["pubkey"], 'RSA '))
-                               $data["pubkey"] = rsatopem($data["pubkey"]);
+                       $search = $xpath->query("//*[@id='pod_location']", $vcard); // */
+                       if ($search->length > 0)
+                               $data["baseurl"] = trim($search->item(0)->nodeValue, "/");
                }
 
-               $search = $xpath->query("//*[@id='pod_location']", $vcard); // */
-               if ($search->length > 0)
-                       $data["baseurl"] = trim($search->item(0)->nodeValue, "/");
-
                $avatar = array();
                $photos = $xpath->query("//*[contains(concat(' ', @class, ' '), ' photo ') or contains(concat(' ', @class, ' '), ' avatar ')]", $vcard); // */
                foreach ($photos AS $photo) {
@@ -674,6 +804,9 @@ class Probe {
                        isset($data["pubkey"]) AND ($hcard != "")) {
                        $data["network"] = NETWORK_DIASPORA;
 
+                       // The Diaspora handle must always be lowercase
+                       $data["addr"] = strtolower($data["addr"]);
+
                        // We have to overwrite the detected value for "notify" since Hubzilla doesn't send it
                        $data["notify"] = $data["baseurl"]."/receive/users/".$data["guid"];
                        $data["batch"] = $data["baseurl"]."/receive/public";
@@ -698,6 +831,9 @@ class Probe {
                                if (strstr($alias, "@"))
                                        $data["addr"] = str_replace('acct:', '', $alias);
 
+               if (is_string($webfinger["subject"]) AND strstr($webfinger["subject"], "@"))
+                       $data["addr"] = str_replace('acct:', '', $webfinger["subject"]);
+
                $pubkey = "";
                foreach ($webfinger["links"] AS $link) {
                        if (($link["rel"] == "http://webfinger.net/rel/profile-page") AND
@@ -715,7 +851,7 @@ class Probe {
                                                $pubkey = substr($pubkey, strpos($pubkey, ',') + 1);
                                        else
                                                $pubkey = substr($pubkey, 5);
-                               } else
+                               } elseif (normalise_link($pubkey) == 'http://')
                                        $pubkey = fetch_url($pubkey);
 
                                $key = explode(".", $pubkey);