<?php
/**
- * @brief This class contain functions for probing URL
- *
- * To-Do:
- *
- * - OStatus links with index.php
- * - OStatus alias link
- * - Non absolute URL in feeds?
- * - Workaround for misconfigured Friendica servers?
+ * @file include/Probe.php
+ * @brief Functions for probing URL
*
*/
require_once('include/email.php');
require_once('include/network.php');
+/**
+ * @brief This class contains functions for probing URLs
+ *
+ */
class Probe {
/**
return false;
$xrd_data = array();
+
foreach ($links["xrd"]["link"] AS $value => $link) {
if (isset($link["@attributes"]))
$attributes = $link["@attributes"];
}
/**
- * @brief Fetch information about a given uri
+ * @brief Perform Webfinger lookup and return DFRN data
+ *
+ * Given an email style address, perform webfinger lookup and
+ * return the resulting DFRN profile URL, or if no DFRN profile URL
+ * is located, returns an OStatus subscription template (prefixed
+ * with the string 'stat:' to identify it as an OStatus template).
+ * If this isn't an email style address just return $webbie.
+ * Return an empty string if email-style addresses but webfinger fails,
+ * or if the resultant personal XRD doesn't contain a supported
+ * subscription/friend-request attribute.
+ *
+ * amended 7/9/2011 to return an hcard which could save potentially loading
+ * a lengthy content page to scrape dfrn attributes
+ *
+ * @param string $webbie Address that should be probed
+ * @param string $hcard Link to the hcard - is returned by reference
+ *
+ * @return string profile link
+ */
+
+ public static function webfinger_dfrn($webbie, &$hcard) {
+
+     $profile_link = '';
+
+     $links = self::lrdd($webbie);
+     logger('webfinger_dfrn: '.$webbie.':'.print_r($links,true), LOGGER_DATA);
+
+     // Anything other than an array means the lookup produced no usable links.
+     // Checking the type (instead of calling count()) keeps a failed lookup from
+     // reaching count()/foreach with a non-countable value.
+     if (!is_array($links))
+         return $profile_link;
+
+     foreach ($links as $link) {
+         // Skip entries that carry no relation type at all
+         if (!isset($link['@attributes']['rel']))
+             continue;
+
+         $attributes = $link['@attributes'];
+         $rel = $attributes['rel'];
+
+         // A DFRN profile URL always wins, even over an earlier OStatus template
+         if (($rel === NAMESPACE_DFRN) AND isset($attributes['href']))
+             $profile_link = $attributes['href'];
+
+         // The OStatus subscription template is only a fallback and is marked
+         // with the prefix 'stat:' so that the caller can tell it apart
+         if (($rel === NAMESPACE_OSTATUSSUB) AND ($profile_link == "") AND isset($attributes['template']))
+             $profile_link = 'stat:'.$attributes['template'];
+
+         // The hcard link is handed back through the reference parameter
+         if (($rel === 'http://microformats.org/profile/hcard') AND isset($attributes['href']))
+             $hcard = $attributes['href'];
+     }
+
+     return $profile_link;
+ }
+
+ /**
+ * @brief Check a URI for LRDD data
+ *
+ * This is a replacement for the "lrdd" function in include/network.php.
+ * It isn't used in this class and has some redundancies in the code.
+ * When time comes we can check the existing calls for "lrdd" if we can rework them.
+ *
+ * @param string $uri Address that should be probed
+ *
+ * @return array uri data
+ */
+ public static function lrdd($uri) {
+
+     // First attempt: use the address exactly as it was given
+     $lrdd = self::xrd($uri);
+
+     if (!$lrdd) {
+         $parts = @parse_url($uri);
+         if (!$parts)
+             return array();
+
+         // parse_url() leaves out components that are not present in the input,
+         // so fall back to empty strings instead of reading undefined indexes
+         $host = isset($parts["host"]) ? $parts["host"] : "";
+         $path = isset($parts["path"]) ? $parts["path"] : "";
+
+         $path_parts = explode("/", trim($path, "/"));
+
+         // Probe the bare host first, then append one path segment per round
+         // until a lookup succeeds or no segments are left
+         do {
+             $lrdd = self::xrd($host);
+             $host .= "/".array_shift($path_parts);
+         } while (!$lrdd AND (sizeof($path_parts) > 0));
+     }
+
+     if (!$lrdd OR !is_array($lrdd))
+         return array();
+
+     // Must be initialised: it is tested after the loop even when no
+     // lrdd template was found at all
+     $webfinger = false;
+
+     foreach ($lrdd AS $key => $link) {
+         if (!in_array($key, array("lrdd", "lrdd-xml", "lrdd-json")))
+             continue;
+
+         $path = str_replace('{uri}', urlencode($uri), $link);
+         $webfinger = self::webfinger($path);
+
+         // Some servers only answer when the address carries the "acct:" scheme
+         if (!$webfinger AND (strstr($uri, "@"))) {
+             $path = str_replace('{uri}', urlencode("acct:".$uri), $link);
+             $webfinger = self::webfinger($path);
+         }
+
+         // The first template that yields a result is sufficient
+         if ($webfinger)
+             break;
+     }
+
+     // Every failure path returns an empty array so that callers can always
+     // count() or iterate the result
+     if (!is_array($webfinger) OR !isset($webfinger["links"]) OR !is_array($webfinger["links"]))
+         return array();
+
+     $data = array();
+
+     // Wrap each link in the "@attributes" structure that callers read
+     foreach ($webfinger["links"] AS $link)
+         $data[] = array("@attributes" => $link);
+
+     // Aliases are optional; expose them as pseudo links with rel "alias"
+     if (isset($webfinger["aliases"]) AND is_array($webfinger["aliases"]))
+         foreach ($webfinger["aliases"] AS $alias)
+             $data[] = array("@attributes" =>
+                 array("rel" => "alias",
+                     "href" => $alias));
+
+     return $data;
+ }
+
+ /**
+ * @brief Fetch information (protocol endpoints and user information) about a given uri
*
* @param string $uri Address that should be probed
* @param string $network Test for this specific network
if ($cache) {
$result = Cache::get("probe_url:".$network.":".$uri);
if (!is_null($result)) {
- $result = unserialize($result);
return $result;
}
}
else
$data["photo"] = App::get_baseurl().'/images/person-175.jpg';
- if (!isset($data["name"]))
- $data["name"] = $data["url"];
+ if (!isset($data["name"]) OR ($data["name"] == "")) {
+ if (isset($data["nick"]))
+ $data["name"] = $data["nick"];
+
+ if ($data["name"] == "")
+ $data["name"] = $data["url"];
+ }
- if (!isset($data["nick"])) {
+ if (!isset($data["nick"]) OR ($data["nick"] == "")) {
$data["nick"] = strtolower($data["name"]);
if (strpos($data['nick'], ' '))
// Only store into the cache if the value seems to be valid
if (!in_array($data['network'], array(NETWORK_PHANTOM, NETWORK_MAIL))) {
- Cache::set("probe_url:".$network.":".$uri,serialize($data), CACHE_DAY);
+ Cache::set("probe_url:".$network.":".$uri, $data, CACHE_DAY);
/// @todo temporary fix - we need a real contact update function that updates only changing fields
/// The biggest problem is the avatar picture that could have a reduced image size.
}
/**
- * @brief Detect information about a given uri
+ * @brief Fetch information (protocol endpoints and user information) about a given uri
+ *
+ * This function is only called by the "uri" function that adds caching and rearranging of data.
*
* @param string $uri Address that should be probed
* @param string $network Test for this specific network
*/
private function detect($uri, $network, $uid) {
if (strstr($uri, '@')) {
- // If the URI starts with "mailto:" then jum directly to the mail detection
+ // If the URI starts with "mailto:" then jump directly to the mail detection
if (strpos($url,'mailto:') !== false) {
$uri = str_replace('mailto:', '', $url);
return self::mail($uri, $uid);
return array("network" => NETWORK_TWITTER);
$lrdd = self::xrd($host);
+
if (!$lrdd)
return self::mail($uri, $uid);
$path = str_replace('{uri}', urlencode($addr), $link);
$webfinger = self::webfinger($path);
+ // Mastodon needs to have it with "acct:"
+ if (!$webfinger) {
+ $path = str_replace('{uri}', urlencode("acct:".$addr), $link);
+ $webfinger = self::webfinger($path);
+ }
+
// If webfinger wasn't successful then try it with the URL - possibly in the format https://...
if (!$webfinger AND ($uri != $addr)) {
$path = str_replace('{uri}', urlencode($uri), $link);
}
/**
- * @brief Do a webfinger request
+ * @brief Perform a webfinger request.
+ *
+ * For details see RFC 7033: <https://tools.ietf.org/html/rfc7033>
*
* @param string $url Address that should be probed
*
}
/**
- * @brief Poll the noscrape page (Friendica specific)
+ * @brief Poll the Friendica specific noscrape page.
+ *
+ * "noscrape" is a faster alternative to fetch the data from the hcard.
+ * This functionality was originally created for the directory.
*
* @param string $noscrape Link to the noscrape page
* @param array $data The already fetched data
}
/**
- * @brief Fetch data from a DFRN profile page
+ * @brief Fetch data from a DFRN profile page and via "noscrape"
*
* @param string $profile Link to the profile page
*
*/
private function poll_hcard($hcard, $data, $dfrn = false) {
+ $content = fetch_url($hcard);
+ if (!$content)
+ return false;
+
$doc = new DOMDocument();
- if (!@$doc->loadHTMLFile($hcard))
+ if (!@$doc->loadHTML($content))
return false;
$xpath = new DomXPath($doc);
if (!is_object($vcards))
return false;
- if ($vcards->length == 0)
- return false;
+ if ($vcards->length > 0) {
+ $vcard = $vcards->item(0);
- $vcard = $vcards->item(0);
+ // We have to discard the guid from the hcard in favour of the guid from lrdd
+ // Reason: Hubzilla doesn't use the value "uid" in the hcard like Diaspora does.
+ $search = $xpath->query("//*[contains(concat(' ', @class, ' '), ' uid ')]", $vcard); // */
+ if (($search->length > 0) AND ($data["guid"] == ""))
+ $data["guid"] = $search->item(0)->nodeValue;
- // We have to discard the guid from the hcard in favour of the guid from lrdd
- // Reason: Hubzilla doesn't use the value "uid" in the hcard like Diaspora does.
- $search = $xpath->query("//*[contains(concat(' ', @class, ' '), ' uid ')]", $vcard); // */
- if (($search->length > 0) AND ($data["guid"] == ""))
- $data["guid"] = $search->item(0)->nodeValue;
+ $search = $xpath->query("//*[contains(concat(' ', @class, ' '), ' nickname ')]", $vcard); // */
+ if ($search->length > 0)
+ $data["nick"] = $search->item(0)->nodeValue;
- $search = $xpath->query("//*[contains(concat(' ', @class, ' '), ' nickname ')]", $vcard); // */
- if ($search->length > 0)
- $data["nick"] = $search->item(0)->nodeValue;
+ $search = $xpath->query("//*[contains(concat(' ', @class, ' '), ' fn ')]", $vcard); // */
+ if ($search->length > 0)
+ $data["name"] = $search->item(0)->nodeValue;
- $search = $xpath->query("//*[contains(concat(' ', @class, ' '), ' fn ')]", $vcard); // */
- if ($search->length > 0)
- $data["name"] = $search->item(0)->nodeValue;
+ $search = $xpath->query("//*[contains(concat(' ', @class, ' '), ' searchable ')]", $vcard); // */
+ if ($search->length > 0)
+ $data["searchable"] = $search->item(0)->nodeValue;
- $search = $xpath->query("//*[contains(concat(' ', @class, ' '), ' searchable ')]", $vcard); // */
- if ($search->length > 0)
- $data["searchable"] = $search->item(0)->nodeValue;
+ $search = $xpath->query("//*[contains(concat(' ', @class, ' '), ' key ')]", $vcard); // */
+ if ($search->length > 0) {
+ $data["pubkey"] = $search->item(0)->nodeValue;
+ if (strstr($data["pubkey"], 'RSA '))
+ $data["pubkey"] = rsatopem($data["pubkey"]);
+ }
- $search = $xpath->query("//*[contains(concat(' ', @class, ' '), ' key ')]", $vcard); // */
- if ($search->length > 0) {
- $data["pubkey"] = $search->item(0)->nodeValue;
- if (strstr($data["pubkey"], 'RSA '))
- $data["pubkey"] = rsatopem($data["pubkey"]);
+ $search = $xpath->query("//*[@id='pod_location']", $vcard); // */
+ if ($search->length > 0)
+ $data["baseurl"] = trim($search->item(0)->nodeValue, "/");
}
- $search = $xpath->query("//*[@id='pod_location']", $vcard); // */
- if ($search->length > 0)
- $data["baseurl"] = trim($search->item(0)->nodeValue, "/");
-
$avatar = array();
$photos = $xpath->query("//*[contains(concat(' ', @class, ' '), ' photo ') or contains(concat(' ', @class, ' '), ' avatar ')]", $vcard); // */
foreach ($photos AS $photo) {
isset($data["pubkey"]) AND ($hcard != "")) {
$data["network"] = NETWORK_DIASPORA;
+ // The Diaspora handle must always be lowercase
+ $data["addr"] = strtolower($data["addr"]);
+
// We have to overwrite the detected value for "notify" since Hubzilla doesn't send it
$data["notify"] = $data["baseurl"]."/receive/users/".$data["guid"];
$data["batch"] = $data["baseurl"]."/receive/public";
if (strstr($alias, "@"))
$data["addr"] = str_replace('acct:', '', $alias);
+ if (is_string($webfinger["subject"]) AND strstr($webfinger["subject"], "@"))
+ $data["addr"] = str_replace('acct:', '', $webfinger["subject"]);
+
$pubkey = "";
foreach ($webfinger["links"] AS $link) {
if (($link["rel"] == "http://webfinger.net/rel/profile-page") AND
$pubkey = substr($pubkey, strpos($pubkey, ',') + 1);
else
$pubkey = substr($pubkey, 5);
- } else
+ } elseif (normalise_link($pubkey) == 'http://')
$pubkey = fetch_url($pubkey);
$key = explode(".", $pubkey);