2017-11-18 11:02:46 +00:00
|
|
|
<?php
|
|
|
|
/**
|
|
|
|
* @file src/Worker/DiscoverPoCo.php
|
|
|
|
*/
|
|
|
|
namespace Friendica\Worker;
|
|
|
|
|
|
|
|
use Friendica\Core\Cache;
|
|
|
|
use Friendica\Core\Config;
|
2018-08-11 20:40:44 +00:00
|
|
|
use Friendica\Core\Protocol;
|
2017-11-18 11:02:46 +00:00
|
|
|
use Friendica\Core\Worker;
|
2018-07-20 12:19:26 +00:00
|
|
|
use Friendica\Database\DBA;
|
2017-12-07 14:09:28 +00:00
|
|
|
use Friendica\Model\GContact;
|
2017-11-18 11:02:46 +00:00
|
|
|
use Friendica\Network\Probe;
|
|
|
|
use Friendica\Protocol\PortableContact;
|
2018-01-27 02:38:34 +00:00
|
|
|
use Friendica\Util\DateTimeFormat;
|
2018-01-27 04:09:48 +00:00
|
|
|
use Friendica\Util\Network;
|
2017-11-18 11:02:46 +00:00
|
|
|
|
2018-07-10 02:39:59 +00:00
|
|
|
/**
 * Worker that discovers and refreshes global contacts and servers.
 *
 * All work is started through execute(); the private methods implement the
 * individual commands.
 */
class DiscoverPoCo
{
	/**
	 * @brief Runs the discovery task selected by $command
	 *
	 * This function can be called in these ways:
	 * - (no command): If `system.poco_discovery` is greater than 0, calls
	 *   PortableContact::discover() and - unless `system.ostatus_disabled`
	 *   is set - GContact::discoverGsUsers().
	 * - dirsearch <search pattern>: Searches for "search pattern" in the directory.
	 *   "search pattern" is url encoded. Only runs when `system.poco_local_search` is set.
	 * - checkcontact: Updates gcontact entries. Only runs when `system.poco_completion` is set.
	 * - suggestions: Calls GContact::updateSuggestions().
	 * - server <server url>: Checks the given server. The url is passed in plain
	 *   text (it is NOT decoded here) and is ignored unless its normalised
	 *   form starts with "http://".
	 * - update_server: Frequently check up to 250 servers for vitality.
	 * - update_server_directory <id>: Discover the given server id for their contacts.
	 * - load <int> <int> <int> [<url>]: Load POCO data via PortableContact::load().
	 *   The first three parameters are cast to integers, the fourth is an optional url.
	 * - check_profile <profile url>: Update remote profile data.
	 *
	 * Any other non-empty command is logged and ignored.
	 *
	 * @param string $command Name of the task, see the list above
	 * @param string $param1  First task parameter
	 * @param string $param2  Second task parameter (only used by "load")
	 * @param string $param3  Third task parameter (only used by "load")
	 * @param string $param4  Fourth task parameter (only used by "load")
	 *
	 * @return void
	 */
	/// @todo Clean up this mess of a parameter hell and split it in several classes
	public static function execute($command = '', $param1 = '', $param2 = '', $param3 = '', $param4 = '')
	{
		$search = "";
		$mode = 0;

		// Translate the command into a numeric mode; mode 0 means "no command given"
		if ($command == "dirsearch") {
			$search = urldecode($param1);
			$mode = 1;
		} elseif ($command == "checkcontact") {
			$mode = 2;
		} elseif ($command == "suggestions") {
			$mode = 3;
		} elseif ($command == "server") {
			$mode = 4;
		} elseif ($command == "update_server") {
			$mode = 5;
		} elseif ($command == "update_server_directory") {
			$mode = 6;
		} elseif ($command == "load") {
			$mode = 7;
		} elseif ($command == "check_profile") {
			$mode = 8;
		} elseif ($command !== "") {
			logger("Unknown or missing parameter ".$command."\n");
			return;
		}

		logger('start '.$search);

		if ($mode == 8) {
			if ($param1 != "") {
				PortableContact::lastUpdated($param1, true);
			}
		} elseif ($mode == 7) {
			$url = !empty($param4) ? $param4 : '';

			PortableContact::load(intval($param1), intval($param2), intval($param3), $url);
		} elseif ($mode == 6) {
			PortableContact::discoverSingleServer(intval($param1));
		} elseif ($mode == 5) {
			self::updateServer();
		} elseif ($mode == 4) {
			$server_url = $param1;
			if ($server_url == "") {
				return;
			}

			$server_url = filter_var($server_url, FILTER_SANITIZE_URL);

			// Only accept urls whose normalised form is a plain http url
			if (substr(normalise_link($server_url), 0, 7) != "http://") {
				return;
			}

			$result = "Checking server ".$server_url." - ";
			$result .= PortableContact::checkServer($server_url) ? "success" : "failed";

			logger($result, LOGGER_DEBUG);
		} elseif ($mode == 3) {
			GContact::updateSuggestions();
		} elseif (($mode == 2) && Config::get('system', 'poco_completion')) {
			self::discoverUsers();
		} elseif (($mode == 1) && ($search != "") && Config::get('system', 'poco_local_search')) {
			self::discoverDirectory($search);
			self::gsSearchUser($search);
		} elseif (($mode == 0) && ($search == "") && (Config::get('system', 'poco_discovery') > 0)) {
			// Query Friendica and Hubzilla servers for their users
			PortableContact::discover();

			// Query GNU Social servers for their users ("statistics" addon has to be enabled on the GS server)
			if (!Config::get('system', 'ostatus_disabled')) {
				GContact::discoverGsUsers();
			}
		}

		logger('end '.$search);
	}

	/**
	 * @brief Queues a status check for up to 250 servers
	 *
	 * The servers are read in random order. For every server for which
	 * PortableContact::updateNeeded() reports that an update is due, a low
	 * priority "server" task is added to the worker queue.
	 *
	 * @return void
	 */
	private static function updateServer()
	{
		$servers = q("SELECT `url`, `created`, `last_failure`, `last_contact` FROM `gserver` ORDER BY rand()");

		if (!DBA::isResult($servers)) {
			return;
		}

		$updated = 0;

		foreach ($servers as $server) {
			if (!PortableContact::updateNeeded($server["created"], "", $server["last_failure"], $server["last_contact"])) {
				continue;
			}

			logger('Update server status for server '.$server["url"], LOGGER_DEBUG);

			Worker::add(PRIORITY_LOW, "DiscoverPoCo", "server", $server["url"]);

			// Stop once exactly 250 servers have been queued
			if (++$updated >= 250) {
				return;
			}
		}
	}

	/**
	 * @brief Queues profile checks for global contacts that were not seen for a month
	 *
	 * Selects, in random order, the global contacts of the DFRN, Diaspora,
	 * OStatus and feed networks (or without any network) whose last contact
	 * and last failure are both older than one month. For each of them:
	 * - urls without a scheme are marked as phantom contacts,
	 * - twitter.com and identi.ca urls get their network corrected,
	 * - otherwise a low priority "check_profile" task is queued when the
	 *   server is reachable (or the check is forced), else the contact's
	 *   `last_failure` is set to now.
	 *
	 * The loop stops after 100 queued checks or after three minutes.
	 *
	 * @return void
	 */
	private static function discoverUsers()
	{
		logger("Discover users", LOGGER_DEBUG);

		$starttime = time();

		$users = q("SELECT `url`, `created`, `updated`, `last_failure`, `last_contact`, `server_url`, `network` FROM `gcontact`
				WHERE `last_contact` < UTC_TIMESTAMP - INTERVAL 1 MONTH AND
					`last_failure` < UTC_TIMESTAMP - INTERVAL 1 MONTH AND
					`network` IN ('%s', '%s', '%s', '%s', '') ORDER BY rand()",
				DBA::escape(Protocol::DFRN), DBA::escape(Protocol::DIASPORA),
				DBA::escape(Protocol::OSTATUS), DBA::escape(Protocol::FEED));

		if (!DBA::isResult($users)) {
			return;
		}

		// Hosts whose contacts belong to a fixed network, regardless of what is stored
		$host_networks = ["twitter.com" => Protocol::TWITTER, "identi.ca" => Protocol::PUMPIO];

		$checked = 0;

		foreach ($users as $user) {
			$urlparts = parse_url($user["url"]);
			if (!isset($urlparts["scheme"])) {
				DBA::update('gcontact', ['network' => Protocol::PHANTOM],
					['nurl' => normalise_link($user["url"])]);
				continue;
			}

			// parse_url() may return a scheme without a host (e.g. "mailto:")
			$host = isset($urlparts["host"]) ? $urlparts["host"] : "";

			if (isset($host_networks[$host])) {
				DBA::update('gcontact', ['network' => $host_networks[$host]],
					['nurl' => normalise_link($user["url"])]);
				continue;
			}

			$server_url = PortableContact::detectServer($user["url"]);
			$force_update = false;

			if ($user["server_url"] != "") {
				// A changed server url forces the profile check; the stored url is kept for the server check
				$force_update = (normalise_link($user["server_url"]) != normalise_link($server_url));

				$server_url = $user["server_url"];
			}

			if ((($server_url == "") && ($user["network"] == Protocol::FEED)) || $force_update || PortableContact::checkServer($server_url, $user["network"])) {
				logger('Check profile '.$user["url"]);
				Worker::add(PRIORITY_LOW, "DiscoverPoCo", "check_profile", $user["url"]);

				// Stop once exactly 100 profile checks have been queued
				if (++$checked >= 100) {
					return;
				}
			} else {
				DBA::update('gcontact', ['last_failure' => DateTimeFormat::utcNow()],
					['nurl' => normalise_link($user["url"])]);
			}

			// Quit the loop after 3 minutes
			if (time() > ($starttime + 180)) {
				return;
			}
		}
	}

	/**
	 * @brief Searches the directory for a term and adds the found DFRN profiles as global contacts
	 *
	 * The same term is only searched once every 24 hours; the time of the
	 * last search is kept in the cache under "dirsearch:<search>".
	 *
	 * Known profiles are refreshed via PortableContact::lastUpdated() unless
	 * their last failure is more recent than both their last contact and
	 * their last update. Unknown profiles are probed and stored when the
	 * probe reports the DFRN network.
	 *
	 * @param string $search Search term
	 *
	 * @return void
	 */
	private static function discoverDirectory($search)
	{
		$last_search = Cache::get("dirsearch:".$search);
		if (!is_null($last_search)) {
			// Only search for the same item every 24 hours
			if (time() < $last_search + (60 * 60 * 24)) {
				logger("Already searched for ".$search." in the last 24 hours", LOGGER_DEBUG);
				return;
			}
		}

		$x = Network::fetchUrl(get_server()."/lsearch?p=1&n=500&search=".urlencode($search));
		$j = json_decode($x);

		if (!empty($j->results)) {
			foreach ($j->results as $jj) {
				// The result comes from a remote server, so don't rely on its structure
				if (empty($jj->url)) {
					continue;
				}

				// Check if the contact already exists
				// The url is remote data and has to be escaped before it is put into the query
				$exists = q("SELECT `id`, `last_contact`, `last_failure`, `updated` FROM `gcontact` WHERE `nurl` = '%s'", DBA::escape(normalise_link($jj->url)));
				if (DBA::isResult($exists)) {
					logger("Profile ".$jj->url." already exists (".$search.")", LOGGER_DEBUG);

					// Skip contacts whose most recent event is a failure
					if (($exists[0]["last_contact"] < $exists[0]["last_failure"]) &&
						($exists[0]["updated"] < $exists[0]["last_failure"])) {
						continue;
					}

					// Update the contact
					PortableContact::lastUpdated($jj->url);
					continue;
				}

				$server_url = PortableContact::detectServer($jj->url);
				if ($server_url != '') {
					if (!PortableContact::checkServer($server_url)) {
						logger("Friendica server ".$server_url." doesn't answer.", LOGGER_DEBUG);
						continue;
					}
					logger("Friendica server ".$server_url." seems to be okay.", LOGGER_DEBUG);
				}

				$data = Probe::uri($jj->url);
				if ($data["network"] == Protocol::DFRN) {
					logger("Profile ".$jj->url." is reachable (".$search.")", LOGGER_DEBUG);
					logger("Add profile ".$jj->url." to local directory (".$search.")", LOGGER_DEBUG);

					if (isset($jj->tags) && ($jj->tags != "")) {
						$data["keywords"] = $jj->tags;
					}

					$data["server_url"] = $data["baseurl"];

					GContact::update($data);
				} else {
					logger("Profile ".$jj->url." is not responding or no Friendica contact - but network ".$data["network"], LOGGER_DEBUG);
				}
			}
		}

		Cache::set("dirsearch:".$search, time(), Cache::DAY);
	}

	/**
	 * @brief Search for GNU Social user with gstools.org
	 *
	 * The search is currently disabled: the method returns false right away
	 * and everything after the first return statement is not executed.
	 *
	 * @param string $search User name
	 *
	 * @return bool Always false while the search is disabled
	 */
	private static function gsSearchUser($search)
	{
		// Currently disabled, since the service isn't available anymore.
		// It is not removed since I hope that there will be a successor.
		return false;

		$url = "http://gstools.org/api/users_search/".urlencode($search);

		$curlResult = Network::curl($url);
		if (!$curlResult->isSuccess()) {
			return false;
		}

		$contacts = json_decode($curlResult->getBody());

		if ($contacts->status == 'ERROR') {
			return false;
		}

		foreach ($contacts->data as $user) {
			$contact = Probe::uri($user->site_address."/".$user->name);
			if ($contact["network"] != Protocol::PHANTOM) {
				$contact["about"] = $user->description;
				GContact::update($contact);
			}
		}
	}
}
|