2015-07-18 22:26:06 +02:00
|
|
|
<?php
|
|
|
|
|
|
|
|
require_once("boot.php");
|
|
|
|
require_once("include/socgraph.php");
|
|
|
|
|
|
|
|
|
|
|
|
/**
 * Runs one global-contact discovery job, selected by the command line arguments.
 *
 * Recognised invocations:
 *  - no parameter         : mode 0, calls poco_discover() and (unless OStatus is
 *                           disabled) gs_discover()
 *  - "dirsearch" <term>   : mode 1, calls discover_directory() and gs_search_user()
 *                           with the url-decoded term
 *  - "checkcontact"       : mode 2, calls discover_users()
 *  - "suggestions"        : mode 3, calls update_suggestions()
 * Any other combination terminates the script with an error message.
 *
 * Modes 0, 1 and 2 are only executed when the matching system config value
 * ('poco_discovery', 'poco_local_search', 'poco_completion') is set.
 *
 * Unless the function is called by the poller, the run is skipped when the
 * system load is above 'maxloadavg' and a pidfile prevents parallel runs of
 * the same mode/search term.
 *
 * @param array $argv Command line arguments
 * @param int   $argc Number of command line arguments
 */
function discover_poco_run(&$argv, &$argc){
	global $a, $db;

	if(is_null($a)) {
		$a = new App;
	}

	if(is_null($db)) {
		// The config file is expected to provide $db_host, $db_user, $db_pass and $db_data
		@include(".htconfig.php");
		require_once("include/dba.php");
		$db = new dba($db_host, $db_user, $db_pass, $db_data);
		unset($db_host, $db_user, $db_pass, $db_data);
	}

	require_once('include/session.php');
	require_once('include/datetime.php');
	require_once('include/pidfile.php');

	load_config('config');
	load_config('system');

	// Don't check this stuff if the function is called by the poller
	if (App::callstack() != "poller_run") {
		$maxsysload = intval(get_config('system','maxloadavg'));
		if($maxsysload < 1)
			$maxsysload = 50;

		$load = current_load();
		if($load) {
			if(intval($load) > $maxsysload) {
				logger('system: load '.$load.' too high. discover_poco deferred to next scheduled run.');
				return;
			}
		}
	}

	// Only the "dirsearch" mode carries a search term. It is initialised here
	// because the pidfile name, the log lines and the dispatch conditions
	// below read it in every mode.
	$search = "";

	if(($argc > 2) && ($argv[1] == "dirsearch")) {
		$search = urldecode($argv[2]);
		$mode = 1;
	} elseif(($argc == 2) && ($argv[1] == "checkcontact")) {
		$mode = 2;
	} elseif(($argc == 2) && ($argv[1] == "suggestions")) {
		$mode = 3;
	} elseif ($argc == 1) {
		$mode = 0;
	} else {
		// $argv[1] may be absent when the argument list is empty
		$parameter = (isset($argv[1]) ? $argv[1] : "");
		die("Unknown or missing parameter ".$parameter."\n");
	}

	// Don't check this stuff if the function is called by the poller
	if (App::callstack() != "poller_run") {
		$lockpath = get_lockpath();
		if ($lockpath != '') {
			// One pidfile per mode and search term
			$pidfile = new pidfile($lockpath, 'discover_poco'.$mode.urlencode($search));
			if($pidfile->is_already_running()) {
				logger("discover_poco: Already running");
				// NOTE(review): 19*60 is presumably 19 minutes in seconds - confirm against pidfile::running_time()
				if ($pidfile->running_time() > 19*60) {
					$pidfile->kill();
					logger("discover_poco: killed stale process");
					// Calling a new instance
					if ($mode == 0)
						proc_run('php','include/discover_poco.php');
				}
				exit;
			}
		}
	}

	$a->set_baseurl(get_config('system','url'));

	load_hooks();

	logger('start '.$search);

	if ($mode==3)
		update_suggestions();
	elseif (($mode == 2) AND get_config('system','poco_completion'))
		discover_users();
	elseif (($mode == 1) AND ($search != "") and get_config('system','poco_local_search')) {
		discover_directory($search);
		gs_search_user($search);
	} elseif (($mode == 0) AND ($search == "") and (get_config('system','poco_discovery') > 0)) {
		// Query Friendica and Hubzilla servers for their users
		poco_discover();

		// Query GNU Social servers for their users ("statistics" addon has to be enabled on the GS server)
		if (!get_config('system','ostatus_disabled'))
			gs_discover();
	}

	logger('end '.$search);

	return;
}
|
|
|
|
|
2015-07-26 14:41:34 +02:00
|
|
|
/**
 * Re-checks global contacts that had neither a contact nor a failure
 * recorded within the last month.
 *
 * Candidates are fetched in random order from `gcontact` (networks DFRN,
 * Diaspora, OStatus, Feed or empty). For every candidate:
 *  - a URL without a scheme is flagged with NETWORK_PHANTOM,
 *  - a URL on one of a few well-known foreign hosts gets the matching
 *    network assigned,
 *  - otherwise the contact's server is checked; when it answers (or no
 *    server could be determined) the contact is refreshed through
 *    poco_last_updated(), else `last_failure` is set to the current time.
 *
 * The function returns once more than 100 contacts have been refreshed.
 */
function discover_users() {
	logger("Discover users", LOGGER_DEBUG);

	// `network` is selected as well, since it is handed to poco_check_server() below
	$users = q("SELECT `url`, `created`, `updated`, `last_failure`, `last_contact`, `server_url`, `network` FROM `gcontact`
			WHERE `last_contact` < UTC_TIMESTAMP - INTERVAL 1 MONTH AND
				`last_failure` < UTC_TIMESTAMP - INTERVAL 1 MONTH AND
				`network` IN ('%s', '%s', '%s', '%s', '') ORDER BY rand()",
		dbesc(NETWORK_DFRN), dbesc(NETWORK_DIASPORA),
		dbesc(NETWORK_OSTATUS), dbesc(NETWORK_FEED));

	if (!$users)
		return;

	// Hosts whose network is known from the host name alone
	$networks = array("www.facebook.com" => NETWORK_FACEBOOK,
			"facebook.com" => NETWORK_FACEBOOK,
			"twitter.com" => NETWORK_TWITTER,
			"identi.ca" => NETWORK_PUMPIO,
			"alpha.app.net" => NETWORK_APPNET);

	$checked = 0;

	foreach ($users AS $user) {

		$urlparts = parse_url($user["url"]);
		if (!isset($urlparts["scheme"])) {
			// Not a usable URL: flag the entry so that it isn't selected again
			q("UPDATE `gcontact` SET `network` = '%s' WHERE `nurl` = '%s'",
				dbesc(NETWORK_PHANTOM), dbesc(normalise_link($user["url"])));
			continue;
		}

		if (isset($urlparts["host"]) AND isset($networks[$urlparts["host"]])) {
			q("UPDATE `gcontact` SET `network` = '%s' WHERE `nurl` = '%s'",
				dbesc($networks[$urlparts["host"]]), dbesc(normalise_link($user["url"])));
			continue;
		}

		if ($user["server_url"] != "")
			$server_url = $user["server_url"];
		else
			$server_url = poco_detect_server($user["url"]);

		// The contact's own network is passed on. Previously an undefined
		// variable ($gcontacts) was used here, so the argument was always empty.
		if (($server_url == "") OR poco_check_server($server_url, $user["network"])) {
			logger('Check user '.$user["url"]);
			poco_last_updated($user["url"], true);

			if (++$checked > 100)
				return;
		} else
			q("UPDATE `gcontact` SET `last_failure` = '%s' WHERE `nurl` = '%s'",
				dbesc(datetime_convert()), dbesc(normalise_link($user["url"])));
	}
}
|
|
|
|
|
2015-07-19 18:02:24 +02:00
|
|
|
/**
 * Searches the directory server for profiles matching a term and feeds the
 * results into the global contact table.
 *
 * The same term is only searched once every 24 hours; the time of the last
 * search is kept in the cache under "dirsearch:<term>".
 *
 * Profiles that already exist in `gcontact` are refreshed through
 * poco_last_updated(), unless their last failure is more recent than both
 * their last contact and their last update. Unknown profiles are probed and
 * added through poco_check() when they turn out to be DFRN contacts.
 *
 * @param string $search Search term
 */
function discover_directory($search) {

	$last_search = Cache::get("dirsearch:".$search);
	if (!is_null($last_search)){
		// Only search for the same item every 24 hours
		if (time() < $last_search + (60 * 60 * 24)) {
			logger("Already searched for ".$search." in the last 24 hours", LOGGER_DEBUG);
			return;
		}
	}

	$x = fetch_url(get_server()."/lsearch?p=1&n=500&search=".urlencode($search));
	$j = json_decode($x);

	// json_decode() returns null when the response isn't valid JSON
	if (is_object($j) AND !empty($j->results))
		foreach($j->results as $jj) {
			// Check if the contact already exists
			// The URL comes from a remote server, so it has to be escaped
			$exists = q("SELECT `id`, `last_contact`, `last_failure`, `updated` FROM `gcontact` WHERE `nurl` = '%s'",
					dbesc(normalise_link($jj->url)));
			if ($exists) {
				logger("Profile ".$jj->url." already exists (".$search.")", LOGGER_DEBUG);

				if (($exists[0]["last_contact"] < $exists[0]["last_failure"]) AND
					($exists[0]["updated"] < $exists[0]["last_failure"]))
					continue;

				// Update the contact
				poco_last_updated($jj->url);
				continue;
			}

			// Hardcoded paths aren't so good. But in this case it is okay.
			// First: We will only get Friendica contacts (which always use this url schema)
			// Second: There will be no further problems if we make a mistake
			$server_url = preg_replace("=(https?://)(.*)/profile/(.*)=ism", "$1$2", $jj->url);
			if ($server_url != $jj->url) {
				if (!poco_check_server($server_url)) {
					logger("Friendica server ".$server_url." doesn't answer.", LOGGER_DEBUG);
					continue;
				}
				// Only reported when the server really has been checked
				logger("Friendica server ".$server_url." seems to be okay.", LOGGER_DEBUG);
			}

			logger("Check if profile ".$jj->url." is reachable (".$search.")", LOGGER_DEBUG);
			$profile = probe_url($jj->url);
			if ($profile["network"] == NETWORK_DFRN) {
				logger("Add profile ".$jj->url." to local directory (".$search.")", LOGGER_DEBUG);
				poco_check($profile["url"], $profile["name"], $profile["network"], $profile["photo"], "", "", "", $jj->tags, $profile["addr"], "", 0);
			}
		}

	// Remember the time of this search, even when it didn't return anything
	Cache::set("dirsearch:".$search, time(), CACHE_DAY);
}
|
|
|
|
|
2016-01-21 19:00:08 +01:00
|
|
|
/**
 * @brief Search for GNU Social user with gstools.org
 *
 * Every user returned by the search is probed; users whose probe result
 * isn't NETWORK_PHANTOM are stored through update_gcontact(), with the
 * description from the search result as "about" text.
 *
 * @param string $search User name
 *
 * @return bool|null false when the request failed, the response couldn't be
 *                   used or the service reported an error; no value otherwise
 */
function gs_search_user($search) {

	$url = "http://gstools.org/api/users_search/".urlencode($search);

	$result = z_fetch_url($url);
	if (!$result["success"])
		return false;

	$contacts = json_decode($result["body"]);

	// json_decode() returns null when the body isn't valid JSON
	if (!is_object($contacts))
		return false;

	if (isset($contacts->status) AND ($contacts->status == 'ERROR'))
		return false;

	// Without an iterable user list there is nothing to process
	if (!isset($contacts->data) OR !(is_array($contacts->data) OR is_object($contacts->data)))
		return false;

	foreach($contacts->data AS $user) {
		$contact = probe_url($user->site_address."/".$user->name);
		if ($contact["network"] != NETWORK_PHANTOM) {
			$contact["about"] = $user->description;
			update_gcontact($contact);
		}
	}
}
|
|
|
|
|
|
|
|
|
2015-07-18 22:26:06 +02:00
|
|
|
// Start the discovery only when this file sits at position 0 of the list of
// included files, i.e. when it is the script that was invoked itself and not
// a file pulled in by another script.
if (0 === array_search(__FILE__, get_included_files())) {
	discover_poco_run($_SERVER["argv"], $_SERVER["argc"]);
	killme();
}
|