197 lines
		
	
	
	
		
			5.8 KiB
		
	
	
	
		
			PHP
		
	
	
	
	
	
			
		
		
	
	
			197 lines
		
	
	
	
		
			5.8 KiB
		
	
	
	
		
			PHP
		
	
	
	
	
	
| <?php
 | |
| 
 | |
| require_once("boot.php");
 | |
| require_once("include/socgraph.php");
 | |
| 
 | |
| 
 | |
/**
 * Entry point of the discover_poco background worker.
 *
 * Bootstraps the application object and the database connection when they
 * are not available yet, skips the run when the system load is above the
 * configured limit, takes a pid-file lock and finally dispatches to one of
 * the discovery tasks depending on the command line:
 *
 *   (no argument)       mode 0: poco_discover()
 *   dirsearch <term>    mode 1: discover_directory(<term>)
 *   checkcontact        mode 2: discover_users()
 *   suggestions         mode 3: update_suggestions()
 *
 * Each task except mode 3 additionally has to be enabled through its
 * 'system' config switch, otherwise nothing is executed.
 *
 * @param array $argv Command line arguments, $argv[0] being the script name
 * @param int   $argc Number of entries in $argv
 */
function discover_poco_run(&$argv, &$argc){
	global $a, $db;

	if (is_null($a)) {
		$a = new App;
	}

	if (is_null($db)) {
		// The connection settings ($db_host, $db_user, $db_pass, $db_data)
		// are expected to be provided by the included config file.
		@include(".htconfig.php");
		require_once("include/dba.php");
		$db = new dba($db_host, $db_user, $db_pass, $db_data);
		unset($db_host, $db_user, $db_pass, $db_data);
	}

	require_once('include/session.php');
	require_once('include/datetime.php');
	require_once('include/pidfile.php');

	load_config('config');
	load_config('system');

	// Fall back to a load limit of 50 when none (or an invalid one) is configured
	$maxsysload = intval(get_config('system','maxloadavg'));
	if ($maxsysload < 1) {
		$maxsysload = 50;
	}

	$load = current_load();
	if ($load && (intval($load) > $maxsysload)) {
		logger('system: load ' . $load . ' too high. discover_poco deferred to next scheduled run.');
		return;
	}

	// Only the "dirsearch" mode carries a search term. Initialising it here
	// keeps the lock name and the log lines below free of undefined
	// variable accesses in the other modes.
	$search = "";

	if (($argc > 2) && ($argv[1] == "dirsearch")) {
		$search = urldecode($argv[2]);
		$mode = 1;
	} elseif (($argc == 2) && ($argv[1] == "checkcontact")) {
		$mode = 2;
	} elseif (($argc == 2) && ($argv[1] == "suggestions")) {
		$mode = 3;
	} elseif ($argc == 1) {
		$mode = 0;
	} else {
		die("Unknown or missing parameter ".(isset($argv[1]) ? $argv[1] : "")."\n");
	}

	$lockpath = get_lockpath();
	if ($lockpath != '') {
		// One lock per mode and search term, so different tasks can run in parallel
		$pidfile = new pidfile($lockpath, 'discover_poco'.$mode.urlencode($search));
		if ($pidfile->is_already_running()) {
			logger("discover_poco: Already running");
			// A process that has been running for more than 19 minutes is treated as stale
			if ($pidfile->running_time() > 19*60) {
				$pidfile->kill();
				logger("discover_poco: killed stale process");
				// Calling a new instance
				if ($mode == 0) {
					proc_run('php','include/discover_poco.php');
				}
			}
			exit;
		}
	}

	$a->set_baseurl(get_config('system','url'));

	load_hooks();

	logger('start '.$search);

	if ($mode == 3) {
		update_suggestions();
	} elseif (($mode == 2) && get_config('system','poco_completion')) {
		discover_users();
	} elseif (($mode == 1) && ($search != "") && get_config('system','poco_local_search')) {
		discover_directory($search);
	} elseif (($mode == 0) && ($search == "") && (get_config('system','poco_discovery') > 0)) {
		poco_discover();
	}

	logger('end '.$search);
}
 | |
| 
 | |
/**
 * Re-checks global contacts that had neither a successful contact nor a
 * recorded failure during the last month.
 *
 * For every selected `gcontact` row:
 *  - URLs without a scheme are flagged with NETWORK_PHANTOM,
 *  - URLs on a few well known foreign hosts get the matching network assigned,
 *  - all others are refreshed via poco_last_updated() when their server
 *    passes poco_check_server(); otherwise `last_failure` is set to now.
 *
 * The function returns as soon as the counter of refreshed contacts
 * exceeds 100.
 */
function discover_users() {
	logger("Discover users", LOGGER_DEBUG);

	// `network` is selected as well, since it is handed to poco_check_server() below
	$users = q("SELECT `url`, `created`, `updated`, `last_failure`, `last_contact`, `server_url`, `network` FROM `gcontact`
			WHERE `last_contact` < UTC_TIMESTAMP - INTERVAL 1 MONTH AND
				`last_failure` < UTC_TIMESTAMP - INTERVAL 1 MONTH AND
				`network` IN ('%s', '%s', '%s', '%s', '') ORDER BY rand()",
			dbesc(NETWORK_DFRN), dbesc(NETWORK_DIASPORA),
			dbesc(NETWORK_OSTATUS), dbesc(NETWORK_FEED));

	if (!$users) {
		return;
	}

	// Hosts whose network is known without probing them
	$networks = array("www.facebook.com" => NETWORK_FACEBOOK,
			"facebook.com" => NETWORK_FACEBOOK,
			"twitter.com" => NETWORK_TWITTER,
			"identi.ca" => NETWORK_PUMPIO,
			"alpha.app.net" => NETWORK_APPNET);

	$checked = 0;

	foreach ($users as $user) {

		$urlparts = parse_url($user["url"]);

		// Not a usable URL at all (parse_url() failed or found no scheme)
		if (!isset($urlparts["scheme"])) {
			q("UPDATE `gcontact` SET `network` = '%s' WHERE `nurl` = '%s'",
				dbesc(NETWORK_PHANTOM), dbesc(normalise_link($user["url"])));
			continue;
		}

		// parse_url() omits "host" for URLs like "mailto:someone"
		$host = isset($urlparts["host"]) ? $urlparts["host"] : "";

		if (isset($networks[$host])) {
			q("UPDATE `gcontact` SET `network` = '%s' WHERE `nurl` = '%s'",
				dbesc($networks[$host]), dbesc(normalise_link($user["url"])));
			continue;
		}

		if ($user["server_url"] != "") {
			$server_url = $user["server_url"];
		} else {
			$server_url = poco_detect_server($user["url"]);
		}

		// The network of the contact being checked is passed on; the former
		// code read it from a variable that was never defined in this function.
		if (poco_check_server($server_url, $user["network"])) {
			logger('Check user '.$user["url"]);
			poco_last_updated($user["url"], true);

			if (++$checked > 100) {
				return;
			}
		} else {
			q("UPDATE `gcontact` SET `last_failure` = '%s' WHERE `nurl` = '%s'",
				dbesc(datetime_convert()), dbesc(normalise_link($user["url"])));
		}
	}
}
 | |
| 
 | |
/**
 * Searches the directory server for a term and imports the found profiles.
 *
 * The same term is only looked up once within 24 hours; the time of the
 * last lookup is kept in the cache under "dirsearch:<term>".
 *
 * Profiles that already exist in `gcontact` are refreshed with
 * poco_last_updated(), unless their last failure is newer than both their
 * last contact and their last update. Unknown profiles are probed and
 * handed to poco_check() when they turn out to be NETWORK_DFRN profiles.
 *
 * @param string $search The search term
 */
function discover_directory($search) {

	$last_search = Cache::get("dirsearch:".$search);
	if (!is_null($last_search)) {
		// Only search for the same item every 24 hours
		if (time() < $last_search + (60 * 60 * 24)) {
			logger("Already searched for ".$search." in the last 24 hours", LOGGER_DEBUG);
			return;
		}
	}

	$x = fetch_url(get_server()."/lsearch?p=1&n=500&search=".urlencode($search));
	$j = json_decode($x);

	// A failed request or an unparsable answer yields no result list at all
	$results = array();
	if (is_object($j) && isset($j->results) && (is_array($j->results) || is_object($j->results))) {
		$results = $j->results;
	}

	foreach ($results as $jj) {
		// Skip malformed entries
		if (!is_object($jj) || !isset($jj->url)) {
			continue;
		}

		// Check if the contact already exists
		// The url is supplied by the remote directory, so it has to be escaped
		$exists = q("SELECT `id`, `last_contact`, `last_failure`, `updated` FROM `gcontact` WHERE `nurl` = '%s'",
				dbesc(normalise_link($jj->url)));
		if ($exists) {
			logger("Profile ".$jj->url." already exists (".$search.")", LOGGER_DEBUG);

			// Don't retry contacts whose most recent event is a failure
			if (($exists[0]["last_contact"] < $exists[0]["last_failure"]) &&
				($exists[0]["updated"] < $exists[0]["last_failure"])) {
				continue;
			}

			// Update the contact
			poco_last_updated($jj->url);
			continue;
		}

		// Hardcoded paths aren't so good. But in this case it is okay.
		// First: We only will get Friendica contacts (which always are using this url schema)
		// Second: There will be no further problems if we make a mistake
		$server_url = preg_replace("=(https?://)(.*)/profile/(.*)=ism", "$1$2", $jj->url);

		// When nothing was replaced, no server url could be derived and there is nothing to check
		if ($server_url != $jj->url) {
			if (!poco_check_server($server_url)) {
				logger("Friendica server ".$server_url." doesn't answer.", LOGGER_DEBUG);
				continue;
			}
			logger("Friendica server ".$server_url." seems to be okay.", LOGGER_DEBUG);
		}

		logger("Check if profile ".$jj->url." is reachable (".$search.")", LOGGER_DEBUG);
		$profile = probe_url($jj->url);
		if ($profile["network"] == NETWORK_DFRN) {
			logger("Add profile ".$jj->url." to local directory (".$search.")", LOGGER_DEBUG);
			poco_check($profile["url"], $profile["name"], $profile["network"], $profile["photo"], "", "", "", $jj->tags, $profile["addr"], "", 0);
		}
	}

	// Remember the lookup, even when it didn't return anything
	Cache::set("dirsearch:".$search, time(), CACHE_DAY);
}
 | |
| 
 | |
// Run the worker only when this file is the first entry in PHP's list of
// included files, and skip it when this file appears later in that list.
if (0 === array_search(__FILE__, get_included_files())) {
	discover_poco_run($_SERVER["argv"], $_SERVER["argc"]);
	killme();
}
 |