2014-07-01 03:27:56 +02:00
|
|
|
<?php
|
|
|
|
|
|
|
|
require_once('datetime.php');
|
2014-07-10 23:43:25 +02:00
|
|
|
require_once('site-health.php');
|
2014-07-01 03:27:56 +02:00
|
|
|
|
2014-07-10 23:43:25 +02:00
|
|
|
function run_submit($url) {
|
2014-07-01 03:27:56 +02:00
|
|
|
|
2014-07-10 23:43:25 +02:00
|
|
|
global $a;
|
|
|
|
|
2014-07-01 03:27:56 +02:00
|
|
|
if(! strlen($url))
|
|
|
|
return false;
|
|
|
|
|
|
|
|
logger('Updating: ' . $url);
|
2014-07-10 23:43:25 +02:00
|
|
|
|
|
|
|
//First run a notice script for the site it is hosted on.
|
|
|
|
$site_health = notice_site($url, true);
|
|
|
|
|
|
|
|
$submit_start = microtime(true);
|
|
|
|
|
2014-07-01 03:27:56 +02:00
|
|
|
$nurl = str_replace(array('https:','//www.'), array('http:','//'), $url);
|
|
|
|
|
|
|
|
$profile_exists = false;
|
|
|
|
|
2014-07-10 23:43:25 +02:00
|
|
|
$r = q("SELECT * FROM `profile` WHERE ( `homepage` = '%s' OR `nurl` = '%s' )",
|
2014-07-01 03:27:56 +02:00
|
|
|
dbesc($url),
|
|
|
|
dbesc($nurl)
|
|
|
|
);
|
|
|
|
|
|
|
|
if(count($r)) {
|
|
|
|
$profile_exists = true;
|
|
|
|
$profile_id = $r[0]['id'];
|
|
|
|
}
|
2014-07-10 23:43:25 +02:00
|
|
|
|
|
|
|
//Remove duplicates.
|
|
|
|
if(count($r) > 1){
|
|
|
|
for($i=1; $i<count($r); $i++){
|
|
|
|
logger('Removed duplicate profile '.intval($r[$i]['id']));
|
|
|
|
q("DELETE FROM `photo` WHERE `profile-id` = %d LIMIT 1",
|
|
|
|
intval($r[$i]['id'])
|
|
|
|
);
|
|
|
|
q("DELETE FROM `profile` WHERE `id` = %d LIMIT 1",
|
|
|
|
intval($r[$i]['id'])
|
|
|
|
);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2014-07-01 03:27:56 +02:00
|
|
|
require_once('Scrape.php');
|
|
|
|
|
2014-07-10 23:43:25 +02:00
|
|
|
//Skip the scrape? :D
|
|
|
|
$noscrape = $site_health && $site_health['no_scrape_url'];
|
|
|
|
if($noscrape){
|
|
|
|
|
|
|
|
//Find out who to look up.
|
|
|
|
$which = str_replace($site_health['base_url'], '', $url);
|
|
|
|
$noscrape = preg_match('~/profile/([^/]+)~', $which, $matches) === 1;
|
|
|
|
|
|
|
|
//If that did not fail...
|
|
|
|
if($noscrape){
|
|
|
|
$parms = noscrape_dfrn($site_health['no_scrape_url'].'/'.$matches[1]);
|
|
|
|
$noscrape = !!$parms; //If the result was false, do a scrape after all.
|
|
|
|
}
|
|
|
|
|
|
|
|
}
|
2014-07-01 03:27:56 +02:00
|
|
|
|
2014-07-10 23:43:25 +02:00
|
|
|
if(!$noscrape){
|
|
|
|
$parms = scrape_dfrn($url);
|
|
|
|
}
|
2014-07-01 03:27:56 +02:00
|
|
|
|
2014-07-10 23:43:25 +02:00
|
|
|
//Empty result is due to an offline site.
|
|
|
|
if(!count($parms)){
|
|
|
|
|
|
|
|
//For large sites this could lower the health too quickly, so don't track health.
|
|
|
|
//But for sites that are already in bad status. Do a cleanup now.
|
|
|
|
if($profile_exists && $site_health['health_score'] < $a->config['maintenance']['remove_profile_health_threshold']){
|
|
|
|
logger('Nuked bad health record.');
|
|
|
|
nuke_record($url);
|
|
|
|
}
|
|
|
|
|
2014-07-01 03:27:56 +02:00
|
|
|
return false;
|
2014-07-10 23:43:25 +02:00
|
|
|
|
2014-07-01 03:27:56 +02:00
|
|
|
}
|
2014-07-10 23:43:25 +02:00
|
|
|
|
|
|
|
//We don't care about valid dfrn if the user indicates to be hidden.
|
|
|
|
elseif($parms['explicit-hide'] && $profile_exists) {
|
|
|
|
logger('User opted out of the directory.');
|
|
|
|
nuke_record($url);
|
2014-07-11 01:35:30 +02:00
|
|
|
return true; //This is a good update.
|
2014-07-10 23:43:25 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
//This is most likely a problem with the site configuration. Ignore.
|
|
|
|
elseif(validate_dfrn($parms)) {
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2014-07-01 03:27:56 +02:00
|
|
|
if((x($parms,'hide')) || (! (x($parms,'fn')) && (x($parms,'photo')))) {
|
|
|
|
if($profile_exists) {
|
|
|
|
nuke_record($url);
|
|
|
|
}
|
2014-07-11 01:35:30 +02:00
|
|
|
return true; //This is a good update.
|
2014-07-01 03:27:56 +02:00
|
|
|
}
|
2014-07-10 23:43:25 +02:00
|
|
|
|
2014-07-01 03:27:56 +02:00
|
|
|
$photo = $parms['photo'];
|
|
|
|
|
|
|
|
dbesc_array($parms);
|
|
|
|
|
|
|
|
if(x($parms,'comm'))
|
|
|
|
$parms['comm'] = intval($parms['comm']);
|
|
|
|
|
|
|
|
if($profile_exists) {
|
|
|
|
$r = q("UPDATE `profile` SET
|
|
|
|
`name` = '%s',
|
|
|
|
`pdesc` = '%s',
|
|
|
|
`locality` = '%s',
|
|
|
|
`region` = '%s',
|
|
|
|
`postal-code` = '%s',
|
|
|
|
`country-name` = '%s',
|
|
|
|
`gender` = '%s',
|
|
|
|
`marital` = '%s',
|
|
|
|
`homepage` = '%s',
|
|
|
|
`nurl` = '%s',
|
|
|
|
`comm` = %d,
|
|
|
|
`tags` = '%s',
|
|
|
|
`updated` = '%s'
|
|
|
|
WHERE `id` = %d LIMIT 1",
|
|
|
|
|
|
|
|
$parms['fn'],
|
|
|
|
$parms['pdesc'],
|
|
|
|
$parms['locality'],
|
|
|
|
$parms['region'],
|
|
|
|
$parms['postal-code'],
|
|
|
|
$parms['country-name'],
|
|
|
|
$parms['gender'],
|
|
|
|
$parms['marital'],
|
|
|
|
dbesc($url),
|
|
|
|
dbesc($nurl),
|
|
|
|
intval($parms['comm']),
|
|
|
|
$parms['tags'],
|
|
|
|
dbesc(datetime_convert()),
|
|
|
|
intval($profile_id)
|
|
|
|
);
|
|
|
|
logger('Update returns: ' . $r);
|
|
|
|
|
|
|
|
}
|
|
|
|
else {
|
|
|
|
$r = q("INSERT INTO `profile` ( `name`, `pdesc`, `locality`, `region`, `postal-code`, `country-name`, `gender`, `marital`, `homepage`, `nurl`, `comm`, `tags`, `created`, `updated` )
|
|
|
|
VALUES ( '%s', '%s', '%s', '%s' , '%s', '%s', '%s', '%s', '%s', '%s', %d, '%s', '%s', '%s' )",
|
|
|
|
$parms['fn'],
|
|
|
|
$parms['pdesc'],
|
|
|
|
$parms['locality'],
|
|
|
|
$parms['region'],
|
|
|
|
$parms['postal-code'],
|
|
|
|
$parms['country-name'],
|
|
|
|
$parms['gender'],
|
|
|
|
$parms['marital'],
|
|
|
|
dbesc($url),
|
|
|
|
dbesc($nurl),
|
|
|
|
intval($parms['comm']),
|
|
|
|
$parms['tags'],
|
|
|
|
dbesc(datetime_convert()),
|
|
|
|
dbesc(datetime_convert())
|
|
|
|
);
|
|
|
|
logger('Insert returns: ' . $r);
|
|
|
|
|
|
|
|
$r = q("SELECT `id` FROM `profile` WHERE ( `homepage` = '%s' or `nurl` = '%s' ) order by id asc",
|
|
|
|
dbesc($url),
|
|
|
|
dbesc($nurl)
|
|
|
|
);
|
|
|
|
|
|
|
|
if(count($r))
|
|
|
|
$profile_id = $r[count($r) - 1]['id'];
|
|
|
|
|
|
|
|
if(count($r) > 1) {
|
|
|
|
q("DELETE FROM `photo` WHERE `profile-id` = %d LIMIT 1",
|
|
|
|
intval($r[0]['id'])
|
|
|
|
);
|
|
|
|
q("DELETE FROM `profile` WHERE `id` = %d LIMIT 1",
|
|
|
|
intval($r[0]['id'])
|
|
|
|
);
|
|
|
|
}
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
if($parms['tags']) {
|
|
|
|
$arr = explode(' ', $parms['tags']);
|
|
|
|
if(count($arr)) {
|
|
|
|
foreach($arr as $t) {
|
|
|
|
$t = strip_tags(trim($t));
|
|
|
|
$t = substr($t,0,254);
|
|
|
|
|
|
|
|
if(strlen($t)) {
|
|
|
|
$r = q("SELECT `id` FROM `tag` WHERE `term` = '%s' and `nurl` = '%s' LIMIT 1",
|
|
|
|
dbesc($t),
|
|
|
|
dbesc($nurl)
|
|
|
|
);
|
|
|
|
if(! count($r)) {
|
|
|
|
$r = q("INSERT INTO `tag` (`term`, `nurl`) VALUES ('%s', '%s') ",
|
|
|
|
dbesc($t),
|
|
|
|
dbesc($nurl)
|
|
|
|
);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2014-07-10 23:43:25 +02:00
|
|
|
|
|
|
|
$submit_photo_start = microtime(true);
|
|
|
|
|
2014-07-01 03:27:56 +02:00
|
|
|
require_once("Photo.php");
|
|
|
|
|
|
|
|
$photo_failure = false;
|
2014-07-10 23:43:25 +02:00
|
|
|
|
|
|
|
$status = false;
|
|
|
|
|
2014-07-01 03:27:56 +02:00
|
|
|
if($profile_id) {
|
2014-07-11 01:35:30 +02:00
|
|
|
$img_str = fetch_url($photo,true);
|
|
|
|
$img = new Photo($img_str);
|
|
|
|
if($img) {
|
|
|
|
$img->scaleImageSquare(80);
|
|
|
|
$r = $img->store($profile_id);
|
|
|
|
}
|
2014-07-01 03:27:56 +02:00
|
|
|
$r = q("UPDATE `profile` SET `photo` = '%s' WHERE `id` = %d LIMIT 1",
|
|
|
|
dbesc($a->get_baseurl() . '/photo/' . $profile_id . '.jpg'),
|
|
|
|
intval($profile_id)
|
|
|
|
);
|
2014-07-10 23:43:25 +02:00
|
|
|
$status = true;
|
2014-07-01 03:27:56 +02:00
|
|
|
}
|
|
|
|
else{
|
|
|
|
nuke_record($url);
|
2014-07-11 01:35:30 +02:00
|
|
|
return false;
|
2014-07-01 03:27:56 +02:00
|
|
|
}
|
2014-07-10 23:43:25 +02:00
|
|
|
|
|
|
|
$submit_end = microtime(true);
|
|
|
|
$photo_time = round(($submit_end - $submit_photo_start) * 1000);
|
|
|
|
$time = round(($submit_end - $submit_start) * 1000);
|
|
|
|
|
|
|
|
//Record the scrape speed in a scrapes table.
|
|
|
|
if($site_health && $status) q(
|
|
|
|
"INSERT INTO `site-scrape` (`site_health_id`, `dt_performed`, `request_time`, `scrape_time`, `photo_time`, `total_time`)".
|
|
|
|
"VALUES (%u, NOW(), %u, %u, %u, %u)",
|
|
|
|
$site_health['id'],
|
|
|
|
$parms['_timings']['fetch'],
|
|
|
|
$parms['_timings']['scrape'],
|
|
|
|
$photo_time,
|
|
|
|
$time
|
|
|
|
);
|
|
|
|
|
|
|
|
return $status;
|
2014-07-01 03:27:56 +02:00
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
function nuke_record($url) {
|
|
|
|
|
|
|
|
$nurl = str_replace(array('https:','//www.'), array('http:','//'), $url);
|
|
|
|
|
|
|
|
$r = q("SELECT `id` FROM `profile` WHERE ( `homepage` = '%s' OR `nurl` = '%s' ) ",
|
|
|
|
dbesc($url),
|
|
|
|
dbesc($nurl)
|
|
|
|
);
|
|
|
|
|
|
|
|
if(count($r)) {
|
|
|
|
foreach($r as $rr) {
|
|
|
|
q("DELETE FROM `photo` WHERE `profile-id` = %d LIMIT 1",
|
|
|
|
intval($rr['id'])
|
|
|
|
);
|
|
|
|
q("DELETE FROM `profile` WHERE `id` = %d LIMIT 1",
|
|
|
|
intval($rr['id'])
|
|
|
|
);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return;
|
2017-03-01 20:19:12 +01:00
|
|
|
}
|