<?php

namespace Friendica\Directory\Pollers;

use Friendica\Directory\Utils\Network;

/**
 * Polls a single remote profile URL and mirrors what it finds into the
 * directory database (`profile`, `tag`, `photo` and `site_scrape` tables).
 *
 * Instances are invokable: `$poller($profile_uri)`.
 *
 * @author Hypolite Petovan <hypolite@mrpetovan.com>
 */
class Profile
{
    /**
     * @var \Atlas\Pdo\Connection
     */
    private $atlas;

    /**
     * @var \Friendica\Directory\Models\Server
     */
    private $serverModel;

    /**
     * @var \Friendica\Directory\Models\Profile
     */
    private $profileModel;

    /**
     * @var \Psr\Log\LoggerInterface
     */
    private $logger;

    /**
     * Default settings, overridden key by key by the array given to the constructor.
     *
     * - `probe_timeout`: not read anywhere in this class.
     * - `remove_profile_health_threshold`: when a poll yields no data and the
     *   server's `health_score` is below this value, the known profile is deleted.
     *
     * @var array
     */
    private $settings = [
        'probe_timeout' => 5,
        'remove_profile_health_threshold' => -60
    ];

    /**
     * @param \Atlas\Pdo\Connection               $atlas        Database connection used for all direct queries.
     * @param \Friendica\Directory\Models\Server  $serverModel  Used to look up the server a profile belongs to.
     * @param \Friendica\Directory\Models\Profile $profileModel Used to delete profiles.
     * @param \Psr\Log\LoggerInterface            $logger
     * @param array                               $settings     Overrides merged on top of the default settings.
     */
    public function __construct(
        \Atlas\Pdo\Connection $atlas,
        \Friendica\Directory\Models\Server $serverModel,
        \Friendica\Directory\Models\Profile $profileModel,
        \Psr\Log\LoggerInterface $logger,
        array $settings
    )
    {
        $this->atlas = $atlas;
        $this->serverModel = $serverModel;
        $this->profileModel = $profileModel;
        $this->logger = $logger;
        $this->settings = array_merge($this->settings, $settings);
    }

    /**
     * Polls the given profile URL and updates the directory accordingly.
     *
     * @param string $profile_uri Full URL of the remote profile page.
     * @return bool True when the poll produced a usable outcome: the profile was
     *              stored/updated, or it was deliberately removed because it is
     *              hidden or incomplete. False when the poll was aborted (empty or
     *              invalid URL, non-public host, unknown or hidden server, empty
     *              response, missing mandatory parameters).
     */
    public function __invoke(string $profile_uri)
    {
        if (!strlen($profile_uri)) {
            $this->logger->error('Received empty profile URI', ['class' => __CLASS__]);
            return false;
        }

        $submit_start = microtime(true);

        $this->logger->info('Poll profile URI: ' . $profile_uri);

        $host = parse_url($profile_uri, PHP_URL_HOST);
        if (!$host) {
            $this->logger->warning('Missing hostname in polled profile URL: ' . $profile_uri);
            return false;
        }

        if (!Network::isPublicHost($host)) {
            $this->logger->warning('Private/reserved IP in polled profile URL: ' . $profile_uri);
            return false;
        }

        $profileUriInfo = \Friendica\Directory\Models\Profile::extractInfoFromProfileUrl($profile_uri);
        if (!$profileUriInfo) {
            $this->logger->warning('Profile URI invalid');
            return false;
        }

        $server = $this->serverModel->getByUrlAlias($profileUriInfo['server_uri']);
        if (!$server) {
            // Queue the unknown server so that it gets polled; the profile poll itself stops here.
            $this->atlas->perform(
                'INSERT IGNORE INTO `server_poll_queue` SET `base_url` = :base_url',
                ['base_url' => $profileUriInfo['server_uri']]
            );

            // No server entry yet, no need to continue.
            $this->logger->info('Profile poll aborted, no server entry yet for ' . $profileUriInfo['server_uri']);
            return false;
        }

        if ($server['hidden']) {
            $this->logger->info('Profile poll aborted, server is hidden: ' . $server['base_url']);
            return false;
        }

        $username = $profileUriInfo['username'];
        $addr = $profileUriInfo['addr'];

        $profile_id = $this->atlas->fetchValue(
            'SELECT `id` FROM `profile` WHERE `server_id` = :server_id AND `username` = :username',
            ['server_id' => $server['id'], 'username' => $username]
        );

        if ($profile_id) {
            // Flag the known profile as unavailable and drop its tags up front;
            // both are written again further down if the poll succeeds.
            $this->resetProfile($profile_id);
        }

        // Skip the profile scrape?
        $noscrape = $server['noscrape_url'];

        $params = [];
        if ($noscrape) {
            $this->logger->debug('Calling ' . $server['noscrape_url'] . '/' . $username);
            $params = \Friendica\Directory\Utils\Scrape::retrieveNoScrapeData($server['noscrape_url'] . '/' . $username);
            $noscrape = (bool) $params; // If the result was false, do a scrape after all.
        }

        $available = true;

        if ($noscrape) {
            $available = Network::testURL($profile_uri);
            $this->logger->debug('Testing ' . $profile_uri . ': ' . ($available ? 'Success' : 'Failure'));
        } else {
            $this->logger->notice('Parsing profile page ' . $profile_uri);
            $params = \Friendica\Directory\Utils\Scrape::retrieveProfileData($profile_uri);
            if (!is_array($params)) {
                // A failed scrape must not be indexed like an array: writing to an
                // offset of `false` is deprecated since PHP 8.1 and writing to an
                // offset of an empty string is an error since PHP 7.1. Starting from
                // an empty array keeps the "fewer than 2 entries" check below working.
                $params = [];
            }
            $params['language'] = $server['language'];
        }

        // Empty result is due to an offline site.
        if (count($params) < 2) {
            // But for sites that are already in bad status, do a cleanup now.
            if ($profile_id && $server['health_score'] < $this->settings['remove_profile_health_threshold']) {
                $this->profileModel->deleteById($profile_id);
            }

            $this->logger->info('Poll aborted, empty result');
            return false;
        }

        if (!empty($params['explicit-hide']) && $profile_id) {
            // We don't care about valid dfrn if the user indicates to be hidden.
            $this->profileModel->deleteById($profile_id);
            $this->logger->info('Poll aborted, profile asked to be removed from directory');
            return true; // This is a good update.
        }

        if (!empty($params['hide']) || empty($params['fn']) || empty($params['photo'])) {
            if ($profile_id) {
                $this->profileModel->deleteById($profile_id);
            }

            if (!empty($params['hide'])) {
                $this->logger->info('Poll aborted, hidden profile.');
            } else {
                $this->logger->info('Poll aborted, incomplete profile.');
            }

            return true; // This is a good update.
        }

        // validateParams() returns the number of missing mandatory fields.
        // This is most likely a problem with the site configuration. Ignore.
        if (self::validateParams($params)) {
            $this->logger->warning('Poll aborted, parameters invalid.', ['params' => $params]);
            return false;
        }

        $account_type = !empty($params['comm']) ? 'Forum' : 'People';

        // Parsed once and reused for both the `profile`.`tags` column and the `tag` rows.
        $tags = !empty($params['tags']) ? self::normalizeTags($params['tags']) : [];

        // Bit field: 4 = description present, 2 = tags present, 1 = any location part present.
        $filled_fields = intval(!empty($params['pdesc'])) * 4
            + intval(!empty($params['tags'])) * 2
            + intval(!empty($params['locality']) || !empty($params['region']) || !empty($params['country-name']));

        $this->logger->debug(var_export($params, true));

        $values = [
            // NOTE(review): `profile_id` is bound but the upsert statement has no
            // `:profile_id` placeholder - confirm whether `id` was meant to be set.
            'profile_id'    => $profile_id,
            'server_id'     => $server['id'],
            'username'      => $username,
            'name'          => $params['fn'],
            'pdesc'         => $params['pdesc'] ?? '',
            'locality'      => $params['locality'] ?? '',
            'region'        => $params['region'] ?? '',
            'country'       => $params['country-name'] ?? '',
            'profile_url'   => $profile_uri,
            'dfrn_request'  => $params['dfrn-request'] ?? null,
            'photo'         => $params['photo'],
            'tags'          => implode(' ', $tags),
            'addr'          => $addr,
            'account_type'  => $account_type,
            'language'      => $params['language'] ?? null,
            'filled_fields' => $filled_fields,
            'last_activity' => $params['last-activity'] ?? null,
            'available'     => $available,
        ];

        $this->logger->debug(var_export($values, true));

        $this->upsertProfile($values);

        if (!$profile_id) {
            $profile_id = $this->atlas->lastInsertId();
        }

        foreach ($tags as $term) {
            $this->atlas->perform(
                'INSERT IGNORE INTO `tag` (`profile_id`, `term`) VALUES (:profile_id, :term)',
                ['term' => $term, 'profile_id' => $profile_id]
            );
        }

        $submit_photo_start = microtime(true);

        $status = false;

        if ($profile_id) {
            $this->storePhoto($profile_id, $params['photo']);
            $status = true;
        }

        $submit_end = microtime(true);
        $photo_time = round(($submit_end - $submit_photo_start) * 1000);
        $time = round(($submit_end - $submit_start) * 1000);

        // Record the scrape speed in a scrapes table.
        if ($server && $status) {
            $this->recordScrape($server['id'], $params, $photo_time, $time);
        }

        $this->logger->info('Profile poll successful');

        return true;
    }

    /**
     * Marks an already known profile as unavailable and removes its tag rows.
     *
     * @param mixed $profile_id Value of `profile`.`id`, bound as an integer.
     */
    private function resetProfile($profile_id)
    {
        $this->atlas->perform(
            'UPDATE `profile` SET
                `available` = 0,
                `updated` = NOW()
            WHERE `id` = :profile_id',
            ['profile_id' => [$profile_id, \PDO::PARAM_INT]]
        );

        $this->atlas->perform(
            'DELETE FROM `tag` WHERE `profile_id` = :profile_id',
            ['profile_id' => [$profile_id, \PDO::PARAM_INT]]
        );
    }

    /**
     * Splits a space-separated tag string into a list of distinct, non-empty terms.
     *
     * Each term is trimmed, stripped of HTML tags and cut to 254 bytes.
     *
     * @param string $raw_tags Space-separated tags as received from the remote site.
     * @return string[]
     */
    private static function normalizeTags($raw_tags): array
    {
        $terms = [];
        foreach (explode(' ', $raw_tags) as $term) {
            // NOTE(review): substr() counts bytes and may cut a multi-byte character in half.
            $term = substr(strip_tags(trim($term)), 0, 254);

            // strlen() rather than empty() so that the tag "0" is kept.
            if (strlen($term)) {
                $terms[] = $term;
            }
        }

        return array_values(array_unique($terms));
    }

    /**
     * Inserts the profile row, or updates it when a duplicate key is hit.
     *
     * @param array $values Named parameters for the statement.
     */
    private function upsertProfile(array $values)
    {
        // Shared by the INSERT and the ON DUPLICATE KEY UPDATE parts.
        $assignments = '
            `server_id` = :server_id,
            `username` = :username,
            `name` = :name,
            `pdesc` = :pdesc,
            `locality` = :locality,
            `region` = :region,
            `country` = :country,
            `profile_url` = :profile_url,
            `dfrn_request` = :dfrn_request,
            `photo` = :photo,
            `tags` = :tags,
            `addr` = :addr,
            `account_type` = :account_type,
            `language` = :language,
            `filled_fields` = :filled_fields,
            `last_activity` = :last_activity,
            `available` = :available';

        $this->atlas->perform(
            'INSERT INTO `profile` SET' . $assignments . ',
            `created` = NOW(),
            `updated` = NOW()
            ON DUPLICATE KEY UPDATE' . $assignments . ',
            `updated` = NOW()',
            $values
        );
    }

    /**
     * Downloads the profile photo and stores an 80px square version of it.
     *
     * Nothing is stored when the download does not yield a usable image.
     *
     * @param mixed  $profile_id Value of `profile`.`id`.
     * @param string $photo_url  Photo URL taken from the polled profile data.
     */
    private function storePhoto($profile_id, $photo_url)
    {
        // NOTE(review): this URL comes from the remote payload and, unlike the
        // profile URL, is not checked with Network::isPublicHost() here - confirm
        // that Network::fetchURL() guards against internal hosts.
        $img_str = Network::fetchURL($photo_url, true);
        $img = new \Friendica\Directory\Utils\Photo($img_str);
        if (!$img->getImage()) {
            return;
        }

        $img->scaleImageSquare(80);

        $this->atlas->perform(
            'INSERT INTO `photo` SET
                `profile_id` = :profile_id,
                `data` = :data
            ON DUPLICATE KEY UPDATE
                `data` = :data',
            [
                'profile_id' => $profile_id,
                'data' => $img->imageString()
            ]
        );
    }

    /**
     * Stores the timings of a completed poll in `site_scrape`.
     *
     * @param mixed $server_id  Value of the server's `id`.
     * @param array $params     Polled profile data; `_timings.fetch` and `_timings.scrape` are read from it.
     * @param float $photo_time Photo processing time in milliseconds.
     * @param float $total_time Total poll time in milliseconds.
     */
    private function recordScrape($server_id, array $params, $photo_time, $total_time)
    {
        $this->atlas->perform(
            'INSERT INTO `site_scrape` SET
                `server_id` = :server_id,
                `request_time` = :request_time,
                `scrape_time` = :scrape_time,
                `photo_time` = :photo_time,
                `total_time` = :total_time',
            [
                'server_id' => $server_id,
                'request_time' => $params['_timings']['fetch'],
                'scrape_time' => $params['_timings']['scrape'],
                'photo_time' => $photo_time,
                'total_time' => $total_time
            ]
        );
    }

    /**
     * Counts the mandatory profile parameters that are missing or empty.
     *
     * @param array $params Polled profile data.
     * @return int Number of missing mandatory fields; 0 means the data is valid.
     */
    private static function validateParams(array $params): int
    {
        $errors = 0;
        foreach (['key', 'dfrn-request', 'dfrn-confirm', 'dfrn-notify', 'dfrn-poll'] as $field) {
            if (empty($params[$field])) {
                $errors++;
            }
        }

        return $errors;
    }
}
|