Merge pull request #13856 from annando/spam2

Compare lengths of hashtags with the content length for improved spam detection
This commit is contained in:
Hypolite Petovan 2024-01-26 18:59:38 -05:00 committed by GitHub
commit 9e738253e7
No known key found for this signature in database
GPG key ID: B5690EEEBB952194
2 changed files with 10 additions and 5 deletions

View file

@ -113,13 +113,18 @@ class Relay
}
if (!empty($tagList) || !empty($denyTags)) {
$content = mb_strtolower(BBCode::toPlaintext($body, false));
$max_tags = $config->get('system', 'relay_max_tags');
if ($max_tags && (count($tags) > $max_tags) && preg_match('/[^@!#]\[url\=.*?\].*?\[\/url\]/ism', $body)) {
Logger::info('Possible hashtag spam detected - rejected', ['hashtags' => $tags, 'network' => $network, 'url' => $url, 'causer' => $causer, 'body' => $body]);
return false;
}
$cleaned = preg_replace('/[@!#]\[url\=.*?\].*?\[\/url\]/ism', '', $body);
$content_cleaned = mb_strtolower(BBCode::toPlaintext($cleaned, false));
$content = mb_strtolower(BBCode::toPlaintext($body, false));
if (strlen($content_cleaned) < strlen($content) / 2) {
Logger::info('Possible hashtag spam detected - rejected', ['hashtags' => $tags, 'network' => $network, 'url' => $url, 'causer' => $causer, 'body' => $body]);
return false;
}
}
foreach ($tags as $tag) {
$tag = mb_strtolower($tag);

View file

@ -239,7 +239,7 @@ return [
// relay_max_tags (Integer)
// Maximum amount of tags in a post before it is rejected as spam.
'relay_max_tags' => 10,
'relay_max_tags' => 20,
// proxify_content (Boolean)
// Use the proxy functionality for fetching external content