2015-07-24 19:02:42 +02:00
< ? php
/*
* Name : Language Filter
* Version : 0.1
* Description : Filters out postings in languages not spoken by the users
* Author : Tobias Diekershoff < https :// f . diekershoff . de / u / tobias >
* License : MIT
*/
2017-11-05 14:59:45 +01:00
use Friendica\App ;
2018-04-22 00:47:18 +02:00
use Friendica\Content\Text\BBCode ;
2018-12-26 08:28:16 +01:00
use Friendica\Core\Hook ;
2018-10-31 15:55:15 +01:00
use Friendica\Core\Renderer ;
2019-12-16 01:05:14 +01:00
use Friendica\DI ;
2017-10-05 14:58:44 +02:00
2015-07-24 19:02:42 +02:00
/* Define the hooks we want to use
* that is , we have settings , we need to save the settings and we want
* to modify the content of a posting when friendica prepares it .
*/
2017-11-05 14:59:45 +01:00
function langfilter_install ()
{
2018-12-26 08:28:16 +01:00
Hook :: register ( 'prepare_body_content_filter' , 'addon/langfilter/langfilter.php' , 'langfilter_prepare_body_content_filter' , 10 );
Hook :: register ( 'addon_settings' , 'addon/langfilter/langfilter.php' , 'langfilter_addon_settings' );
Hook :: register ( 'addon_settings_post' , 'addon/langfilter/langfilter.php' , 'langfilter_addon_settings_post' );
2015-07-24 19:02:42 +02:00
}
2017-11-05 14:59:45 +01:00
2015-07-24 19:02:42 +02:00
/* The settings
* 1 st check if somebody logged in is calling
* 2 nd get the current settings
* 3 rd parse a SMARTY3 template , replacing some translateable strings for the form
*/
2017-11-05 14:59:45 +01:00
function langfilter_addon_settings ( App $a , & $s )
{
if ( ! local_user ()) {
2015-07-24 19:02:42 +02:00
return ;
2017-11-05 14:59:45 +01:00
}
2020-02-01 20:14:22 +01:00
$enabled = DI :: pConfig () -> get ( local_user (), 'langfilter' , 'enable' ,
! DI :: pConfig () -> get ( local_user (), 'langfilter' , 'disable' ));
$enable_checked = $enabled ? ' checked="checked"' : '' ;
2020-01-18 16:50:56 +01:00
$languages = DI :: pConfig () -> get ( local_user (), 'langfilter' , 'languages' );
2020-02-01 20:14:22 +01:00
$minconfidence = DI :: pConfig () -> get ( local_user (), 'langfilter' , 'minconfidence' , 0 ) * 100 ;
$minlength = DI :: pConfig () -> get ( local_user (), 'langfilter' , 'minlength' , 32 );
2015-07-24 19:02:42 +02:00
2018-10-31 15:55:15 +01:00
$t = Renderer :: getMarkupTemplate ( " settings.tpl " , " addon/langfilter/ " );
$s .= Renderer :: replaceMacros ( $t , [
2020-01-18 20:52:33 +01:00
'$title' => DI :: l10n () -> t ( " Language Filter " ),
2021-03-24 23:33:42 +01:00
'$intro' => DI :: l10n () -> t ( 'This addon tries to identify the language posts are written in. If it does not match any language specified below, posts will be hidden by collapsing them.' ),
2020-01-18 20:52:33 +01:00
'$enabled' => [ 'langfilter_enable' , DI :: l10n () -> t ( 'Use the language filter' ), $enable_checked , '' ],
2020-10-04 04:02:05 +02:00
'$languages' => [ 'langfilter_languages' , DI :: l10n () -> t ( 'Able to read' ), $languages , DI :: l10n () -> t ( 'List of abbreviations (ISO 639-1 codes) for languages you speak, comma separated. For example "de,it".' )],
2020-01-18 20:52:33 +01:00
'$minconfidence' => [ 'langfilter_minconfidence' , DI :: l10n () -> t ( 'Minimum confidence in language detection' ), $minconfidence , DI :: l10n () -> t ( 'Minimum confidence in language detection being correct, from 0 to 100. Posts will not be filtered when the confidence of language detection is below this percent value.' )],
'$minlength' => [ 'langfilter_minlength' , DI :: l10n () -> t ( 'Minimum length of message body' ), $minlength , DI :: l10n () -> t ( 'Minimum number of characters in message body for filter to be used. Posts shorter than this will not be filtered. Note: Language detection is unreliable for short content (<200 characters).' )],
'$submit' => DI :: l10n () -> t ( 'Save Settings' ),
2018-01-15 14:15:33 +01:00
]);
2015-07-24 19:02:42 +02:00
return ;
}
2017-11-05 14:59:45 +01:00
2015-07-24 19:02:42 +02:00
/* Save the settings
* 1 st check it ' s a logged in user calling
* 2 nd check the langfilter form is to be saved
* 3 rd save the settings to the DB for later usage
*/
2017-11-05 14:59:45 +01:00
function langfilter_addon_settings_post ( App $a , & $b )
{
if ( ! local_user ()) {
2015-07-24 19:02:42 +02:00
return ;
2017-11-05 14:59:45 +01:00
}
2015-07-24 19:02:42 +02:00
2018-08-08 08:24:47 +02:00
if ( ! empty ( $_POST [ 'langfilter-settings-submit' ])) {
2020-02-01 20:14:22 +01:00
$enable = intval ( $_POST [ 'langfilter_enable' ] ? ? 0 );
$languages = trim ( $_POST [ 'langfilter_languages' ] ? ? '' );
$minconfidence = max ( 0 , min ( 100 , intval ( $_POST [ 'langfilter_minconfidence' ] ? ? 0 ))) / 100 ;
$minlength = intval ( $_POST [ 'langfilter_minlength' ] ? ? 32 );
if ( $minlength <= 0 ) {
2017-11-05 14:59:45 +01:00
$minlength = 32 ;
}
2020-02-01 20:14:22 +01:00
DI :: pConfig () -> set ( local_user (), 'langfilter' , 'enable' , $enable );
DI :: pConfig () -> set ( local_user (), 'langfilter' , 'languages' , $languages );
DI :: pConfig () -> set ( local_user (), 'langfilter' , 'minconfidence' , $minconfidence );
DI :: pConfig () -> set ( local_user (), 'langfilter' , 'minlength' , $minlength );
2015-07-24 19:02:42 +02:00
}
}
2017-11-05 14:59:45 +01:00
2015-07-24 19:02:42 +02:00
/* Actually filter postings by their language
* 1 st check if the user wants to filter postings
* 2 nd get the user settings which languages shall be not filtered out
2015-09-22 12:29:06 +02:00
* 3 rd extract the language of a posting
2015-07-24 19:02:42 +02:00
* 4 th if the determined language does not fit to the spoken languages
* of the user , then collapse the posting , but provide a link to
* expand it again .
*/
2018-04-05 04:51:44 +02:00
function langfilter_prepare_body_content_filter ( App $a , & $hook_data )
2017-11-05 14:59:45 +01:00
{
$logged_user = local_user ();
if ( ! $logged_user ) {
return ;
}
2015-09-09 19:41:38 +02:00
2017-11-05 14:59:45 +01:00
// Never filter own messages
// TODO: find a better way to extract this
2019-12-16 01:05:14 +01:00
$logged_user_profile = DI :: baseUrl () -> get () . '/profile/' . $a -> user [ 'nickname' ];
2018-04-01 08:31:37 +02:00
if ( $logged_user_profile == $hook_data [ 'item' ][ 'author-link' ]) {
2017-11-05 14:59:45 +01:00
return ;
}
2015-07-24 19:02:42 +02:00
2017-11-05 14:59:45 +01:00
// Don't filter if language filter is disabled
2020-02-01 20:14:22 +01:00
if ( ! DI :: pConfig () -> get ( $logged_user , 'langfilter' , 'enable' ,
! DI :: pConfig () -> get ( $logged_user , 'langfilter' , 'disable' ))
) {
2017-11-05 14:59:45 +01:00
return ;
}
2015-09-10 09:54:26 +02:00
2021-07-18 01:36:23 +02:00
if ( ! empty ( $hook_data [ 'item' ][ 'rendered-html' ])) {
$naked_body = strip_tags ( $hook_data [ 'item' ][ 'rendered-html' ]);
} else {
$naked_body = BBCode :: toPlaintext ( $hook_data [ 'item' ][ 'body' ], false );
}
2018-04-21 10:13:53 +02:00
2017-11-05 14:59:45 +01:00
// Don't filter if body lenght is below minimum
2020-01-18 16:50:56 +01:00
$minlen = DI :: pConfig () -> get ( local_user (), 'langfilter' , 'minlength' , 32 );
2017-11-05 14:59:45 +01:00
if ( ! $minlen ) {
$minlen = 32 ;
}
2018-04-21 10:13:53 +02:00
if ( strlen ( $naked_body ) < $minlen ) {
2017-11-05 14:59:45 +01:00
return ;
}
2016-10-01 18:15:32 +02:00
2020-01-18 16:50:56 +01:00
$read_languages_string = DI :: pConfig () -> get ( local_user (), 'langfilter' , 'languages' );
$minconfidence = DI :: pConfig () -> get ( local_user (), 'langfilter' , 'minconfidence' );
2015-09-22 12:29:06 +02:00
2017-11-05 14:59:45 +01:00
// Don't filter if no spoken languages are configured
2018-04-01 08:31:37 +02:00
if ( ! $read_languages_string ) {
2017-11-05 14:59:45 +01:00
return ;
2018-04-01 08:31:37 +02:00
}
$read_languages_array = explode ( ',' , $read_languages_string );
2015-09-22 12:29:06 +02:00
2020-10-04 04:00:44 +02:00
$iso639 = new Matriphe\ISO639\ISO639 ;
2017-11-05 14:59:45 +01:00
// Extract the language of the post
2018-06-30 07:20:17 +02:00
if ( ! empty ( $hook_data [ 'item' ][ 'language' ])) {
$languages = json_decode ( $hook_data [ 'item' ][ 'language' ], true );
if ( ! is_array ( $languages )) {
return ;
}
2018-04-01 08:31:37 +02:00
2018-06-30 07:20:17 +02:00
foreach ( $languages as $iso2 => $confidence ) {
break ;
}
2015-09-22 12:29:06 +02:00
2018-08-31 07:10:53 +02:00
if ( empty ( $iso2 )) {
return ;
}
2020-10-04 04:00:44 +02:00
$lang = $iso639 -> languageByCode1 ( $iso2 );
2018-06-30 07:20:17 +02:00
} else {
$opts = $hook_data [ 'item' ][ 'postopts' ];
if ( ! $opts ) {
// no options associated to post
return ;
}
if ( ! preg_match ( '/\blang=([^;]*);([^:]*)/' , $opts , $matches )) {
// no lang options associated to post
return ;
}
$lang = $matches [ 1 ];
$confidence = $matches [ 2 ];
2020-10-04 04:00:44 +02:00
$iso2 = $iso639 -> code1ByLanguage ( $lang );
2018-06-30 07:20:17 +02:00
}
2015-09-22 12:29:06 +02:00
2017-11-05 14:59:45 +01:00
// Do not filter if language detection confidence is too low
if ( $minconfidence && $confidence < $minconfidence ) {
return ;
}
2015-09-22 12:29:06 +02:00
2017-11-05 14:59:45 +01:00
if ( ! $iso2 ) {
return ;
}
2015-09-22 12:29:06 +02:00
2018-04-01 08:31:37 +02:00
if ( ! in_array ( $iso2 , $read_languages_array )) {
2020-01-18 20:52:33 +01:00
$hook_data [ 'filter_reasons' ][] = DI :: l10n () -> t ( 'Filtered language: %s' , ucfirst ( $lang ));
2017-11-05 14:59:45 +01:00
}
2015-07-24 19:02:42 +02:00
}