2015-07-24 19:02:42 +02:00
< ? php
/*
* Name : Language Filter
* Version : 0.1
* Description : Filters out postings in languages not spoken by the users
* Author : Tobias Diekershoff < https :// f . diekershoff . de / u / tobias >
* License : MIT
*/
2017-11-05 08:59:45 -05:00
use Friendica\App ;
2018-04-21 18:47:18 -04:00
use Friendica\Content\Text\BBCode ;
2018-12-26 02:28:16 -05:00
use Friendica\Core\Hook ;
2018-10-31 10:55:15 -04:00
use Friendica\Core\Renderer ;
2019-12-16 01:05:14 +01:00
use Friendica\DI ;
2017-10-05 14:58:44 +02:00
2015-07-24 19:02:42 +02:00
/* Define the hooks we want to use
* that is , we have settings , we need to save the settings and we want
* to modify the content of a posting when friendica prepares it .
*/
2017-11-05 08:59:45 -05:00
function langfilter_install ()
{
2018-12-26 02:28:16 -05:00
Hook :: register ( 'prepare_body_content_filter' , 'addon/langfilter/langfilter.php' , 'langfilter_prepare_body_content_filter' , 10 );
Hook :: register ( 'addon_settings' , 'addon/langfilter/langfilter.php' , 'langfilter_addon_settings' );
Hook :: register ( 'addon_settings_post' , 'addon/langfilter/langfilter.php' , 'langfilter_addon_settings_post' );
2015-07-24 19:02:42 +02:00
}
2017-11-05 08:59:45 -05:00
2015-07-24 19:02:42 +02:00
/* The settings
* 1 st check if somebody logged in is calling
* 2 nd get the current settings
* 3 rd parse a SMARTY3 template , replacing some translateable strings for the form
*/
2017-11-05 08:59:45 -05:00
2021-11-20 04:56:55 -05:00
function langfilter_addon_settings ( App $a , array & $data )
2017-11-05 08:59:45 -05:00
{
if ( ! local_user ()) {
2015-07-24 19:02:42 +02:00
return ;
2017-11-05 08:59:45 -05:00
}
2020-02-01 14:14:22 -05:00
$enabled = DI :: pConfig () -> get ( local_user (), 'langfilter' , 'enable' ,
! DI :: pConfig () -> get ( local_user (), 'langfilter' , 'disable' ));
2021-11-20 04:56:55 -05:00
$languages = DI :: pConfig () -> get ( local_user (), 'langfilter' , 'languages' );
$minconfidence = DI :: pConfig () -> get ( local_user (), 'langfilter' , 'minconfidence' , 0 ) * 100 ;
$minlength = DI :: pConfig () -> get ( local_user (), 'langfilter' , 'minlength' , 32 );
2015-07-24 19:02:42 +02:00
2021-11-20 04:56:55 -05:00
$t = Renderer :: getMarkupTemplate ( 'settings.tpl' , 'addon/langfilter/' );
$html = Renderer :: replaceMacros ( $t , [
2021-03-24 23:33:42 +01:00
'$intro' => DI :: l10n () -> t ( 'This addon tries to identify the language posts are written in. If it does not match any language specified below, posts will be hidden by collapsing them.' ),
2021-11-20 04:56:55 -05:00
'$enabled' => [ 'langfilter_enable' , DI :: l10n () -> t ( 'Use the language filter' ), $enabled ],
2020-10-03 22:02:05 -04:00
'$languages' => [ 'langfilter_languages' , DI :: l10n () -> t ( 'Able to read' ), $languages , DI :: l10n () -> t ( 'List of abbreviations (ISO 639-1 codes) for languages you speak, comma separated. For example "de,it".' )],
2020-01-18 20:52:33 +01:00
'$minconfidence' => [ 'langfilter_minconfidence' , DI :: l10n () -> t ( 'Minimum confidence in language detection' ), $minconfidence , DI :: l10n () -> t ( 'Minimum confidence in language detection being correct, from 0 to 100. Posts will not be filtered when the confidence of language detection is below this percent value.' )],
'$minlength' => [ 'langfilter_minlength' , DI :: l10n () -> t ( 'Minimum length of message body' ), $minlength , DI :: l10n () -> t ( 'Minimum number of characters in message body for filter to be used. Posts shorter than this will not be filtered. Note: Language detection is unreliable for short content (<200 characters).' )],
2018-01-15 08:15:33 -05:00
]);
2015-07-24 19:02:42 +02:00
2021-11-20 04:56:55 -05:00
$data = [
'addon' => 'langfilter' ,
'title' => DI :: l10n () -> t ( 'Language Filter' ),
'html' => $html ,
'submit' => [ 'langfilter-settings-submit' => DI :: l10n () -> t ( 'Save Settings' )],
];
2015-07-24 19:02:42 +02:00
}
2017-11-05 08:59:45 -05:00
2015-07-24 19:02:42 +02:00
/* Save the settings
* 1 st check it ' s a logged in user calling
* 2 nd check the langfilter form is to be saved
* 3 rd save the settings to the DB for later usage
*/
2017-11-05 08:59:45 -05:00
function langfilter_addon_settings_post ( App $a , & $b )
{
if ( ! local_user ()) {
2015-07-24 19:02:42 +02:00
return ;
2017-11-05 08:59:45 -05:00
}
2015-07-24 19:02:42 +02:00
2018-08-08 06:24:47 +00:00
if ( ! empty ( $_POST [ 'langfilter-settings-submit' ])) {
2020-02-01 14:14:22 -05:00
$enable = intval ( $_POST [ 'langfilter_enable' ] ? ? 0 );
$languages = trim ( $_POST [ 'langfilter_languages' ] ? ? '' );
$minconfidence = max ( 0 , min ( 100 , intval ( $_POST [ 'langfilter_minconfidence' ] ? ? 0 ))) / 100 ;
$minlength = intval ( $_POST [ 'langfilter_minlength' ] ? ? 32 );
if ( $minlength <= 0 ) {
2017-11-05 08:59:45 -05:00
$minlength = 32 ;
}
2020-02-01 14:14:22 -05:00
DI :: pConfig () -> set ( local_user (), 'langfilter' , 'enable' , $enable );
DI :: pConfig () -> set ( local_user (), 'langfilter' , 'languages' , $languages );
DI :: pConfig () -> set ( local_user (), 'langfilter' , 'minconfidence' , $minconfidence );
DI :: pConfig () -> set ( local_user (), 'langfilter' , 'minlength' , $minlength );
2015-07-24 19:02:42 +02:00
}
}
2017-11-05 08:59:45 -05:00
2015-07-24 19:02:42 +02:00
/* Actually filter postings by their language
* 1 st check if the user wants to filter postings
* 2 nd get the user settings which languages shall be not filtered out
2015-09-22 12:29:06 +02:00
* 3 rd extract the language of a posting
2015-07-24 19:02:42 +02:00
* 4 th if the determined language does not fit to the spoken languages
* of the user , then collapse the posting , but provide a link to
* expand it again .
*/
2018-04-04 22:51:44 -04:00
function langfilter_prepare_body_content_filter ( App $a , & $hook_data )
2017-11-05 08:59:45 -05:00
{
$logged_user = local_user ();
if ( ! $logged_user ) {
return ;
}
2015-09-09 19:41:38 +02:00
2017-11-05 08:59:45 -05:00
// Never filter own messages
// TODO: find a better way to extract this
2021-08-09 19:49:06 +00:00
$logged_user_profile = DI :: baseUrl () -> get () . '/profile/' . $a -> getLoggedInUserNickname ();
2018-04-01 02:31:37 -04:00
if ( $logged_user_profile == $hook_data [ 'item' ][ 'author-link' ]) {
2017-11-05 08:59:45 -05:00
return ;
}
2015-07-24 19:02:42 +02:00
2017-11-05 08:59:45 -05:00
// Don't filter if language filter is disabled
2020-02-01 14:14:22 -05:00
if ( ! DI :: pConfig () -> get ( $logged_user , 'langfilter' , 'enable' ,
! DI :: pConfig () -> get ( $logged_user , 'langfilter' , 'disable' ))
) {
2017-11-05 08:59:45 -05:00
return ;
}
2015-09-10 09:54:26 +02:00
2022-01-19 09:49:56 -05:00
$naked_body = strip_tags (
$hook_data [ 'item' ][ 'rendered-html' ]
? ? '' ? : // Equivalent of !empty()
2022-01-20 09:23:31 -05:00
BBCode :: convert ( $hook_data [ 'item' ][ 'body' ], false , BBCode :: ACTIVITYPUB , true )
2022-01-19 09:49:56 -05:00
);
$naked_body = preg_replace ( '#\s+#' , ' ' , trim ( $naked_body ));
2018-04-21 04:13:53 -04:00
2017-11-05 08:59:45 -05:00
// Don't filter if body lenght is below minimum
2020-01-18 16:50:56 +01:00
$minlen = DI :: pConfig () -> get ( local_user (), 'langfilter' , 'minlength' , 32 );
2017-11-05 08:59:45 -05:00
if ( ! $minlen ) {
$minlen = 32 ;
}
2018-04-21 04:13:53 -04:00
if ( strlen ( $naked_body ) < $minlen ) {
2017-11-05 08:59:45 -05:00
return ;
}
2016-10-01 18:15:32 +02:00
2020-01-18 16:50:56 +01:00
$read_languages_string = DI :: pConfig () -> get ( local_user (), 'langfilter' , 'languages' );
$minconfidence = DI :: pConfig () -> get ( local_user (), 'langfilter' , 'minconfidence' );
2015-09-22 12:29:06 +02:00
2017-11-05 08:59:45 -05:00
// Don't filter if no spoken languages are configured
2018-04-01 02:31:37 -04:00
if ( ! $read_languages_string ) {
2017-11-05 08:59:45 -05:00
return ;
2018-04-01 02:31:37 -04:00
}
$read_languages_array = explode ( ',' , $read_languages_string );
2015-09-22 12:29:06 +02:00
2020-10-03 22:00:44 -04:00
$iso639 = new Matriphe\ISO639\ISO639 ;
2017-11-05 08:59:45 -05:00
// Extract the language of the post
2018-06-30 05:20:17 +00:00
if ( ! empty ( $hook_data [ 'item' ][ 'language' ])) {
$languages = json_decode ( $hook_data [ 'item' ][ 'language' ], true );
if ( ! is_array ( $languages )) {
return ;
}
2018-04-01 02:31:37 -04:00
2018-06-30 05:20:17 +00:00
foreach ( $languages as $iso2 => $confidence ) {
break ;
}
2015-09-22 12:29:06 +02:00
2018-08-31 05:10:53 +00:00
if ( empty ( $iso2 )) {
return ;
}
2020-10-03 22:00:44 -04:00
$lang = $iso639 -> languageByCode1 ( $iso2 );
2018-06-30 05:20:17 +00:00
} else {
$opts = $hook_data [ 'item' ][ 'postopts' ];
if ( ! $opts ) {
// no options associated to post
return ;
}
if ( ! preg_match ( '/\blang=([^;]*);([^:]*)/' , $opts , $matches )) {
// no lang options associated to post
return ;
}
$lang = $matches [ 1 ];
$confidence = $matches [ 2 ];
2020-10-03 22:00:44 -04:00
$iso2 = $iso639 -> code1ByLanguage ( $lang );
2018-06-30 05:20:17 +00:00
}
2015-09-22 12:29:06 +02:00
2017-11-05 08:59:45 -05:00
// Do not filter if language detection confidence is too low
if ( $minconfidence && $confidence < $minconfidence ) {
return ;
}
2015-09-22 12:29:06 +02:00
2017-11-05 08:59:45 -05:00
if ( ! $iso2 ) {
return ;
}
2015-09-22 12:29:06 +02:00
2018-04-01 02:31:37 -04:00
if ( ! in_array ( $iso2 , $read_languages_array )) {
2020-01-18 20:52:33 +01:00
$hook_data [ 'filter_reasons' ][] = DI :: l10n () -> t ( 'Filtered language: %s' , ucfirst ( $lang ));
2017-11-05 08:59:45 -05:00
}
2015-07-24 19:02:42 +02:00
}