2015-07-24 13:02:42 -04:00
< ? php
/*
 * Name: Language Filter
 * Version: 0.1
 * Description: Filters out postings in languages not spoken by the users
 * Author: Tobias Diekershoff <https://f.diekershoff.de/u/tobias>
 * License: MIT
 */
2017-11-05 08:59:45 -05:00
use Friendica\App ;
2018-04-21 18:47:18 -04:00
use Friendica\Content\Text\BBCode ;
2018-01-16 19:51:12 -05:00
use Friendica\Core\Addon ;
2018-01-22 14:03:11 -05:00
use Friendica\Core\L10n ;
2017-11-05 11:15:34 -05:00
use Friendica\Core\PConfig ;
2017-10-05 08:58:44 -04:00
2015-07-24 13:02:42 -04:00
/**
 * Registers the hooks this addon uses.
 *
 * The addon has a settings form, needs to save the submitted settings, and
 * wants to inspect the content of a posting when Friendica prepares it.
 */
function langfilter_install()
{
	$addon_file = 'addon/langfilter/langfilter.php';

	// The content filter is the only hook registered with an explicit priority (10).
	Addon::registerHook('prepare_body_content_filter', $addon_file, 'langfilter_prepare_body_content_filter', 10);

	// Rendering and saving of the per-user settings form.
	Addon::registerHook('addon_settings', $addon_file, 'langfilter_addon_settings');
	Addon::registerHook('addon_settings_post', $addon_file, 'langfilter_addon_settings_post');
}
2017-11-05 08:59:45 -05:00
/**
 * Unregisters the hooks of this addon.
 *
 * Besides the three hooks registered by langfilter_install(), the
 * 'prepare_body' hook is unregistered as well. NOTE(review): nothing in this
 * file registers it; presumably it cleans up after an older version of the
 * addon - confirm before removing.
 */
function langfilter_uninstall()
{
	$addon_file = 'addon/langfilter/langfilter.php';

	// Hook name => callback, in the order they are unregistered.
	$callbacks_by_hook = [
		'prepare_body_content_filter' => 'langfilter_prepare_body_content_filter',
		'prepare_body'                => 'langfilter_prepare_body',
		'addon_settings'              => 'langfilter_addon_settings',
		'addon_settings_post'         => 'langfilter_addon_settings_post',
	];

	foreach ($callbacks_by_hook as $hook_name => $callback) {
		Addon::unregisterHook($hook_name, $addon_file, $callback);
	}
}
/**
 * Renders the settings form of the addon.
 *
 * 1st: check that a logged-in user is calling
 * 2nd: get the current settings of that user
 * 3rd: parse a Smarty3 template, filling in the translatable strings of the form
 *
 * @param App    $a Not used by this function.
 * @param string $s Settings page markup; the rendered form is appended to it.
 */
function langfilter_addon_settings(App $a, &$s)
{
	$uid = local_user();
	if (!$uid) {
		return;
	}

	// The setting is stored inverted ("disable"), so the box is checked when it is falsy.
	$enable_checked = (intval(PConfig::get($uid, 'langfilter', 'disable')) ? '' : ' checked="checked" ');
	$languages      = PConfig::get($uid, 'langfilter', 'languages');
	// Stored as a fraction (see langfilter_addon_settings_post), shown as a percentage.
	// floatval() keeps the multiplication safe when nothing has been stored yet.
	$minconfidence  = floatval(PConfig::get($uid, 'langfilter', 'minconfidence')) * 100;
	$minlength      = PConfig::get($uid, 'langfilter', 'minlength');

	// Template name and directory must not carry surrounding whitespace,
	// otherwise the template file cannot be resolved.
	$t = get_markup_template('settings.tpl', 'addon/langfilter/');
	$s .= replace_macros($t, [
		'$title'         => L10n::t('Language Filter'),
		'$intro'         => L10n::t('This addon tries to identify the language posts are writen in. If it does not match any language specifed below, posts will be hidden by collapsing them.'),
		'$enabled'       => ['langfilter_enable', L10n::t('Use the language filter'), $enable_checked, ''],
		'$languages'     => ['langfilter_languages', L10n::t('Able to read'), $languages, L10n::t('List of abbreviations (iso2 codes) for languages you speak, comma separated. For example "de,it".')],
		'$minconfidence' => ['langfilter_minconfidence', L10n::t('Minimum confidence in language detection'), $minconfidence, L10n::t('Minimum confidence in language detection being correct, from 0 to 100. Posts will not be filtered when the confidence of language detection is below this percent value.')],
		'$minlength'     => ['langfilter_minlength', L10n::t('Minimum length of message body'), $minlength, L10n::t('Minimum number of characters in message body for filter to be used. Posts shorter than this will not be filtered. Note: Language detection is unreliable for short content (<200 characters).')],
		'$submit'        => L10n::t('Save Settings'),
	]);
}
2017-11-05 08:59:45 -05:00
2015-07-24 13:02:42 -04:00
/**
 * Saves the settings of the addon.
 *
 * 1st: check that a logged-in user is calling
 * 2nd: check that the langfilter form is the one being saved
 * 3rd: save the settings to the DB for later usage
 *
 * @param App   $a Not used by this function.
 * @param mixed $b Hook data; not used by this function.
 */
function langfilter_addon_settings_post(App $a, &$b)
{
	$uid = local_user();
	if (!$uid) {
		return;
	}

	// Only act when our own form was submitted.
	if (empty($_POST['langfilter-settings-submit'])) {
		return;
	}

	$languages = isset($_POST['langfilter_languages']) ? trim($_POST['langfilter_languages']) : '';
	PConfig::set($uid, 'langfilter', 'languages', $languages);

	// The checkbox means "enabled" but the stored flag is "disable"; store a
	// strict 0/1 so an unexpected value can never invert the meaning.
	$enable = !empty($_POST['langfilter_enable']) ? intval($_POST['langfilter_enable']) : 0;
	PConfig::set($uid, 'langfilter', 'disable', $enable ? 0 : 1);

	// Entered as a percentage and clamped to 0..100; stored as a fraction (0..1).
	// floatval() maps missing or non-numeric input to 0 instead of raising an error.
	$minconfidence = isset($_POST['langfilter_minconfidence']) ? floatval($_POST['langfilter_minconfidence']) : 0;
	$minconfidence = max(0, min(100, $minconfidence));
	PConfig::set($uid, 'langfilter', 'minconfidence', $minconfidence / 100.0);

	// Missing, zero, negative or non-numeric values fall back to the default of 32.
	$minlength = isset($_POST['langfilter_minlength']) ? intval($_POST['langfilter_minlength']) : 0;
	if ($minlength <= 0) {
		$minlength = 32;
	}
	PConfig::set($uid, 'langfilter', 'minlength', $minlength);

	info(L10n::t('Language Filter Settings saved.') . EOL);
}
2017-11-05 08:59:45 -05:00
2015-07-24 13:02:42 -04:00
/**
 * Actually filters postings by their language.
 *
 * 1st: check whether the user wants postings to be filtered
 * 2nd: get the user settings for the languages that shall not be filtered out
 * 3rd: extract the language of the posting
 * 4th: if the determined language is not one of the user's languages, add a
 *      filter reason to the hook data
 *
 * @param App   $a         Supplies the base URL and the logged-in user's nickname.
 * @param array $hook_data Reads $hook_data['item'] ('author-link', 'body',
 *                         'language', 'postopts'); may append an entry to
 *                         $hook_data['filter_reasons'].
 */
function langfilter_prepare_body_content_filter(App $a, &$hook_data)
{
	$logged_user = local_user();
	if (!$logged_user) {
		return;
	}

	// Never filter own messages
	// TODO: find a better way to extract this
	$logged_user_profile = $a->get_baseurl() . '/profile/' . $a->user['nickname'];
	if ($logged_user_profile == $hook_data['item']['author-link']) {
		return;
	}

	// Don't filter if language filter is disabled
	if (PConfig::get($logged_user, 'langfilter', 'disable')) {
		return;
	}

	$naked_body = BBCode::toPlaintext($hook_data['item']['body'], false);

	// Don't filter if body length is below minimum. The setting is expressed
	// in characters, so count characters rather than bytes.
	$minlen = PConfig::get($logged_user, 'langfilter', 'minlength', 32);
	if (!$minlen) {
		$minlen = 32;
	}
	if (mb_strlen($naked_body, 'UTF-8') < $minlen) {
		return;
	}

	$read_languages_string = PConfig::get($logged_user, 'langfilter', 'languages');
	$minconfidence = PConfig::get($logged_user, 'langfilter', 'minconfidence');

	// Don't filter if no spoken languages are configured
	if (!$read_languages_string) {
		return;
	}

	// Tolerate input such as "de, IT": trim each code, fold case and drop
	// empty entries so that the comparison below can match.
	$read_languages_array = array_filter(
		array_map('trim', explode(',', strtolower($read_languages_string))),
		'strlen'
	);
	if (!$read_languages_array) {
		return;
	}

	// Extract the language of the post
	if (!empty($hook_data['item']['language'])) {
		$languages = json_decode($hook_data['item']['language'], true);
		if (!is_array($languages) || !$languages) {
			// Not a usable code => confidence map
			return;
		}

		// Only the first entry of the map is considered.
		reset($languages);
		$iso2 = (string) key($languages);
		$confidence = current($languages);

		$lang = Text_LanguageDetect_ISO639::code2ToName($iso2);
	} else {
		if (empty($hook_data['item']['postopts'])) {
			// no options associated to post
			return;
		}
		$opts = $hook_data['item']['postopts'];

		if (!preg_match('/\blang=([^;]*);([^:]*)/', $opts, $matches)) {
			// no lang options associated to post
			return;
		}

		$lang = $matches[1];
		$confidence = $matches[2];
		$iso2 = Text_LanguageDetect_ISO639::nameToCode2($lang);
	}

	// Do not filter if language detection confidence is too low
	if ($minconfidence && $confidence < $minconfidence) {
		return;
	}

	if (!$iso2) {
		return;
	}

	if (!in_array($iso2, $read_languages_array, true)) {
		// Fall back to the code when no language name is available.
		$lang_label = $lang ? $lang : $iso2;
		$hook_data['filter_reasons'][] = L10n::t('Filtered language: %s', ucfirst($lang_label));
	}
}