X-Git-Url: https://git.mxchange.org/?a=blobdiff_plain;f=langfilter%2Flangfilter.php;h=0aa136205025bce34e496ba6a14f2322eb6e4169;hb=d20e60ef9180ea7c0c921a03de5466a04b286565;hp=bbdc47fe2a9aae1bca18350692a2e4a532738128;hpb=5b2c4dfed90c1c49ec78b06652dfc4ce42a19946;p=friendica-addons.git diff --git a/langfilter/langfilter.php b/langfilter/langfilter.php index bbdc47fe..0aa13620 100644 --- a/langfilter/langfilter.php +++ b/langfilter/langfilter.php @@ -1,4 +1,5 @@ t("Language Filter"), - '$intro' => t ('This addon tries to identify the language of a postings. If it does not match any language spoken by you (see below) the posting will be collapsed. Remember detecting the language is not perfect, especially with short postings.'), - '$enabled' => array('langfilter_enable', t('Use the language filter'), $enable_checked, ''), - '$languages' => array('langfilter_languages', t('I speak'), $languages, t('List of abbreviations for languages you speak, comma seperated. For excample "de,it".') ), - '$submit' => t('Save Settings'), + $t = get_markup_template("settings.tpl", "addon/langfilter/"); + $s .= replace_macros($t, array( + '$title' => t("Language Filter"), + '$intro' => t('This addon tries to identify the language of a postings. If it does not match any language spoken by you (see below) the posting will be collapsed. Remember detecting the language is not perfect, especially with short postings.'), + '$enabled' => array('langfilter_enable', t('Use the language filter'), $enable_checked, ''), + '$languages' => array('langfilter_languages', t('I speak'), $languages, t('List of abbreviations (iso2 codes) for languages you speak, comma separated. For example "de,it".')), + '$minconfidence' => array('langfilter_minconfidence', t('Minimum confidence in language detection'), $minconfidence, t('Minimum confidence in language detection being correct, from 0 to 100. 
Posts will not be filtered when the confidence of language detection is below this percent value.')), + '$minlength' => array('langfilter_minlength', t('Minimum length of message body'), $minlength, t('Minimum length of message body for language filter to be used. Posts shorter than this number of characters will not be filtered.')), + '$submit' => t('Save Settings'), )); return; } + /* Save the settings * 1st check it's a logged in user calling * 2nd check the langfilter form is to be saved * 3rd save the settings to the DB for later usage */ -function langfilter_addon_settings_post(&$a,&$b) { - if(! local_user()) + +function langfilter_addon_settings_post(App $a, &$b) +{ + if (!local_user()) { return; + } + + if ($_POST['langfilter-settings-submit']) { + PConfig::set(local_user(), 'langfilter', 'languages', trim($_POST['langfilter_languages'])); + $enable = ((x($_POST, 'langfilter_enable')) ? intval($_POST['langfilter_enable']) : 0); + $disable = 1 - $enable; + PConfig::set(local_user(), 'langfilter', 'disable', $disable); + $minconfidence = 0 + $_POST['langfilter_minconfidence']; + if (!$minconfidence) { + $minconfidence = 0; + } elseif ($minconfidence < 0) { + $minconfidence = 0; + } elseif ($minconfidence > 100) { + $minconfidence = 100; + } + PConfig::set(local_user(), 'langfilter', 'minconfidence', $minconfidence / 100.0); - if($_POST['langfilter-settings-submit']) { - set_pconfig(local_user(),'langfilter','languages',trim($_POST['langfilter_languages'])); - $enable = ((x($_POST,'langfilter_enable')) ? intval($_POST['langfilter_enable']) : 0); - $disable = 1-$enable; - set_pconfig(local_user(),'langfilter','disable', $disable); - info( t('Language Filter Settings saved.') . EOL); + $minlength = 0 + $_POST['langfilter_minlength']; + if (!$minlength) { + $minlength = 32; + } elseif ($minlength < 0) { + $minlength = 32; + } + PConfig::set(local_user(), 'langfilter', 'minlength', $minlength); + + info(t('Language Filter Settings saved.') . 
EOL); } } + /* Actually filter postings by their language * 1st check if the user wants to filter postings * 2nd get the user settings which languages shall be not filtered out - * 3rd determine the language of a posting + * 3rd extract the language of a posting * 4th if the determined language does not fit to the spoken languages * of the user, then collapse the posting, but provide a link to * expand it again. */ -function langfilter_prepare_body(&$a,&$b) { - if(get_pconfig(local_user(),'langfilter','disable')) + +function langfilter_prepare_body(App $a, &$b) +{ + $logged_user = local_user(); + if (!$logged_user) { return; + } - # Never filter own messages - # TODO: find a better way to extract this + // Never filter own messages + // TODO: find a better way to extract this $logged_user_profile = $a->config['system']['url'] . '/profile/' . $a->user['nickname']; - if ( $logged_user_profile == $b['item']['author-link'] ) return; + if ($logged_user_profile == $b['item']['author-link']) { + return; + } - if(local_user()) { - $langs = get_pconfig(local_user(),'langfilter','languages'); + // Don't filter if language filter is disabled + if (PConfig::get($logged_user, 'langfilter', 'disable')) { + return; + } + + // Don't filter if body length is below minimum + $minlen = PConfig::get(local_user(), 'langfilter', 'minlength'); + if (!$minlen) { + $minlen = 32; } - if($langs) { - $arr = explode(',',$langs); - } else { + if (strlen($b['item']['body']) < $minlen) { return; } - $found = false; - $l = new Text_LanguageDetect; - $l->_name_mode = 2; // two letter codes - $l->_threshold = 600; // make it a bit harder to be confident with a lng - // IOW make it more possible that lng is correct - $lng = $l->detectSimple($b['html']); - if ($lng==null) + $spoken_config = PConfig::get(local_user(), 'langfilter', 'languages'); + $minconfidence = PConfig::get(local_user(), 'langfilter', 'minconfidence'); + + // Don't filter if no spoken languages are configured + if (!$spoken_config) 
return; - if (! in_array($lng, $arr)) - $found = true; - if ($lng==null) - $found = false; + $spoken_languages = explode(',', $spoken_config); + + // Extract the language of the post + $opts = $b['item']['postopts']; + if (!$opts) { + // no options associated to post + return; + } + if (!preg_match('/\blang=([^;]*);([^:]*)/', $opts, $matches)) { + // no lang options associated to post + return; + } + + $lang = $matches[1]; + $confidence = $matches[2]; + + // Do not filter if language detection confidence is too low + if ($minconfidence && $confidence < $minconfidence) { + return; + } + + $iso2 = Text_LanguageDetect_ISO639::nameToCode2($lang); + + if (!$iso2) { + return; + } + $spoken = in_array($iso2, $spoken_languages); - if($found) { + if (!$spoken) { $rnd = random_string(8); - $b['html'] = ''; + $b['html'] = ''; } } -?>