From: Vsevolod Stakhov Date: Mon, 15 Jan 2018 20:23:00 +0000 (+0000) Subject: [Minor] Another adjustment to lang_detection X-Git-Tag: 1.7.0~275 X-Git-Url: https://source.dussan.org/?a=commitdiff_plain;h=dc77c863434b31c195fd95c9b81b1a25dcc80385;p=rspamd.git [Minor] Another adjustment to lang_detection --- diff --git a/src/libmime/lang_detection.c b/src/libmime/lang_detection.c index 374e38f83..17042f1a9 100644 --- a/src/libmime/lang_detection.c +++ b/src/libmime/lang_detection.c @@ -751,7 +751,7 @@ rspamd_language_detector_detect (struct rspamd_lang_detector *d, /* Try to improve guess */ tcandidates = g_hash_table_new_full (rspamd_str_hash, rspamd_str_equal, NULL, g_free); - r = rspamd_language_detector_try_ngramm (d, ucs_tokens, rs_bigramm, + r = rspamd_language_detector_try_ngramm (d, ucs_tokens, rs_trigramm, tcandidates); switch (r) { @@ -789,15 +789,16 @@ rspamd_language_detector_detect (struct rspamd_lang_detector *d, g_hash_table_unref (candidates); candidates = tcandidates; - msg_err ("bigramms checked, %.3f mean, %.4f stddev", mean, std); + msg_err ("trigramms checked, %.3f mean, %.4f stddev", mean, std); - if (std / fabs (mean) < 0.3) { + if (std / fabs (mean) < 0.01) { /* Try trigramms */ tcandidates = g_hash_table_new_full (rspamd_str_hash, rspamd_str_equal, NULL, g_free); - r = rspamd_language_detector_try_ngramm (d, ucs_tokens, rs_trigramm, + r = rspamd_language_detector_try_ngramm (d, ucs_tokens, + rs_trigramm, tcandidates); if (r != rs_detect_none) {