diff options
author | Vsevolod Stakhov <vsevolod@rambler-co.ru> | 2011-06-03 20:23:13 +0400 |
---|---|---|
committer | Vsevolod Stakhov <vsevolod@rambler-co.ru> | 2011-06-03 20:23:13 +0400 |
commit | 92de380c2c5e8ce7073ce979df4e5c7868e52bb6 (patch) | |
tree | 27be3202d27f129f3d94d90298a4d1e0ecf2c281 /src/controller.c | |
parent | 83a9452974ec2f9c7be262a77e54a1ea2557c795 (diff) | |
download | rspamd-92de380c2c5e8ce7073ce979df4e5c7868e52bb6.tar.gz rspamd-92de380c2c5e8ce7073ce979df4e5c7868e52bb6.zip |
* Skip short utf words in statistics
Diffstat (limited to 'src/controller.c')
-rw-r--r-- | src/controller.c | 2 |
1 file changed, 1 insertion, 1 deletion
```diff
diff --git a/src/controller.c b/src/controller.c
index b29af9ee1..f69a90f8b 100644
--- a/src/controller.c
+++ b/src/controller.c
@@ -851,7 +851,7 @@ controller_read_socket (f_str_t * in, void *arg)
 	c.begin = part->content->data;
 	c.len = part->content->len;
 	if (!session->learn_classifier->tokenizer->tokenize_func (session->learn_classifier->tokenizer,
-		session->session_pool, &c, &tokens, FALSE)) {
+		session->session_pool, &c, &tokens, FALSE, part->is_utf)) {
 		i = rspamd_snprintf (out_buf, sizeof (out_buf), "weights failed, tokenizer error" CRLF END);
 		free_task (task, FALSE);
 		if (!rspamd_dispatcher_write (session->dispatcher, out_buf, i, FALSE, FALSE)) {
```