diff options
author | Vsevolod Stakhov <vsevolod@highsecure.ru> | 2018-09-05 17:43:20 +0100 |
---|---|---|
committer | Vsevolod Stakhov <vsevolod@highsecure.ru> | 2018-09-05 17:44:35 +0100 |
commit | a64ce9b4245153e68fbbcd9c6610b9c1ccf76493 (patch) | |
tree | b9b9798b77974cf8d0793c948966a95963266771 /src/plugins/chartable.c | |
parent | 3807688a67be66d00a24172c13b00b6fb1816d69 (diff) | |
download | rspamd-a64ce9b4245153e68fbbcd9c6610b9c1ccf76493.tar.gz rspamd-a64ce9b4245153e68fbbcd9c6610b9c1ccf76493.zip |
[Rework] Rework utf content processing in text parts
- Store unicode in UTF parts
- Store unicode for HTML parts
- Rename struct fields and split them into unicode/utf components
Diffstat (limited to 'src/plugins/chartable.c')
-rw-r--r-- | src/plugins/chartable.c | 10 |
1 file changed, 5 insertions, 5 deletions
diff --git a/src/plugins/chartable.c b/src/plugins/chartable.c index 987879258..3c7157311 100644 --- a/src/plugins/chartable.c +++ b/src/plugins/chartable.c @@ -560,13 +560,13 @@ rspamd_chartable_process_part (struct rspamd_task *task, guint i, ncap = 0; gdouble cur_score = 0.0; - if (part == NULL || part->normalized_words == NULL || - part->normalized_words->len == 0) { + if (part == NULL || part->utf_words == NULL || + part->utf_words->len == 0) { return; } - for (i = 0; i < part->normalized_words->len; i++) { - w = &g_array_index (part->normalized_words, rspamd_stat_token_t, i); + for (i = 0; i < part->utf_words->len; i++) { + w = &g_array_index (part->utf_words, rspamd_stat_token_t, i); if (w->len > 0 && (w->flags & RSPAMD_STAT_TOKEN_FLAG_TEXT)) { @@ -588,7 +588,7 @@ rspamd_chartable_process_part (struct rspamd_task *task, */ part->capital_letters += ncap; - cur_score /= (gdouble)part->normalized_words->len; + cur_score /= (gdouble)part->utf_words->len; if (cur_score > 2.0) { cur_score = 2.0; |