diff options
author | Vsevolod Stakhov <vsevolod@highsecure.ru> | 2015-10-06 16:14:29 +0100 |
---|---|---|
committer | Vsevolod Stakhov <vsevolod@highsecure.ru> | 2015-10-06 16:14:29 +0100 |
commit | d70fb7a4a7938936295a1ec263eba607adb26f69 (patch) | |
tree | 51bbef6ac3c702f7a2535ed1a66b7504433e5595 /src/libstat | |
parent | 2097ac107b192d6c244244ca425d012ebfcff09c (diff) | |
download | rspamd-d70fb7a4a7938936295a1ec263eba607adb26f69.tar.gz rspamd-d70fb7a4a7938936295a1ec263eba607adb26f69.zip |
Fix statistics.
Diffstat (limited to 'src/libstat')
-rw-r--r-- | src/libstat/learn_cache/sqlite3_cache.c | 4 | ||||
-rw-r--r-- | src/libstat/stat_process.c | 4 | ||||
-rw-r--r-- | src/libstat/tokenizers/osb.c | 4 | ||||
-rw-r--r-- | src/libstat/tokenizers/tokenizers.c | 27 | ||||
-rw-r--r-- | src/libstat/tokenizers/tokenizers.h | 2 |
5 files changed, 20 insertions, 21 deletions
diff --git a/src/libstat/learn_cache/sqlite3_cache.c b/src/libstat/learn_cache/sqlite3_cache.c index 6eabaefda..987f6cb0c 100644 --- a/src/libstat/learn_cache/sqlite3_cache.c +++ b/src/libstat/learn_cache/sqlite3_cache.c @@ -247,7 +247,7 @@ rspamd_stat_cache_sqlite3_process (struct rspamd_task *task, struct rspamd_stat_sqlite3_ctx *ctx = (struct rspamd_stat_sqlite3_ctx *)c; struct mime_text_part *part; blake2b_state st; - rspamd_fstring_t *word; + rspamd_ftok_t *word; guchar out[BLAKE2B_OUTBYTES]; guint i, j; @@ -259,7 +259,7 @@ rspamd_stat_cache_sqlite3_process (struct rspamd_task *task, if (part->words != NULL) { for (j = 0; j < part->words->len; j ++) { - word = &g_array_index (part->words, rspamd_fstring_t, j); + word = &g_array_index (part->words, rspamd_ftok_t, j); blake2b_update (&st, word->begin, word->len); } } diff --git a/src/libstat/stat_process.c b/src/libstat/stat_process.c index a6f5d31ae..a1cbe9c33 100644 --- a/src/libstat/stat_process.c +++ b/src/libstat/stat_process.c @@ -52,7 +52,7 @@ rspamd_stat_tokenize_header (struct rspamd_task *task, const gchar *name, const gchar *prefix, GArray *ar) { struct raw_header *rh, *cur; - rspamd_fstring_t str; + rspamd_ftok_t str; rh = g_hash_table_lookup (task->raw_headers, name); @@ -89,7 +89,7 @@ rspamd_stat_tokenize_parts_metadata (struct rspamd_task *task, struct mime_text_part *tp; GList *cur; GArray *ar; - rspamd_fstring_t elt; + rspamd_ftok_t elt; guint i; ar = g_array_sized_new (FALSE, FALSE, sizeof (elt), 4); diff --git a/src/libstat/tokenizers/osb.c b/src/libstat/tokenizers/osb.c index 690a7ab5b..7744e2883 100644 --- a/src/libstat/tokenizers/osb.c +++ b/src/libstat/tokenizers/osb.c @@ -232,7 +232,7 @@ rspamd_tokenizer_osb (struct rspamd_tokenizer_runtime *rt, const gchar *prefix) { rspamd_token_t *new = NULL; - rspamd_fstring_t *token; + rspamd_ftok_t *token; struct rspamd_osb_tokenizer_config *osb_cf; guint64 *hashpipe, cur, seed; guint32 h1, h2; @@ -259,7 +259,7 @@ rspamd_tokenizer_osb (struct rspamd_tokenizer_runtime *rt, memset (hashpipe, 0xfe, window_size * sizeof (hashpipe[0])); for (w = 0; w < input->len; w ++) { - token = &g_array_index (input, rspamd_fstring_t, w); + token = &g_array_index (input, rspamd_ftok_t, w); if (osb_cf->ht == RSPAMD_OSB_HASH_COMPAT) { cur = rspamd_fstrhash_lc (token, is_utf); diff --git a/src/libstat/tokenizers/tokenizers.c b/src/libstat/tokenizers/tokenizers.c index 07e7a1f45..439c639a6 100644 --- a/src/libstat/tokenizers/tokenizers.c +++ b/src/libstat/tokenizers/tokenizers.c @@ -30,8 +30,8 @@ #include "tokenizers.h" #include "stat_internal.h" -typedef gboolean (*token_get_function) (rspamd_fstring_t * buf, gchar **pos, - rspamd_fstring_t * token, +typedef gboolean (*token_get_function) (rspamd_ftok_t * buf, gchar const **pos, + rspamd_ftok_t * token, GList **exceptions, gboolean is_utf, gsize *rl, gboolean check_signature); const gchar t_delimiters[255] = { @@ -77,12 +77,12 @@ token_node_compare_func (gconstpointer a, gconstpointer b) /* Get next word from specified f_str_t buf */ static gboolean -rspamd_tokenizer_get_word_compat (rspamd_fstring_t * buf, - gchar **cur, rspamd_fstring_t * token, +rspamd_tokenizer_get_word_compat (rspamd_ftok_t * buf, + gchar const **cur, rspamd_ftok_t * token, GList **exceptions, gboolean is_utf, gsize *rl, gboolean unused) { gsize remain, pos; - guchar *p; + const gchar *p; struct process_exception *ex = NULL; if (buf == NULL) { @@ -134,11 +134,11 @@ rspamd_tokenizer_get_word_compat (rspamd_fstring_t * buf, pos++; p++; remain--; - } while (remain > 0 && t_delimiters[*p]); + } while (remain > 0 && t_delimiters[(guchar)*p]); token->begin = p; - while (remain > 0 && !t_delimiters[*p]) { + while (remain > 0 && !t_delimiters[(guchar)*p]) { if (ex != NULL && ex->pos == pos) { *exceptions = g_list_next (*exceptions); *cur = p + ex->len; @@ -169,13 +169,13 @@ rspamd_tokenizer_get_word_compat (rspamd_fstring_t * buf, } static gboolean -rspamd_tokenizer_get_word (rspamd_fstring_t * buf, - gchar **cur, rspamd_fstring_t * token, +rspamd_tokenizer_get_word (rspamd_ftok_t * buf, + gchar const **cur, rspamd_ftok_t * token, GList **exceptions, gboolean is_utf, gsize *rl, gboolean check_signature) { gsize remain, pos, siglen = 0; - gchar *p, *next_p, *sig = NULL; + const gchar *p, *next_p, *sig = NULL; gunichar uc; guint processed = 0; struct process_exception *ex = NULL; @@ -292,8 +292,8 @@ rspamd_tokenize_text (gchar *text, gsize len, gboolean is_utf, gsize min_len, GList *exceptions, gboolean compat, gboolean check_signature) { - rspamd_fstring_t token, buf; - gchar *pos = NULL; + rspamd_ftok_t token, buf; + const gchar *pos = NULL; gsize l; GArray *res; GList *cur = exceptions; @@ -305,7 +305,6 @@ rspamd_tokenize_text (gchar *text, gsize len, gboolean is_utf, buf.begin = text; buf.len = len; - buf.size = buf.len; token.begin = NULL; token.len = 0; @@ -316,7 +315,7 @@ rspamd_tokenize_text (gchar *text, gsize len, gboolean is_utf, func = rspamd_tokenizer_get_word; } - res = g_array_sized_new (FALSE, FALSE, sizeof (rspamd_fstring_t), 128); + res = g_array_sized_new (FALSE, FALSE, sizeof (rspamd_ftok_t), 128); while (func (&buf, &pos, &token, &cur, is_utf, &l, FALSE)) { if (l == 0 || (min_len > 0 && l < min_len)) { diff --git a/src/libstat/tokenizers/tokenizers.h b/src/libstat/tokenizers/tokenizers.h index 7b01d9fe8..4689d1cc6 100644 --- a/src/libstat/tokenizers/tokenizers.h +++ b/src/libstat/tokenizers/tokenizers.h @@ -33,7 +33,7 @@ struct rspamd_stat_tokenizer { gint token_node_compare_func (gconstpointer a, gconstpointer b); -/* Tokenize text into array of words (rspamd_fstring_t type) */ +/* Tokenize text into array of words (rspamd_ftok_t type) */ GArray * rspamd_tokenize_text (gchar *text, gsize len, gboolean is_utf, gsize min_len, GList *exceptions, gboolean compat, gboolean check_signature); |