diff options
author | Vsevolod Stakhov <vsevolod@highsecure.ru> | 2020-02-24 11:59:40 +0000 |
---|---|---|
committer | Vsevolod Stakhov <vsevolod@highsecure.ru> | 2020-02-24 11:59:40 +0000 |
commit | cfdf17ea1a26abce66d11319a02faaa33132cf9e (patch) | |
tree | 43e500a7a2837d3a02d779c7ca244b3d50ae0d6b /src/plugins | |
parent | e0e0d361a445a4f5cca9bdc77a23dbdfe75bebed (diff) | |
download | rspamd-cfdf17ea1a26abce66d11319a02faaa33132cf9e.tar.gz rspamd-cfdf17ea1a26abce66d11319a02faaa33132cf9e.zip |
[Fix] Avoid collisions in mempool variables by changing fuzzy caching logic
Diffstat (limited to 'src/plugins')
-rw-r--r-- | src/plugins/fuzzy_check.c | 68 |
1 files changed, 47 insertions, 21 deletions
diff --git a/src/plugins/fuzzy_check.c b/src/plugins/fuzzy_check.c index 4df88e2a8..475417147 100644 --- a/src/plugins/fuzzy_check.c +++ b/src/plugins/fuzzy_check.c @@ -1343,35 +1343,59 @@ struct rspamd_cached_shingles { guchar digest[rspamd_cryptobox_HASHBYTES]; }; + static struct rspamd_cached_shingles * fuzzy_cmd_get_cached (struct fuzzy_rule *rule, - rspamd_mempool_t *pool, - gpointer p) + struct rspamd_task *task, + struct rspamd_mime_part *mp) { gchar key[32]; gint key_part; + struct rspamd_cached_shingles **cached; memcpy (&key_part, rule->shingles_key->str, sizeof (key_part)); - rspamd_snprintf (key, sizeof (key), "%p%s%d", p, rule->algorithm_str, + rspamd_snprintf (key, sizeof (key), "%s%d", rule->algorithm_str, key_part); - return rspamd_mempool_get_variable (pool, key); + cached = (struct rspamd_cached_shingles **)rspamd_mempool_get_variable ( + task->task_pool, key); + + if (cached && cached[mp->part_number]) { + return cached[mp->part_number]; + } + + return NULL; } static void fuzzy_cmd_set_cached (struct fuzzy_rule *rule, - rspamd_mempool_t *pool, - gpointer p, - struct rspamd_cached_shingles *data) + struct rspamd_task *task, + struct rspamd_mime_part *mp, + struct rspamd_cached_shingles *data) { gchar key[32]; gint key_part; + struct rspamd_cached_shingles **cached; memcpy (&key_part, rule->shingles_key->str, sizeof (key_part)); - rspamd_snprintf (key, sizeof (key), "%p%s%d", p, rule->algorithm_str, + rspamd_snprintf (key, sizeof (key), "%s%d", rule->algorithm_str, key_part); - /* Key is copied */ - rspamd_mempool_set_variable (pool, key, data, NULL); + + cached = (struct rspamd_cached_shingles **)rspamd_mempool_get_variable ( + task->task_pool, key); + + if (cached) { + cached[mp->part_number] = data; + } + else { + cached = rspamd_mempool_alloc0 (task->task_pool, sizeof (*cached) * + (MESSAGE_FIELD (task, parts)->len + 1)); + cached[mp->part_number] = data; + + rspamd_mempool_set_variable (task->task_pool, key, cached, NULL); + } + + } static gboolean @@ -1447,7 +1471,7 @@ fuzzy_cmd_from_text_part (struct rspamd_task *task, GArray *words; struct fuzzy_cmd_io *io; - cached = fuzzy_cmd_get_cached (rule, pool, mp); + cached = fuzzy_cmd_get_cached (rule, task, mp); if (cached) { /* Copy cached */ @@ -1538,7 +1562,7 @@ fuzzy_cmd_from_text_part (struct rspamd_task *task, * Since it is copied when obtained from the cache, it is safe to use * it this way. */ - fuzzy_cmd_set_cached (rule, pool, mp, cached); + fuzzy_cmd_set_cached (rule, task, mp, cached); } io = rspamd_mempool_alloc (pool, sizeof (*io)); @@ -1601,12 +1625,13 @@ fuzzy_cmd_from_text_part (struct rspamd_task *task, return io; } +#if 0 static struct fuzzy_cmd_io * fuzzy_cmd_from_image_part (struct fuzzy_rule *rule, int c, gint flag, guint32 weight, - rspamd_mempool_t *pool, + struct rspamd_task *task, struct rspamd_image *img, struct rspamd_mime_part *mp) { @@ -1616,11 +1641,11 @@ fuzzy_cmd_from_image_part (struct fuzzy_rule *rule, struct rspamd_shingle *sh; struct rspamd_cached_shingles *cached; - cached = fuzzy_cmd_get_cached (rule, pool, mp); + cached = fuzzy_cmd_get_cached (rule, task, mp); if (cached) { /* Copy cached */ - encshcmd = rspamd_mempool_alloc0 (pool, sizeof (*encshcmd)); + encshcmd = rspamd_mempool_alloc0 (task->task_pool, sizeof (*encshcmd)); shcmd = &encshcmd->cmd; memcpy (&shcmd->sgl, cached->sh, sizeof (struct rspamd_shingle)); memcpy (shcmd->basic.digest, cached->digest, @@ -1628,14 +1653,14 @@ fuzzy_cmd_from_image_part (struct fuzzy_rule *rule, shcmd->basic.shingles_count = RSPAMD_SHINGLE_SIZE; } else { - encshcmd = rspamd_mempool_alloc0 (pool, sizeof (*encshcmd)); + encshcmd = rspamd_mempool_alloc0 (task->task_pool, sizeof (*encshcmd)); shcmd = &encshcmd->cmd; /* * Generate shingles */ sh = rspamd_shingles_from_image (img->dct, - rule->shingles_key->str, pool, + rule->shingles_key->str, task->task_pool, rspamd_shingles_default_filter, NULL, rule->alg); if (sh != NULL) { @@ -1652,7 +1677,7 @@ fuzzy_cmd_from_image_part (struct fuzzy_rule *rule, (const guchar *)img->dct, RSPAMD_DCT_LEN / NBBY, rule->hash_key->str, rule->hash_key->len); - msg_debug_pool ("loading shingles of type %s with key %*xs", + msg_debug_task ("loading shingles of type %s with key %*xs", rule->algorithm_str, 16, rule->shingles_key->str); @@ -1663,10 +1688,10 @@ fuzzy_cmd_from_image_part (struct fuzzy_rule *rule, * Since it is copied when obtained from the cache, it is safe to use * it this way. */ - cached = rspamd_mempool_alloc (pool, sizeof (*cached)); + cached = rspamd_mempool_alloc (task->task_pool, sizeof (*cached)); cached->sh = sh; memcpy (cached->digest, shcmd->basic.digest, sizeof (cached->digest)); - fuzzy_cmd_set_cached (rule, pool, mp, cached); + fuzzy_cmd_set_cached (rule, task, mp, cached); } shcmd->basic.tag = ottery_rand_uint32 (); @@ -1678,7 +1703,7 @@ fuzzy_cmd_from_image_part (struct fuzzy_rule *rule, shcmd->basic.value = weight; } - io = rspamd_mempool_alloc (pool, sizeof (*io)); + io = rspamd_mempool_alloc (task->task_pool, sizeof (*io)); io->part = mp; io->tag = shcmd->basic.tag; io->flags = FUZZY_CMD_FLAG_IMAGE; @@ -1697,6 +1722,7 @@ fuzzy_cmd_from_image_part (struct fuzzy_rule *rule, return io; } +#endif static struct fuzzy_cmd_io * fuzzy_cmd_from_data_part (struct fuzzy_rule *rule, |