summaryrefslogtreecommitdiffstats
path: root/src/plugins/lua/spamassassin.lua
diff options
context:
space:
mode:
authorVsevolod Stakhov <vsevolod@highsecure.ru>2015-11-23 13:48:11 +0000
committerVsevolod Stakhov <vsevolod@highsecure.ru>2015-11-23 13:48:11 +0000
commit3e3b6e8185b8e19794e7dbd2515f60e2bbc81983 (patch)
tree3a78a1cca5577ddbff5fb3cfc6174feeb5257369 /src/plugins/lua/spamassassin.lua
parent88a9da36c51e0e53afffab9eecf94c65066d99e5 (diff)
downloadrspamd-3e3b6e8185b8e19794e7dbd2515f60e2bbc81983.tar.gz
rspamd-3e3b6e8185b8e19794e7dbd2515f60e2bbc81983.zip
Rework SA plugin for some problematic cases
Diffstat (limited to 'src/plugins/lua/spamassassin.lua')
-rw-r--r--src/plugins/lua/spamassassin.lua109
1 files changed, 88 insertions, 21 deletions
diff --git a/src/plugins/lua/spamassassin.lua b/src/plugins/lua/spamassassin.lua
index fb1998d98..7f5376019 100644
--- a/src/plugins/lua/spamassassin.lua
+++ b/src/plugins/lua/spamassassin.lua
@@ -42,7 +42,9 @@ local known_plugins = {
'Mail::SpamAssassin::Plugin::FreeMail',
'Mail::SpamAssassin::Plugin::HeaderEval',
'Mail::SpamAssassin::Plugin::ReplaceTags',
- 'Mail::SpamAssassin::Plugin::RelayEval'
+ 'Mail::SpamAssassin::Plugin::RelayEval',
+ 'Mail::SpamAssassin::Plugin::MIMEEval',
+ 'Mail::SpamAssassin::Plugin::BodyEval'
}
-- Internal variables
@@ -61,8 +63,9 @@ local replace = {
rules = {},
}
local internal_regexp = {
- date_shift = rspamd_regexp.create_cached("^\\(\\s*'((?:-?\\d+)|(?:undef))'\\s*,\\s*'((?:-?\\d+)|(?:undef))'\\s*\\)$")
+ date_shift = rspamd_regexp.create("^\\(\\s*'((?:-?\\d+)|(?:undef))'\\s*,\\s*'((?:-?\\d+)|(?:undef))'\\s*\\)$")
}
+local func_cache = {}
local section = rspamd_config:get_all_opt("spamassassin")
-- Minimum score to treat symbols as meta
@@ -85,6 +88,10 @@ local function split(str, delim)
return result
end
+local function trim(s)
+ return s:match "^%s*(.-)%s*$"
+end
+
local function handle_header_def(hline, cur_rule)
--Now check for modifiers inside header's name
local hdrs = split(hline, '[^|]+')
@@ -304,7 +311,6 @@ local function maybe_parse_sa_function(line)
local arg
local elts = split(line, '[^:]+')
arg = elts[2]
- local func_cache = {}
rspamd_logger.debugx(rspamd_config, 'trying to parse SA function %1 with args %2',
elts[1], elts[2])
@@ -388,6 +394,9 @@ local function process_sa_conf(f)
cur_rule['symbol'] = nsym
end
-- We have previous rule valid
+ if not cur_rule['symbol'] then
+ rspamd_logger.errx(rspamd_config, 'bad rule definition: %1', cur_rule)
+ end
rules[cur_rule['symbol']] = cur_rule
cur_rule = {}
valid_rule = false
@@ -411,16 +420,24 @@ local function process_sa_conf(f)
end
local skip_to_endif = false
+ local if_nested = 0
for l in f:lines() do
(function ()
- if string.len(l) == 0 or
- _.nth(1, _.drop_while(function(c) return c == ' ' end, _.iter(l))) == '#' then
+ l = trim(l)
+
+ if string.len(l) == 0 or string.sub(l, 1, 1) == '#' then
return
end
if skip_to_endif then
if string.match(l, '^endif') then
- skip_to_endif = false
+ if_nested = if_nested - 1
+
+ if if_nested == 0 then
+ skip_to_endif = false
+ end
+ elseif string.match(l, '^if') then
+ if_nested = if_nested + 1
end
return
else
@@ -432,7 +449,21 @@ local function process_sa_conf(f)
return false
end, known_plugins) then
skip_to_endif = true
+ if_nested = 1
end
+ elseif string.match(l, '^if !plugin%(') then
+ local pname = string.match(l, '^if !plugin%(([A-Za-z:]+)%)')
+ if _.any(function(pl)
+ if pl == pname then return true end
+ return false
+ end, known_plugins) then
+ skip_to_endif = true
+ if_nested = 1
+ end
+ elseif string.match(l, '^if') then
+ -- Unknown if
+ skip_to_endif = true
+ if_nested = 1
end
end
@@ -497,33 +528,69 @@ local function process_sa_conf(f)
rspamd_logger.infox(rspamd_config, 'unknown function %1', args)
end
end
- elseif words[1] == "body" and slash then
+ elseif words[1] == "body" then
-- body SYMBOL /regexp/
if valid_rule then
insert_cur_rule()
end
- cur_rule['type'] = 'part'
+
cur_rule['symbol'] = words[2]
- cur_rule['re_expr'] = words_to_re(words, 2)
- cur_rule['re'] = rspamd_regexp.create_cached(cur_rule['re_expr'])
- cur_rule['raw'] = true
- if cur_rule['re'] and cur_rule['symbol'] then
- valid_rule = true
- cur_rule['re']:set_limit(match_limit)
+ if words[3] and (string.sub(words[3], 1, 1) == '/'
+ or string.sub(words[3], 1, 1) == 'm') then
+ cur_rule['type'] = 'part'
+ cur_rule['re_expr'] = words_to_re(words, 2)
+ cur_rule['re'] = rspamd_regexp.create_cached(cur_rule['re_expr'])
+ cur_rule['raw'] = true
+ if cur_rule['re'] then
+ valid_rule = true
+ cur_rule['re']:set_limit(match_limit)
+ end
+ else
+ -- might be function
+ local args = words_to_re(words, 2)
+ local func = maybe_parse_sa_function(args)
+
+ if func then
+ cur_rule['type'] = 'function'
+ cur_rule['symbol'] = words[2]
+ cur_rule['function'] = func
+ valid_rule = true
+ else
+ rspamd_logger.infox(rspamd_config, 'unknown function %1', args)
+ end
end
- elseif words[1] == "rawbody" or words[1] == "full" and slash then
+ elseif words[1] == "rawbody" or words[1] == "full" then
-- body SYMBOL /regexp/
if valid_rule then
insert_cur_rule()
end
- cur_rule['type'] = 'message'
+
cur_rule['symbol'] = words[2]
- cur_rule['re_expr'] = words_to_re(words, 2)
- cur_rule['re'] = rspamd_regexp.create_cached(cur_rule['re_expr'])
- if cur_rule['re'] and cur_rule['symbol'] then
- valid_rule = true
- cur_rule['re']:set_limit(match_limit)
+
+ if words[3] and (string.sub(words[3], 1, 1) == '/'
+ or string.sub(words[3], 1, 1) == 'm') then
+ cur_rule['type'] = 'message'
+ cur_rule['re_expr'] = words_to_re(words, 2)
+ cur_rule['re'] = rspamd_regexp.create_cached(cur_rule['re_expr'])
+ cur_rule['raw'] = true
+ if cur_rule['re'] then
+ valid_rule = true
+ cur_rule['re']:set_limit(match_limit)
+ end
+ else
+ -- might be function
+ local args = words_to_re(words, 2)
+ local func = maybe_parse_sa_function(args)
+
+ if func then
+ cur_rule['type'] = 'function'
+ cur_rule['symbol'] = words[2]
+ cur_rule['function'] = func
+ valid_rule = true
+ else
+ rspamd_logger.infox(rspamd_config, 'unknown function %1', args)
+ end
end
elseif words[1] == "uri" then
-- uri SYMBOL /regexp/