1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
|
/**
* @file cfg_file.h
* Config file parser and config routines API
*/
#ifndef CFG_FILE_H
#define CFG_FILE_H
#include "config.h"
#include "mem_pool.h"
#include "upstream.h"
#include "symbols_cache.h"
#include "cfg_rcl.h"
#include "ucl.h"
#include "regexp.h"
#define DEFAULT_BIND_PORT 11333
#define DEFAULT_CONTROL_PORT 11334
/* Default metric name */
#define DEFAULT_METRIC "default"
struct expression;
struct tokenizer;
struct rspamd_stat_classifier;
struct module_s;
struct worker_s;
enum { VAL_UNDEF=0, VAL_TRUE, VAL_FALSE };
/**
* Type of time configuration parameter
*/
enum time_type {
TIME_SECONDS = 0,
TIME_MILLISECONDS,
TIME_MINUTES,
TIME_HOURS
};
/**
* Types of rspamd bind lines
*/
enum rspamd_cred_type {
CRED_NORMAL,
CRED_CONTROL,
CRED_LMTP,
CRED_DELIVERY
};
/**
* Logging type
*/
enum rspamd_log_type {
RSPAMD_LOG_CONSOLE,
RSPAMD_LOG_SYSLOG,
RSPAMD_LOG_FILE
};
/**
* script module list item
*/
struct script_module {
gchar *name; /**< name of module */
gchar *path; /**< path to module */
};
/**
* Type of lua variable
*/
enum lua_var_type {
LUA_VAR_NUM,
LUA_VAR_BOOLEAN,
LUA_VAR_STRING,
LUA_VAR_FUNCTION,
LUA_VAR_UNKNOWN
};
/**
* Symbols group
*/
struct rspamd_symbol_def;
struct rspamd_symbols_group {
gchar *name;
GHashTable *symbols;
gdouble max_score;
gboolean disabled;
gboolean one_shot;
};
/**
* Symbol definition
*/
struct rspamd_symbol_def {
gchar *name;
gchar *description;
gdouble *weight_ptr;
gdouble score;
struct rspamd_symbols_group *gr;
GList *groups;
gboolean one_shot;
};
typedef double (*statfile_normalize_func)(struct rspamd_config *cfg,
long double score, void *params);
/**
* Statfile config definition
*/
struct rspamd_statfile_config {
gchar *symbol; /**< symbol of statfile */
gchar *label; /**< label of this statfile */
ucl_object_t *opts; /**< other options */
gboolean is_spam; /**< spam flag */
struct rspamd_classifier_config *clcf; /**< parent pointer of classifier configuration */
gpointer data; /**< opaque data */
};
struct rspamd_tokenizer_config {
const ucl_object_t *opts; /**< other options */
const gchar *name; /**< name of tokenizer */
};
/**
* Classifier config definition
*/
struct rspamd_classifier_config {
GList *statfiles; /**< statfiles list */
GHashTable *labels; /**< statfiles with labels */
gchar *metric; /**< metric of this classifier */
gchar *classifier; /**< classifier interface */
struct rspamd_tokenizer_config *tokenizer; /**< tokenizer used for classifier */
const gchar *backend; /**< name of statfile's backend */
ucl_object_t *opts; /**< other options */
GList *pre_callbacks; /**< list of callbacks that are called before classification */
GList *post_callbacks; /**< list of callbacks that are called after classification */
gchar *name; /**< unique name of classifier */
guint32 min_tokens; /**< minimal number of tokens to process classifier */
guint32 max_tokens; /**< maximum number of tokens */
};
struct rspamd_worker_bind_conf {
GPtrArray *addrs;
guint cnt;
gchar *name;
gboolean is_systemd;
struct rspamd_worker_bind_conf *next;
};
/**
* Config params for rspamd worker
*/
struct rspamd_worker_conf {
struct worker_s *worker; /**< pointer to worker type */
GQuark type; /**< type of worker */
struct rspamd_worker_bind_conf *bind_conf; /**< bind configuration */
guint16 count; /**< number of workers */
GList *listen_socks; /**< listening sockets desctiptors */
guint32 rlimit_nofile; /**< max files limit */
guint32 rlimit_maxcore; /**< maximum core file size */
GHashTable *params; /**< params for worker */
GQueue *active_workers; /**< linked list of spawned workers */
gboolean has_socket; /**< whether we should make listening socket in main process */
gpointer *ctx; /**< worker's context */
ucl_object_t *options; /**< other worker's options */
};
enum rspamd_log_format_type {
RSPAMD_LOG_STRING = 0,
RSPAMD_LOG_MID,
RSPAMD_LOG_QID,
RSPAMD_LOG_USER,
RSPAMD_LOG_ISSPAM,
RSPAMD_LOG_ACTION,
RSPAMD_LOG_SCORES,
RSPAMD_LOG_SYMBOLS,
RSPAMD_LOG_IP,
RSPAMD_LOG_LEN,
RSPAMD_LOG_DNS_REQ,
RSPAMD_LOG_SMTP_FROM,
RSPAMD_LOG_MIME_FROM,
RSPAMD_LOG_TIME_REAL,
RSPAMD_LOG_TIME_VIRTUAL,
RSPAMD_LOG_LUA
};
enum rspamd_log_format_flags {
RSPAMD_LOG_FLAG_DEFAULT = 0,
RSPAMD_LOG_FLAG_OPTIONAL = (1 << 0),
RSPAMD_LOG_FLAG_MIME_ALTERNATIVE = (1 << 1),
RSPAMD_LOG_FLAG_CONDITION = (1 << 2)
};
struct rspamd_log_format {
enum rspamd_log_format_type type;
guint flags;
gpointer data;
struct rspamd_log_format *prev, *next;
};
/**
* Structure that stores all config data
*/
struct rspamd_config {
gchar *rspamd_user; /**< user to run as */
gchar *rspamd_group; /**< group to run as */
rspamd_mempool_t *cfg_pool; /**< memory pool for config */
gchar *cfg_name; /**< name of config file */
gchar *pid_file; /**< name of pid file */
gchar *temp_dir; /**< dir for temp files */
gchar *control_socket_path; /**< path to the control socket */
#ifdef WITH_GPERF_TOOLS
gchar *profile_path;
#endif
gboolean no_fork; /**< if 1 do not call daemon() */
gboolean config_test; /**< if TRUE do only config file test */
gboolean raw_mode; /**< work in raw mode instead of utf one */
gboolean one_shot_mode; /**< rules add only one symbol */
gboolean check_text_attachements; /**< check text attachements as text */
gboolean convert_config; /**< convert config to XML format */
gboolean strict_protocol_headers; /**< strictly check protocol headers */
gboolean check_all_filters; /**< check all filters */
gsize max_diff; /**< maximum diff size for text parts */
enum rspamd_log_type log_type; /**< log type */
gint log_facility; /**< log facility in case of syslog */
gint log_level; /**< log level trigger */
gchar *log_file; /**< path to logfile in case of file logging */
gboolean log_buffered; /**< whether logging is buffered */
guint32 log_buf_size; /**< length of log buffer */
gchar *debug_ip_map; /**< turn on debugging for specified ip addresses */
gboolean log_urls; /**< whether we should log URLs */
GList *debug_symbols; /**< symbols to debug */
GHashTable *debug_modules; /**< logging modules to debug */
gboolean log_color; /**< output colors for console output */
gboolean log_extended; /**< log extended information */
gboolean log_systemd; /**< special case for systemd logger */
gboolean mlock_statfile_pool; /**< use mlock (2) for locking statfiles */
gboolean delivery_enable; /**< is delivery agent is enabled */
gchar *deliver_host; /**< host for mail deliviring */
struct in_addr deliver_addr; /**< its address */
guint16 deliver_port; /**< port for deliviring */
guint16 deliver_family; /**< socket family for delivirnig */
gchar *deliver_agent_path; /**< deliver to pipe instead of socket */
gboolean deliver_lmtp; /**< use LMTP instead of SMTP */
GList *script_modules; /**< linked list of script modules to load */
GHashTable *explicit_modules; /**< modules that should be always loaded */
GList *filters; /**< linked list of all filters */
GList *workers; /**< linked list of all workers params */
struct rspamd_worker_cfg_parser *wrk_parsers; /**< hash for worker config parsers, indexed by worker quarks */
ucl_object_t *rcl_obj; /**< rcl object */
GHashTable * metrics; /**< hash of metrics indexed by metric name */
GList * metrics_list; /**< linked list of metrics */
GHashTable * metrics_symbols; /**< hash table of metrics indexed by symbol */
GHashTable * c_modules; /**< hash of c modules indexed by module name */
GHashTable * composite_symbols; /**< hash of composite symbols indexed by its name */
GList *classifiers; /**< list of all classifiers defined */
GList *statfiles; /**< list of all statfiles in config file order */
GHashTable *classifiers_symbols; /**< hashtable indexed by symbol name of classifiers */
GHashTable * cfg_params; /**< all cfg params indexed by its name in this structure */
GList *pre_filters; /**< list of pre-processing lua filters */
GList *post_filters; /**< list of post-processing lua filters */
gchar *dynamic_conf; /**< path to dynamic configuration */
ucl_object_t *current_dynamic_conf; /**< currently loaded dynamic configuration */
GHashTable * domain_settings; /**< settings per-domains */
GHashTable * user_settings; /**< settings per-user */
gchar * domain_settings_str; /**< string representation of settings */
gchar * user_settings_str;
gint clock_res; /**< resolution of clock used */
GList *maps; /**< maps active */
rspamd_mempool_t *map_pool; /**< static maps pool */
gdouble map_timeout; /**< maps watch timeout */
struct symbols_cache *cache; /**< symbols cache object */
gchar *cache_filename; /**< filename of cache file */
struct metric *default_metric; /**< default metric */
gchar * checksum; /**< real checksum of config file */
gchar * dump_checksum; /**< dump checksum of config file */
gpointer lua_state; /**< pointer to lua state */
gchar * rrd_file; /**< rrd file to store statistics */
gchar * history_file; /**< file to save rolling history */
gchar * tld_file; /**< file to load effective tld list from */
gdouble dns_timeout; /**< timeout in milliseconds for waiting for dns reply */
guint32 dns_retransmits; /**< maximum retransmits count */
guint32 dns_throttling_errors; /**< maximum errors for starting resolver throttling */
guint32 dns_throttling_time; /**< time in seconds for DNS throttling */
guint32 dns_io_per_server; /**< number of sockets per DNS server */
GList *nameservers; /**< list of nameservers or NULL to parse resolv.conf */
guint32 dns_max_requests; /**< limit of DNS requests per task */
guint upstream_max_errors; /**< upstream max errors before shutting off */
gdouble upstream_error_time; /**< rate of upstream errors */
gdouble upstream_revive_time; /**< revive timeout for upstreams */
guint32 min_word_len; /**< minimum length of the word to be considered */
guint history_rows; /**< number of history rows stored */
GList *classify_headers; /**< list of headers using for statistics */
struct module_s **compiled_modules; /**< list of compiled C modules */
struct worker_s **compiled_workers; /**< list of compiled C modules */
struct rspamd_log_format *log_format; /**< parsed log format */
gchar *log_format_str; /**< raw log format string */
};
/**
* Parse bind credits
* @param cf config file to use
* @param str line that presents bind line
* @param type type of credits
* @return 1 if line was successfully parsed and 0 in case of error
*/
gboolean rspamd_parse_bind_line (struct rspamd_config *cfg,
struct rspamd_worker_conf *cf, const gchar *str);
/**
* Init default values
* @param cfg config file
*/
void rspamd_config_defaults (struct rspamd_config *cfg);
/**
* Free memory used by config structure
* @param cfg config file
*/
void rspamd_config_free (struct rspamd_config *cfg);
/**
* Gets module option with specified name
* @param cfg config file
* @param module_name name of module
* @param opt_name name of option to get
* @return module value or NULL if option does not defined
*/
const ucl_object_t * rspamd_config_get_module_opt (struct rspamd_config *cfg,
const gchar *module_name,
const gchar *opt_name);
/**
* Parse flag
* @param str string representation of flag (eg. 'on')
* @return numeric value of flag (0 or 1)
*/
gchar rspamd_config_parse_flag (const gchar *str, guint len);
/**
* Do post load actions for config
* @param cfg config file
*/
void rspamd_config_post_load (struct rspamd_config *cfg);
/**
* Calculate checksum for config file
* @param cfg config file
*/
gboolean rspamd_config_calculate_checksum (struct rspamd_config *cfg);
/**
* Replace all \" with a single " in given string
* @param line input string
*/
void rspamd_config_unescape_quotes (gchar *line);
/*
* Convert comma separated string to a list of strings
*/
GList * rspamd_config_parse_comma_list (rspamd_mempool_t *pool,
const gchar *line);
/*
* Return a new classifier_config structure, setting default and non-conflicting attributes
*/
struct rspamd_classifier_config * rspamd_config_new_classifier (
struct rspamd_config *cfg,
struct rspamd_classifier_config *c);
/*
* Return a new worker_conf structure, setting default and non-conflicting attributes
*/
struct rspamd_worker_conf * rspamd_config_new_worker (struct rspamd_config *cfg,
struct rspamd_worker_conf *c);
/*
* Return a new metric structure, setting default and non-conflicting attributes
*/
struct metric * rspamd_config_new_metric (struct rspamd_config *cfg,
struct metric *c, const gchar *name);
/*
* Return new symbols group definition
*/
struct rspamd_symbols_group * rspamd_config_new_group (
struct rspamd_config *cfg, struct metric *metric,
const gchar *name);
/*
* Return a new statfile structure, setting default and non-conflicting attributes
*/
struct rspamd_statfile_config * rspamd_config_new_statfile (
struct rspamd_config *cfg,
struct rspamd_statfile_config *c);
/*
* Read XML configuration file
*/
gboolean rspamd_config_read (struct rspamd_config *cfg,
const gchar *filename, const gchar *convert_to,
rspamd_rcl_section_fin_t logger_fin, gpointer logger_ud,
GHashTable *vars);
/*
* Register symbols of classifiers inside metrics
*/
void rspamd_config_insert_classify_symbols (struct rspamd_config *cfg);
/*
* Check statfiles inside a classifier
*/
gboolean rspamd_config_check_statfiles (struct rspamd_classifier_config *cf);
/*
* Find classifier config by name
*/
struct rspamd_classifier_config * rspamd_config_find_classifier (
struct rspamd_config *cfg,
const gchar *name);
void rspamd_ucl_add_conf_macros (struct ucl_parser *parser,
struct rspamd_config *cfg);
void rspamd_ucl_add_conf_variables (struct ucl_parser *parser, GHashTable *vars);
/**
* Initialize rspamd filtering system (lua and C filters)
* @param cfg
* @param reconfig
* @return
*/
gboolean rspamd_init_filters (struct rspamd_config *cfg, bool reconfig);
/**
* Init configuration file structure
* @param cfg
* @param init_lua
*/
void rspamd_init_cfg (struct rspamd_config *cfg, gboolean init_lua);
/**
* Add new symbol to the metric
* @param metric metric's name (or NULL for the default metric)
* @param symbol symbol's name
* @param score symbol's score
* @param description optional description
* @param group optional group name
* @param one_shot TRUE if symbol can add its score once
* @param rewrite_existing TRUE if we need to rewrite the existing symbol
* @return TRUE if symbol has been inserted or FALSE if `rewrite_existing` is not enabled and symbol already exists
*/
gboolean rspamd_config_add_metric_symbol (struct rspamd_config *cfg,
const gchar *metric,
const gchar *symbol, gdouble score, const gchar *description,
const gchar *group, gboolean one_shot, gboolean rewrite_existing);
/**
* Checks if a specified C or lua module is enabled or disabled in the config.
* The logic of check is the following:
*
* - For C modules, we check `filters` line and enable module only if it is found there
* - For LUA modules we check the corresponding configuration section:
* - if section exists, then we check `enabled` key and check its value
* - if section is absent, we consider module as disabled
* - For both C and LUA modules we check if the group with the module name is disabled in the default metric
* @param cfg config file
* @param module_name module name
* @return TRUE if a module is enabled
*/
gboolean rspamd_config_is_module_enabled (struct rspamd_config *cfg,
const gchar *module_name);
#define msg_err_config(...) rspamd_default_log_function (G_LOG_LEVEL_CRITICAL, \
cfg->cfg_pool->tag.tagname, cfg->checksum, \
G_STRFUNC, \
__VA_ARGS__)
#define msg_warn_config(...) rspamd_default_log_function (G_LOG_LEVEL_WARNING, \
cfg->cfg_pool->tag.tagname, cfg->checksum, \
G_STRFUNC, \
__VA_ARGS__)
#define msg_info_config(...) rspamd_default_log_function (G_LOG_LEVEL_INFO, \
cfg->cfg_pool->tag.tagname, cfg->checksum, \
G_STRFUNC, \
__VA_ARGS__)
#define msg_debug_config(...) rspamd_default_log_function (G_LOG_LEVEL_DEBUG, \
cfg->cfg_pool->tag.tagname, cfg->checksum, \
G_STRFUNC, \
__VA_ARGS__)
#endif /* ifdef CFG_FILE_H */
/*
* vi:ts=4
*/
|