/* rspamd.h */
  /*-
   * Copyright 2016-2017 Vsevolod Stakhov
   *
   * Licensed under the Apache License, Version 2.0 (the "License");
   * you may not use this file except in compliance with the License.
   * You may obtain a copy of the License at
   *
   *   http://www.apache.org/licenses/LICENSE-2.0
   *
   * Unless required by applicable law or agreed to in writing, software
   * distributed under the License is distributed on an "AS IS" BASIS,
   * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
   * See the License for the specific language governing permissions and
   * limitations under the License.
   */
  16. #ifndef RSPAMD_MAIN_H
  17. #define RSPAMD_MAIN_H
  18. #include "config.h"
  19. #include "libutil/fstring.h"
  20. #include "libutil/mem_pool.h"
  21. #include "libutil/util.h"
  22. #include "libserver/logger.h"
  23. #include "libserver/http/http_connection.h"
  24. #include "libutil/upstream.h"
  25. #include "libutil/radix.h"
  26. #include "libserver/cfg_file.h"
  27. #include "libserver/url.h"
  28. #include "libserver/protocol.h"
  29. #include "libserver/async_session.h"
  30. #include "libserver/roll_history.h"
  31. #include "libserver/task.h"
  32. #include <openssl/ssl.h>
  /* Default values */

  /* Configuration file path: RSPAMD_CONFDIR (defined outside this header)
   * with "/rspamd.conf" appended by string-literal concatenation */
  #define FIXED_CONFIG_FILE RSPAMD_CONFDIR "/rspamd.conf"

  /* Time in seconds to exit for old worker */
  #define SOFT_SHUTDOWN_TIME 10

  /* Spam subject; printf-style template with a single %s placeholder */
  #define SPAM_SUBJECT "*** SPAM *** %s"

  /*
   * Drop any earlier definitions of the line-ending macros before redefining
   * them. #undef of a name that is not defined is a no-op, so each one is
   * removed unconditionally rather than only when CRLF happens to be defined.
   */
  #undef CRLF
  #undef CR
  #undef LF

  #define CRLF "\r\n"
  #define CR '\r'
  #define LF '\n'
  /* Give the declarations below C linkage when included from C++;
   * the block is closed at the end of this header */
  #ifdef __cplusplus
  extern "C" {
  #endif

  /* Forward declaration; the full definition appears later in this header */
  struct rspamd_main;
  /**
   * Worker flags. Each enumerator occupies its own bit, so values can be
   * OR-ed together; struct rspamd_worker keeps them in its `flags` field.
   */
  enum rspamd_worker_flags {
      RSPAMD_WORKER_HAS_SOCKET = (1 << 0),
      RSPAMD_WORKER_UNIQUE = (1 << 1),
      RSPAMD_WORKER_THREADED = (1 << 2),
      RSPAMD_WORKER_KILLABLE = (1 << 3),
      RSPAMD_WORKER_ALWAYS_START = (1 << 4),
      RSPAMD_WORKER_SCANNER = (1 << 5),
      RSPAMD_WORKER_CONTROLLER = (1 << 6),
      RSPAMD_WORKER_NO_TERMINATE_DELAY = (1 << 7),
  };
  61. struct rspamd_worker_accept_event {
  62. ev_io accept_ev;
  63. ev_timer throttling_ev;
  64. struct ev_loop *event_loop;
  65. struct rspamd_worker_accept_event *prev, *next;
  66. };
  67. typedef void (*rspamd_worker_term_cb) (EV_P_ ev_child *, struct rspamd_main *,
  68. struct rspamd_worker *);
  69. struct rspamd_worker_heartbeat {
  70. ev_timer heartbeat_ev; /**< used by main for checking heartbeats and by workers to send heartbeats */
  71. ev_tstamp last_event; /**< last heartbeat received timestamp */
  72. gint64 nbeats; /**< positive for beats received, negative for beats missed */
  73. };
  /**
   * Worker state, stored in rspamd_worker::state.
   * Values are consecutive, starting from 0 for the running state.
   */
  enum rspamd_worker_state {
      rspamd_worker_state_running = 0,
      rspamd_worker_state_terminating,
      rspamd_worker_wait_connections,
      rspamd_worker_wait_final_scripts,
      rspamd_worker_wanna_die
  };
  81. /**
  82. * Worker process structure
  83. */
  84. struct rspamd_worker {
  85. pid_t pid; /**< pid of worker */
  86. pid_t ppid; /**< pid of parent */
  87. guint index; /**< index number */
  88. guint nconns; /**< current connections count */
  89. enum rspamd_worker_state state; /**< current worker state */
  90. gboolean cores_throttled; /**< set to true if cores throttling took place */
  91. gdouble start_time; /**< start time */
  92. struct rspamd_main *srv; /**< pointer to server structure */
  93. GQuark type; /**< process type */
  94. GHashTable *signal_events; /**< signal events */
  95. struct rspamd_worker_accept_event *accept_events; /**< socket events */
  96. struct rspamd_worker_conf *cf; /**< worker config data */
  97. gpointer ctx; /**< worker's specific data */
  98. gint flags; /**< worker's flags (enum rspamd_worker_flags) */
  99. gint control_pipe[2]; /**< control pipe. [0] is used by main process,
  100. [1] is used by a worker */
  101. gint srv_pipe[2]; /**< used by workers to request something from the
  102. main process. [0] - main, [1] - worker */
  103. ev_io srv_ev; /**< used by main for read workers' requests */
  104. struct rspamd_worker_heartbeat hb; /**< heartbeat data */
  105. gpointer control_data; /**< used by control protocol to handle commands */
  106. gpointer tmp_data; /**< used to avoid race condition to deal with control messages */
  107. ev_child cld_ev; /**< to allow reaping */
  108. rspamd_worker_term_cb term_handler; /**< custom term handler */
  109. };
  110. struct rspamd_abstract_worker_ctx {
  111. guint64 magic;
  112. /* Events base */
  113. struct ev_loop *event_loop;
  114. /* DNS resolver */
  115. struct rspamd_dns_resolver *resolver;
  116. /* Config */
  117. struct rspamd_config *cfg;
  118. char data[];
  119. };
  120. struct rspamd_worker_signal_handler;
  121. typedef gboolean (*rspamd_worker_signal_cb_t) (
  122. struct rspamd_worker_signal_handler *, void *ud);
  123. struct rspamd_worker_signal_handler_elt {
  124. rspamd_worker_signal_cb_t handler;
  125. void *handler_data;
  126. struct rspamd_worker_signal_handler_elt *next, *prev;
  127. };
  128. struct rspamd_worker_signal_handler {
  129. gint signo;
  130. gboolean enabled;
  131. ev_signal ev_sig;
  132. struct ev_loop *event_loop;
  133. struct rspamd_worker *worker;
  134. struct rspamd_worker_signal_handler_elt *cb;
  135. };
  136. /**
  137. * Common structure representing C module context
  138. */
  139. struct module_s;
  140. struct module_ctx {
  141. gint (*filter) (struct rspamd_task *task); /**< pointer to headers process function */
  142. struct module_s *mod; /**< module pointer */
  143. gboolean enabled; /**< true if module is enabled in configuration */
  144. };
  /*
   * Compile-time feature flags: each is the string "1" when the matching
   * WITH_* macro is defined and "0" otherwise.
   */
  #ifndef WITH_HYPERSCAN
  #define RSPAMD_FEATURE_HYPERSCAN "0"
  #else
  #define RSPAMD_FEATURE_HYPERSCAN "1"
  #endif

  #ifndef WITH_PCRE2
  #define RSPAMD_FEATURE_PCRE2 "0"
  #else
  #define RSPAMD_FEATURE_PCRE2 "1"
  #endif

  #ifndef WITH_FANN
  #define RSPAMD_FEATURE_FANN "0"
  #else
  #define RSPAMD_FEATURE_FANN "1"
  #endif

  #ifndef WITH_SNOWBALL
  #define RSPAMD_FEATURE_SNOWBALL "0"
  #else
  #define RSPAMD_FEATURE_SNOWBALL "1"
  #endif

  #define RSPAMD_CUR_MODULE_VERSION 0x1
  #define RSPAMD_CUR_WORKER_VERSION 0x2

  /* Four adjacent string literals, concatenated by the compiler into one
   * string in the order hyperscan, pcre2, fann, snowball (e.g. "0000") */
  #define RSPAMD_FEATURES \
          RSPAMD_FEATURE_HYPERSCAN RSPAMD_FEATURE_PCRE2 \
          RSPAMD_FEATURE_FANN RSPAMD_FEATURE_SNOWBALL

  /*
   * Initializer fragments: three comma-separated values in the order of the
   * version, rspamd_version and rspamd_features fields of module_t / worker_t.
   * The last line of each macro carries no line continuation, so the
   * definition ends there regardless of what follows it.
   */
  #define RSPAMD_MODULE_VER \
          RSPAMD_CUR_MODULE_VERSION, /* Module version */ \
          RSPAMD_VERSION_NUM, /* Rspamd version */ \
          RSPAMD_FEATURES /* Compilation features */

  #define RSPAMD_WORKER_VER \
          RSPAMD_CUR_WORKER_VERSION, /* Worker version */ \
          RSPAMD_VERSION_NUM, /* Rspamd version */ \
          RSPAMD_FEATURES /* Compilation features */
  178. /**
  179. * Module
  180. */
  181. typedef struct module_s {
  182. const gchar *name;
  183. int (*module_init_func) (struct rspamd_config *cfg, struct module_ctx **ctx);
  184. int (*module_config_func) (struct rspamd_config *cfg);
  185. int (*module_reconfig_func) (struct rspamd_config *cfg);
  186. int (*module_attach_controller_func) (struct module_ctx *ctx,
  187. GHashTable *custom_commands);
  188. guint module_version;
  189. guint64 rspamd_version;
  190. const gchar *rspamd_features;
  191. guint ctx_offset;
  192. } module_t;
  /**
   * Listening socket type. TCP and UDP occupy separate bits, so they can be
   * combined; NONE is zero.
   */
  enum rspamd_worker_socket_type {
      RSPAMD_WORKER_SOCKET_NONE = 0,
      RSPAMD_WORKER_SOCKET_TCP = (1 << 0),
      RSPAMD_WORKER_SOCKET_UDP = (1 << 1),
  };
  198. struct rspamd_worker_listen_socket {
  199. const rspamd_inet_addr_t *addr;
  200. gint fd;
  201. enum rspamd_worker_socket_type type;
  202. };
  203. typedef struct worker_s {
  204. const gchar *name;
  205. gpointer (*worker_init_func) (struct rspamd_config *cfg);
  206. void (*worker_start_func) (struct rspamd_worker *worker);
  207. int flags;
  208. int listen_type;
  209. guint worker_version;
  210. guint64 rspamd_version;
  211. const gchar *rspamd_features;
  212. } worker_t;
  213. /**
  214. * Check if loaded worker is compatible with rspamd
  215. * @param cfg
  216. * @param wrk
  217. * @return
  218. */
  219. gboolean rspamd_check_worker (struct rspamd_config *cfg, worker_t *wrk);
  220. /**
  221. * Check if loaded module is compatible with rspamd
  222. * @param cfg
  223. * @param wrk
  224. * @return
  225. */
  226. gboolean rspamd_check_module (struct rspamd_config *cfg, module_t *wrk);
  /* Forward declarations of types referred to by pointer only */
  struct pidfh;
  struct rspamd_config;
  struct tokenizer;
  struct rspamd_stat_classifier;
  struct rspamd_classifier_config;
  struct rspamd_mime_part;
  struct rspamd_dns_resolver;
  struct rspamd_task;
  struct rspamd_cryptobox_library_ctx;
  236. /**
  237. * Server statistics
  238. */
  239. struct rspamd_stat {
  240. guint messages_scanned; /**< total number of messages scanned */
  241. guint actions_stat[METRIC_ACTION_MAX]; /**< statistic for each action */
  242. guint connections_count; /**< total connections count */
  243. guint control_connections_count; /**< connections count to control interface */
  244. guint messages_learned; /**< messages learned */
  245. };
  246. /**
  247. * Struct that determine main server object (for logging purposes)
  248. */
  249. struct rspamd_main {
  250. struct rspamd_config *cfg; /**< pointer to config structure */
  251. pid_t pid; /**< main pid */
  252. /* Pid file structure */
  253. rspamd_pidfh_t *pfh; /**< struct pidfh for pidfile */
  254. GQuark type; /**< process type */
  255. struct rspamd_stat *stat; /**< pointer to statistics */
  256. rspamd_mempool_t *server_pool; /**< server's memory pool */
  257. rspamd_mempool_mutex_t *start_mtx; /**< server is starting up */
  258. GHashTable *workers; /**< workers pool indexed by pid */
  259. GHashTable *spairs; /**< socket pairs requested by workers */
  260. rspamd_logger_t *logger;
  261. uid_t workers_uid; /**< worker's uid running to */
  262. gid_t workers_gid; /**< worker's gid running to */
  263. gboolean is_privilleged; /**< true if run in privilleged mode */
  264. gboolean wanna_die; /**< no respawn of processes */
  265. gboolean cores_throttling; /**< turn off cores when limits are exceeded */
  266. struct roll_history *history; /**< rolling history */
  267. struct ev_loop *event_loop;
  268. ev_signal term_ev, int_ev, hup_ev, usr1_ev; /**< signals */
  269. struct rspamd_http_context *http_ctx;
  270. };
  /**
   * Kind of a processing exception (see struct rspamd_process_exception).
   * Values are consecutive, starting from 0.
   */
  enum rspamd_exception_type {
      RSPAMD_EXCEPTION_NEWLINE = 0,
      RSPAMD_EXCEPTION_URL,
      RSPAMD_EXCEPTION_GENERIC,
  };
  276. /**
  277. * Structure to point exception in text from processing
  278. */
  279. struct rspamd_process_exception {
  280. goffset pos;
  281. guint len;
  282. gpointer ptr;
  283. enum rspamd_exception_type type;
  284. };
  285. /**
  286. * Control session object
  287. */
  288. struct controller_command;
  289. struct controller_session;
  290. typedef gboolean (*controller_func_t) (gchar **args,
  291. struct controller_session *session);
  292. struct controller_session {
  293. struct rspamd_worker *worker; /**< pointer to worker structure (controller in fact) */
  294. gint sock; /**< socket descriptor */
  295. struct controller_command *cmd; /**< real command */
  296. struct rspamd_config *cfg; /**< pointer to config file */
  297. GList *parts; /**< extracted mime parts */
  298. struct rspamd_async_session *s; /**< async session object */
  299. struct rspamd_dns_resolver *resolver; /**< DNS resolver */
  300. struct ev_loop *ev_base; /**< Event base */
  301. };
  302. struct zstd_dictionary {
  303. void *dict;
  304. gsize size;
  305. guint id;
  306. };
  307. struct rspamd_radix_map_helper;
  308. struct rspamd_external_libs_ctx {
  309. struct rspamd_radix_map_helper **local_addrs;
  310. struct rspamd_cryptobox_library_ctx *crypto_ctx;
  311. struct ottery_config *ottery_cfg;
  312. SSL_CTX *ssl_ctx;
  313. SSL_CTX *ssl_ctx_noverify;
  314. struct zstd_dictionary *in_dict;
  315. struct zstd_dictionary *out_dict;
  316. void *out_zstream;
  317. void *in_zstream;
  318. ref_entry_t ref;
  319. };
  320. /**
  321. * Register custom controller function
  322. */
  323. void register_custom_controller_command (const gchar *name,
  324. controller_func_t handler,
  325. gboolean privilleged,
  326. gboolean require_message);
  327. #ifdef __cplusplus
  328. }
  329. #endif
  330. #endif