source.dussan.org Git - rspamd.git/commitdiff
[Minor] Langdet: Exclude exceptions (e.g. urls)
author: Vsevolod Stakhov <vsevolod@highsecure.ru>
Fri, 2 Aug 2019 17:28:11 +0000 (18:28 +0100)
committer: Vsevolod Stakhov <vsevolod@highsecure.ru>
Fri, 2 Aug 2019 17:28:11 +0000 (18:28 +0100)
src/libmime/lang_detection.c

index 276771778a694566fb610af7c1e0cf30b3fa16d0..74c6f7247df4f386bc937d148829622d5c9522a1 100644 (file)
@@ -939,6 +939,7 @@ rspamd_language_detector_random_select (GArray *ucs_tokens, guint nwords,
                        /* Filter bad tokens */
 
                        if (tok->unicode.len >= 2 &&
+                                       !(tok->flags & RSPAMD_STAT_TOKEN_FLAG_EXCEPTION) &&
                                        u_isalpha (tok->unicode.begin[0]) &&
                                        u_isalpha (tok->unicode.begin[tok->unicode.len - 1])) {
                                offsets_out[out_idx] = sel;