aboutsummaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
-rw-r--r--src/libstat/classifiers/bayes.c33
-rw-r--r--src/libstat/tokenizers/osb.c5
2 files changed, 27 insertions, 11 deletions
diff --git a/src/libstat/classifiers/bayes.c b/src/libstat/classifiers/bayes.c
index 730581ced..aa6899d06 100644
--- a/src/libstat/classifiers/bayes.c
+++ b/src/libstat/classifiers/bayes.c
@@ -156,15 +156,30 @@ bayes_classify_token (struct rspamd_classifier *ctx,
cl->ham_prob += log2 (bayes_ham_prob);
cl->processed_tokens ++;
- msg_debug_bayes ("token: weight: %f, total_count: %L, "
- "spam_count: %L, ham_count: %L,"
- "spam_prob: %.3f, ham_prob: %.3f, "
- "bayes_spam_prob: %.3f, bayes_ham_prob: %.3f, "
- "current spam prob: %.3f, current ham prob: %.3f",
- fw, total_count, spam_count, ham_count,
- spam_prob, ham_prob,
- bayes_spam_prob, bayes_ham_prob,
- cl->spam_prob, cl->ham_prob);
+ if (tok->t1 && tok->t2) {
+ msg_debug_bayes ("token <%*s:%*s>: weight: %f, total_count: %L, "
+ "spam_count: %L, ham_count: %L,"
+ "spam_prob: %.3f, ham_prob: %.3f, "
+ "bayes_spam_prob: %.3f, bayes_ham_prob: %.3f, "
+ "current spam prob: %.3f, current ham prob: %.3f",
+ (int) tok->t1->len, tok->t1->begin,
+ (int) tok->t2->len, tok->t2->begin,
+ fw, total_count, spam_count, ham_count,
+ spam_prob, ham_prob,
+ bayes_spam_prob, bayes_ham_prob,
+ cl->spam_prob, cl->ham_prob);
+ }
+ else {
+ msg_debug_bayes ("token <?:?>: weight: %f, total_count: %L, "
+ "spam_count: %L, ham_count: %L,"
+ "spam_prob: %.3f, ham_prob: %.3f, "
+ "bayes_spam_prob: %.3f, bayes_ham_prob: %.3f, "
+ "current spam prob: %.3f, current ham prob: %.3f",
+ fw, total_count, spam_count, ham_count,
+ spam_prob, ham_prob,
+ bayes_spam_prob, bayes_ham_prob,
+ cl->spam_prob, cl->ham_prob);
+ }
}
}
diff --git a/src/libstat/tokenizers/osb.c b/src/libstat/tokenizers/osb.c
index 7c8da26f3..8d1742cc1 100644
--- a/src/libstat/tokenizers/osb.c
+++ b/src/libstat/tokenizers/osb.c
@@ -346,8 +346,9 @@ rspamd_tokenizer_osb (struct rspamd_stat_ctx *ctx,
if (processed < window_size) {
/* Just fill a hashpipe */
- hashpipe[window_size - ++processed].h = cur;
- hashpipe[window_size - ++processed].t = token;
+ ++processed;
+ hashpipe[window_size - processed].h = cur;
+ hashpipe[window_size - processed].t = token;
}
else {
/* Shift hashpipe */