if (w->stemmed.len <= 3) {
short_len++;
}
- }
- if (w->flags & RSPAMD_STAT_TOKEN_FLAG_TEXT) {
- part->nwords ++;
+ if (w->flags & RSPAMD_STAT_TOKEN_FLAG_TEXT) {
+ part->nwords ++;
+ }
}
if (w->flags & (RSPAMD_STAT_TOKEN_FLAG_BROKEN_UNICODE|
GByteArray *utf_content; /* utf8 encoded processed content */
GByteArray *utf_raw_content; /* utf raw content */
GByteArray *utf_stripped_content; /* utf content with no newlines */
- GArray *normalized_hashes;
- GArray *utf_words;
+ GArray *normalized_hashes; /* Array of guint64 */
+ GArray *utf_words; /* Array of rspamd_stat_token_t */
UText utf_stripped_text; /* Used by libicu to represent the utf8 content */
GPtrArray *newlines; /**< positions of newlines in text, relative to content*/