From: Vsevolod Stakhov Date: Tue, 6 Apr 2021 14:39:19 +0000 (+0100) Subject: [Minor] Disable headers hash for statistics X-Git-Tag: 3.0~521 X-Git-Url: http://git.ipfire.org/gitweb.cgi?a=commitdiff_plain;h=d07edfa195c7e166cee4b30e7dea6c17a12e169b;p=thirdparty%2Frspamd.git [Minor] Disable headers hash for statistics Discussed with: @moisseev --- diff --git a/lualib/lua_stat.lua b/lualib/lua_stat.lua index 2606a8d22d..920f20205c 100644 --- a/lualib/lua_stat.lua +++ b/lualib/lua_stat.lua @@ -678,6 +678,10 @@ local function get_mime_stat_tokens(task, res, i) end local function get_headers_stat_tokens(task, cf, res, i) + --[[ + -- As discussed with Alexander Moisseev, this feature can skew statistics + -- especially when learning is separated from scanning, so learning + -- has a different set of tokens where this token can have too high weight local hdrs_cksum = task:get_mempool():get_variable("headers_hash") if hdrs_cksum then @@ -686,6 +690,7 @@ local function get_headers_stat_tokens(task, cf, res, i) res[i]) i = i + 1 end + ]]-- for k,hdrs in pairs(cf.classify_headers_parsed) do for _,hname in ipairs(hdrs) do