commit 6244d64: [Minor] Neural: Allow to have flat classification if needed

Vsevolod Stakhov vsevolod at highsecure.ru
Thu Apr 29 18:49:03 UTC 2021


Author: Vsevolod Stakhov
Date: 2021-04-29 19:44:40 +0100
URL: https://github.com/rspamd/rspamd/commit/6244d64b43baa240d63528849a7a47b3f32eccc3 (HEAD -> master)

[Minor] Neural: Allow to have flat classification if needed

---
 lualib/plugins/neural.lua  |  1 +
 src/plugins/lua/neural.lua | 12 ++++++++++--
 2 files changed, 11 insertions(+), 2 deletions(-)

diff --git a/lualib/plugins/neural.lua b/lualib/plugins/neural.lua
index f0d5cf582..557133591 100644
--- a/lualib/plugins/neural.lua
+++ b/lualib/plugins/neural.lua
@@ -57,6 +57,7 @@ local default_options = {
   -- Check ROC curve and AUC in the ML literature
   spam_score_threshold = nil, -- neural score threshold for spam (must be 0..1 or nil to disable)
   ham_score_threshold = nil, -- neural score threshold for ham (must be 0..1 or nil to disable)
+  flat_threshold_curve = false, -- if true, insert a flat weight of 1.0 instead of the raw ANN score once the threshold check passes
   symbol_spam = 'NEURAL_SPAM',
   symbol_ham = 'NEURAL_HAM',
   max_inputs = nil, -- when PCA is used
diff --git a/src/plugins/lua/neural.lua b/src/plugins/lua/neural.lua
index ca11d9e66..2ac8df59f 100644
--- a/src/plugins/lua/neural.lua
+++ b/src/plugins/lua/neural.lua
@@ -121,7 +121,11 @@ local function ann_scores_filter(task)
         local result = score
 
         if not rule.spam_score_threshold or result >= rule.spam_score_threshold then
-          task:insert_result(rule.symbol_spam, result, symscore)
+          if rule.flat_threshold_curve then
+            task:insert_result(rule.symbol_spam, 1.0, symscore)
+          else
+            task:insert_result(rule.symbol_spam, result, symscore)
+          end
         else
           lua_util.debugm(N, task, '%s:%s:%s ann score: %s < %s (spam_score_threshold)',
               rule.prefix, set.name, set.ann.version, symscore,
@@ -131,7 +135,11 @@ local function ann_scores_filter(task)
         local result = -(score)
 
         if not rule.ham_score_threshold or result >= rule.ham_score_threshold then
-          task:insert_result(rule.symbol_ham, result, symscore)
+          if rule.flat_threshold_curve then
+            task:insert_result(rule.symbol_ham, 1.0, symscore)
+          else
+            task:insert_result(rule.symbol_ham, result, symscore)
+          end
         else
           lua_util.debugm(N, task, '%s:%s:%s ann score: %s < %s (ham_score_threshold)',
               rule.prefix, set.name, set.ann.version, result,


More information about the Commits mailing list