Mailing List Archive

svn commit: r1881603 [2/2] - in /spamassassin/trunk/rulesrc/scores: 72_scores.cf scores-set0 scores-set1 scores-set2 scores-set3 stats-set0 stats-set1
Modified: spamassassin/trunk/rulesrc/scores/scores-set3
URL: http://svn.apache.org/viewvc/spamassassin/trunk/rulesrc/scores/scores-set3?rev=1881603&r1=1881602&r2=1881603&view=diff
==============================================================================
--- spamassassin/trunk/rulesrc/scores/scores-set3 (original)
+++ spamassassin/trunk/rulesrc/scores/scores-set3 Thu Sep 10 03:23:25 2020
@@ -4,179 +4,170 @@
score AC_BR_BONANZA 0.001
score AC_DIV_BONANZA 0.001 # force non-zero
score AC_FROM_MANY_DOTS 2.999
-score AC_HTML_NONSENSE_TAGS 1.999
+score AC_HTML_NONSENSE_TAGS 2.000
score AC_POST_EXTRAS 0.001
-score ADVANCE_FEE_2_NEW_MONEY 1.999
-score ADVANCE_FEE_3_NEW 3.256
+score ADVANCE_FEE_2_NEW_MONEY 1.551
+score ADVANCE_FEE_3_NEW 3.189
score ADVANCE_FEE_3_NEW_MONEY 2.699
-score ADVANCE_FEE_5_NEW 2.108
-score ADVANCE_FEE_5_NEW_FRM_MNY 0.001
-score ADVANCE_FEE_5_NEW_MONEY 0.001
-score AXB_XMAILER_MIMEOLE_OL_024C2 3.738
-score BITCOIN_EXTORT_01 4.999
+score ADVANCE_FEE_5_NEW 2.605
+score AXB_XMAILER_MIMEOLE_OL_024C2 3.500
+score BITCOIN_EXTORT_01 4.670
score BITCOIN_SPAM_02 2.499
-score BITCOIN_SPAM_05 2.500
-score BITCOIN_SPAM_08 0.650
-score BITCOIN_SPAM_09 0.774
-score BODY_SINGLE_URI 2.500
+score BITCOIN_SPAM_05 2.499
+score BITCOIN_SPAM_08 0.398
+score BITCOIN_SPAM_09 1.028
score BODY_URI_ONLY 0.999
-score BOGUS_MIME_VERSION 2.926
-score CK_HELO_DYNAMIC_SPLIT_IP 0.200
-score CK_HELO_GENERIC 0.249
+score BOGUS_MIME_VERSION 2.800
+score CK_HELO_DYNAMIC_SPLIT_IP 1.233
+score CK_HELO_GENERIC 0.250
score CTE_8BIT_MISMATCH 0.999
-score CTYPE_NULL 2.899
+score CTYPE_NULL 2.900
score DKIMWL_BL 2.999
-score DKIMWL_WL_HIGH -0.001 # force non-zero
-score DKIMWL_WL_MED -0.001 # force non-zero
+score DKIMWL_WL_HIGH -0.001
+score DKIMWL_WL_MED -0.001
score DOTGOV_IMAGE 2.999
score DSN_NO_MIMEVERSION 1.999
-score DX_TEXT_03 0.900
+score DX_TEXT_03 0.899
score END_FUTURE_EMAILS 2.499
-score FILL_THIS_FORM 0.242
-score FONT_INVIS_DIRECT 0.001 # force non-zero
-score FONT_INVIS_DOTGOV 0.001
+score FILL_THIS_FORM 0.071
+score FONT_INVIS_DIRECT 0.001
+score FONT_INVIS_DOTGOV 0.001 # force non-zero
score FONT_INVIS_LONG_LINE 0.001
score FONT_INVIS_MSGID 0.001
-score FONT_INVIS_POSTEXTRAS 1.473
+score FONT_INVIS_POSTEXTRAS 1.474
score FORGED_RELAY_MUA_TO_MX 3.899
-score FORGED_SPF_HELO 1.122
+score FORGED_SPF_HELO 1.121
score FORM_FRAUD_5 2.899
score FREEMAIL_FORGED_FROMDOMAIN 0.250
score FROM_2_EMAILS_SHORT 0.001
-score FROM_ADDR_WS 0.001
+score FROM_ADDR_WS 0.362
score FROM_FMBLA_NEWDOM 1.499
-score FROM_FMBLA_NEWDOM14 0.999
-score FROM_FMBLA_NEWDOM28 0.800
-score FROM_GOV_DKIM_AU -0.446
-score FROM_GOV_SPOOF 0.267
-score FROM_MISSPACED 1.347
-score FROM_MISSP_DYNIP 0.374
-score FROM_MISSP_EH_MATCH 1.764
-score FROM_MISSP_FREEMAIL 1.739
-score FROM_MISSP_MSFT 2.924
-score FROM_MISSP_REPLYTO 2.499
+score FROM_FMBLA_NEWDOM14 1.000
+score FROM_FMBLA_NEWDOM28 0.799
+score FROM_GOV_DKIM_AU -0.447
+score FROM_GOV_SPOOF 0.999
+score FROM_MISSPACED 0.001
+score FROM_MISSP_DYNIP 1.535
+score FROM_MISSP_EH_MATCH 0.001
+score FROM_MISSP_FREEMAIL 1.393
+score FROM_MISSP_MSFT 0.001 # force non-zero
+score FROM_MISSP_REPLYTO 2.389
score FROM_MISSP_SPF_FAIL 1.999
-score FROM_MISSP_USER 2.816
-score FROM_MISSP_XPRIO 0.146
-score FROM_NTLD_REPLY_FREEMAIL 1.999
+score FROM_MISSP_USER 0.001
+score FROM_MISSP_XPRIO 0.001
+score FROM_NTLD_REPLY_FREEMAIL 1.787
score FROM_SUSPICIOUS_NTLD 0.499
-score FROM_SUSPICIOUS_NTLD_FP 1.564
+score FROM_SUSPICIOUS_NTLD_FP 1.563
score FSL_BULK_SIG 0.001
-score FSL_CTYPE_WIN1251 2.751
-score FSL_HELO_FAKE 1.800
-score FSL_NEW_HELO_USER 1.647
-score GB_BITCOIN_NH 1.312
-score GB_FREEMAIL_DISPTO 0.001
+score FSL_CTYPE_WIN1251 0.001
+score FSL_NEW_HELO_USER 0.001
+score GB_BITCOIN_NH 2.279
+score GB_FREEMAIL_DISPTO 0.001 # force non-zero
score GB_GOOGLE_OBFUS 0.749
-score HDRS_LCASE 0.100
-score HDRS_LCASE_IMGONLY 0.100
+score HDRS_LCASE 0.099
+score HDRS_LCASE_IMGONLY 0.099
score HDR_ORDER_FTSDMCXX_DIRECT 1.999
-score HDR_ORDER_FTSDMCXX_NORDNS 2.530
-score HEADER_FROM_DIFFERENT_DOMAINS 0.250
+score HDR_ORDER_FTSDMCXX_NORDNS 3.499
+score HEADER_FROM_DIFFERENT_DOMAINS 0.249
score HELO_MISC_IP 0.174
score HELO_NO_DOMAIN 0.001
-score HK_NAME_FM_MR_MRS 0.517
-score HK_RANDOM_FROM 0.768
+score HK_RANDOM_FROM 0.999
score HK_RANDOM_REPLYTO 0.999
-score HK_SCAM 0.977
+score HK_SCAM 1.798
score HOSTED_IMG_FREEM 3.499
-score HOSTED_IMG_MULTI 0.605
+score HOSTED_IMG_MULTI 1.967
score HTML_SINGLET_MANY 2.499
score HTML_TEXT_INVISIBLE_FONT 2.999
-score HTML_TEXT_INVISIBLE_STYLE 1.629
-score IMG_ONLY_FM_DOM_INFO 2.499
-score KB_FORGED_MOZ4 3.833
-score KHOP_FAKE_EBAY 0.555
-score KHOP_HELO_FCRDNS 0.400
+score HTML_TEXT_INVISIBLE_STYLE 1.986
+score IMG_ONLY_FM_DOM_INFO 2.444
+score KB_FORGED_MOZ4 4.499
+score KHOP_FAKE_EBAY 0.540
+score KHOP_HELO_FCRDNS 0.399
score LIST_PRTL_SAME_USER 0.001
score LONG_HEX_URI 0.001
-score LOTS_OF_MONEY 0.009
-score MANY_SPAN_IN_TEXT 3.090
+score LOTS_OF_MONEY 0.010
+score MANY_SPAN_IN_TEXT 2.590
score MAY_BE_FORGED 2.295
-score MILLION_HUNDRED 1.701
+score MILLION_HUNDRED 2.186
score MIMEOLE_DIRECT_TO_MX 1.999
-score MIME_NO_TEXT 0.001
-score MIXED_ES 1.392
-score MONERO_EXTORT_01 2.379
+score MIME_NO_TEXT 0.001 # force non-zero
+score MIXED_ES 1.246
+score MONERO_EXTORT_01 2.406
score MONEY_FORM_SHORT 2.499
-score MONEY_FRAUD_3 2.499
-score MONEY_FRAUD_5 0.765
-score MONEY_FRAUD_8 0.849
-score MONEY_FROM_MISSP 1.999
-score MSM_PRIO_REPTO 2.172
-score NICE_REPLY_A -3.576
+score MONEY_FRAUD_3 2.364
+score MONEY_FRAUD_5 0.784
+score MONEY_FRAUD_8 1.023
+score MONEY_FROM_MISSP 0.428
+score MSM_PRIO_REPTO 0.777
+score NICE_REPLY_A -0.326
score NORDNS_LOW_CONTRAST 0.912
-score NO_FM_NAME_IP_HOSTN 1.666
-score NSL_RCVD_FROM_USER 2.889
-score NSL_RCVD_HELO_USER 1.418
-score OFFER_ONLY_AMERICA 1.783
-score PDS_BTC_ID 0.499
+score NO_FM_NAME_IP_HOSTN 1.753
+score NSL_RCVD_FROM_USER 0.001
+score NSL_RCVD_HELO_USER 1.842
+score OFFER_ONLY_AMERICA 1.886
+score PDS_BTC_ID 0.500
score PDS_BTC_MSGID 0.999
score PDS_EMPTYSUBJ_URISHRT 0.001
score PDS_FREEMAIL_REPLYTO_URISHRT 1.499
score PDS_FRNOM_TODOM_NAKED_TO 1.499
-score PDS_FROM_2_EMAILS 1.048
+score PDS_FROM_2_EMAILS 0.716
score PDS_FROM_NAME_TO_DOMAIN 0.999
score PDS_NAKED_TO_NUMERO 1.999
-score PDS_RDNS_DYNAMIC_FP 0.001
score PDS_SHORTFWD_URISHRT 1.499
-score PDS_TINYSUBJ_URISHRT 1.109
+score PDS_TINYSUBJ_URISHRT 0.226
score PDS_TONAME_EQ_TOLOCAL_FREEM_FORGE 1.999
-score PDS_TONAME_EQ_TOLOCAL_HDRS_LCASE 1.999
-score PDS_TONAME_EQ_TOLOCAL_SHORT 1.999
+score PDS_TONAME_EQ_TOLOCAL_HDRS_LCASE 0.398
score PDS_TONAME_EQ_TOLOCAL_VSHORT 0.999
score PDS_TO_EQ_FROM_NAME 0.001
-score PP_MIME_FAKE_ASCII_TEXT 0.112
-score RATWARE_NO_RDNS 2.880
+score PP_MIME_FAKE_ASCII_TEXT 0.195
+score RATWARE_NO_RDNS 2.534
score RCVD_IN_MSPIKE_H2 -0.001
-score SENDGRID_REDIR 3.281
+score SENDGRID_REDIR 3.499
score SERGIO_SUBJECT_VIAGRA01 3.799
-score SHORTENED_URL_SRC 2.839
-score SHORTENER_SHORT_IMG 2.499
+score SHORTENED_URL_SRC 2.835
+score SHORTENER_SHORT_IMG 1.045
score SHORT_SHORTNER 1.999
-score SHORT_URL 0.894
+score SHORT_URL 1.120
score SINGLETS_LOW_CONTRAST 0.001
-score SPOOFED_FREEMAIL 1.997
+score SPOOFED_FREEMAIL 1.999
score SPOOFED_FREEMAIL_NO_RDNS 0.001
-score SPOOFED_FREEM_REPTO 1.999
-score SPOOFED_FREEM_REPTO_CHN 2.399
-score SPOOFED_URL 1.177
-score SPOOFED_URL_HOST 1.112
-score STATIC_XPRIO_OLE 1.999
-score STOCK_LOW_CONTRAST 0.712
+score SPOOFED_FREEM_REPTO 1.998
+score SPOOFED_FREEM_REPTO_CHN 1.661
+score STATIC_XPRIO_OLE 2.000
+score STOCK_LOW_CONTRAST 0.001
score SUBJ_OBFU_PUNCT_FEW 0.001
-score SUBJ_OBFU_PUNCT_MANY 0.200
-score SUSP_UTF8_WORD_FROM 1.999
+score SUBJ_OBFU_PUNCT_MANY 1.315
+score SUSP_UTF8_WORD_COMBO 0.001
+score SUSP_UTF8_WORD_FROM 2.000
score SUSP_UTF8_WORD_SUBJ 1.999
-score THIS_AD 1.300
-score TONOM_EQ_TOLOC_SHRT_PSHRTNER 0.012
-score TONOM_EQ_TOLOC_SHRT_SHRTNER 1.500
-score TO_EQ_FM_DOM_HTML_IMG 0.058
-score TO_EQ_FM_DOM_HTML_ONLY 1.557
+score THIS_AD 1.299
+score TONOM_EQ_TOLOC_SHRT_PSHRTNER 0.364
+score TONOM_EQ_TOLOC_SHRT_SHRTNER 1.499
+score TO_EQ_FM_DOM_HTML_IMG 0.135
+score TO_EQ_FM_DOM_HTML_ONLY 1.547
score TO_EQ_FM_DOM_SPF_FAIL 0.001
-score TO_EQ_FM_HTML_ONLY 2.006
-score TO_EQ_FM_SPF_FAIL 0.001 # force non-zero
-score TO_IN_SUBJ 0.099
-score TO_NO_BRKTS_DYNIP 1.167
+score TO_EQ_FM_HTML_ONLY 1.940
+score TO_EQ_FM_SPF_FAIL 0.001
+score TO_IN_SUBJ 0.100
score TO_NO_BRKTS_FROM_MSSP 2.499
-score TO_NO_BRKTS_HTML_IMG 1.705
+score TO_NO_BRKTS_HTML_IMG 1.999
score TO_NO_BRKTS_HTML_ONLY 1.999
-score TO_NO_BRKTS_MSFT 2.499
-score TO_NO_BRKTS_NORDNS_HTML 1.999
-score TVD_RCVD_SPACE_BRACKET 3.904
+score TO_NO_BRKTS_MSFT 1.053
+score TO_NO_BRKTS_NORDNS_HTML 2.000
+score TVD_RCVD_SPACE_BRACKET 4.399
score TVD_SPACE_ENCODED 0.001
-score TVD_SPACE_RATIO_MINFP 1.878
-score UPGRADE_MAILBOX 0.468
+score TVD_SPACE_RATIO_MINFP 1.641
+score UPGRADE_MAILBOX 0.828
score URI_DOTEDU 0.001
-score URI_GOOGLE_PROXY 2.315
-score URI_IMG_WP_REDIR 1.498
-score URI_IN_URI_10 1.301
-score URI_IN_URI_5 1.280
+score URI_GOOGLE_PROXY 1.889
+score URI_IMG_WP_REDIR 2.931
+score URI_IN_URI_10 3.414
+score URI_IN_URI_5 1.450
score URI_PHP_REDIR 3.499
score URI_TRY_3LD 1.999
score URI_WP_DIRINDEX 3.499
-score URI_WP_HACKED_2 2.499
-score XPRIO_SHORT_SUBJ 2.363
+score URI_WP_HACKED_2 1.702
+score XPRIO_SHORT_SUBJ 2.499
score XPRIO_URL_SHORTNER 0.999
score AC_SPAMMY_URI_PATTERNS1 1.000
score AC_SPAMMY_URI_PATTERNS10 1.000

Modified: spamassassin/trunk/rulesrc/scores/stats-set0
URL: http://svn.apache.org/viewvc/spamassassin/trunk/rulesrc/scores/stats-set0?rev=1881603&r1=1881602&r2=1881603&view=diff
==============================================================================
--- spamassassin/trunk/rulesrc/scores/stats-set0 (original)
+++ spamassassin/trunk/rulesrc/scores/stats-set0 Thu Sep 10 03:23:25 2020
@@ -1,40 +1,40 @@
##### WITH NEW RULES AND SCORES #####

# SUMMARY for threshold 5.0:
-# Correctly non-spam: 180287 13.446% (99.515% of non-spam corpus)
-# Correctly spam: 1017053 75.852% (87.702% of spam corpus)
-# False positives: 879 0.066% (0.485% of nonspam, 162822 weighted)
-# False negatives: 142617 10.636% (12.298% of spam, 321754 weighted)
-# Average score for spam: 11.9 nonspam: 0.8
-# Average for false-pos: 5.8 false-neg: 2.3
-# TOTAL: 1340836 100.00%
+# Correctly non-spam: 845103 42.024% (99.764% of non-spam corpus)
+# Correctly spam: 862142 42.871% (74.073% of spam corpus)
+# False positives: 1999 0.099% (0.236% of nonspam, 89006 weighted)
+# False negatives: 301769 15.006% (25.927% of spam, 756915 weighted)
+# Average score for spam: 9.0 nonspam: 0.5
+# Average for false-pos: 6.5 false-neg: 2.5
+# TOTAL: 2011013 100.00%

Reading scores from "tmprules"...
Reading per-message hit stat logs and scores...

# SUMMARY for threshold 5.0:
-# Correctly non-spam: 22562 99.16%
-# Correctly spam: 127393 88.01%
-# False positives: 190 0.84%
-# False negatives: 17354 11.99%
-# TCR(l=50): 5.390147 SpamRecall: 88.011% SpamPrec: 99.851%
+# Correctly non-spam: 105294 99.70%
+# Correctly spam: 107939 74.31%
+# False positives: 321 0.30%
+# False negatives: 37322 25.69%
+# TCR(l=50): 2.721671 SpamRecall: 74.307% SpamPrec: 99.703%

##### WITHOUT NEW RULES AND SCORES #####
Reading scores from "../rules-base"...
Reading per-message hit stat logs and scores...

# SUMMARY for threshold 5.0:
-# Correctly non-spam: 172618 95.28%
-# Correctly spam: 419407 36.17%
-# False positives: 8548 4.72%
-# False negatives: 740263 63.83%
-# TCR(l=50): 0.993155 SpamRecall: 36.166% SpamPrec: 98.003%
+# Correctly non-spam: 838015 98.93%
+# Correctly spam: 421069 36.18%
+# False positives: 9087 1.07%
+# False negatives: 742842 63.82%
+# TCR(l=50): 0.972201 SpamRecall: 36.177% SpamPrec: 97.888%
Reading scores from "../rules-base"...
Reading per-message hit stat logs and scores...

# SUMMARY for threshold 5.0:
-# Correctly non-spam: 21668 95.24%
-# Correctly spam: 52522 36.29%
-# False positives: 1084 4.76%
-# False negatives: 92225 63.71%
-# TCR(l=50): 0.988540 SpamRecall: 36.285% SpamPrec: 97.978%
+# Correctly non-spam: 104468 98.91%
+# Correctly spam: 52546 36.17%
+# False positives: 1147 1.09%
+# False negatives: 92715 63.83%
+# TCR(l=50): 0.967987 SpamRecall: 36.174% SpamPrec: 97.864%

Modified: spamassassin/trunk/rulesrc/scores/stats-set1
URL: http://svn.apache.org/viewvc/spamassassin/trunk/rulesrc/scores/stats-set1?rev=1881603&r1=1881602&r2=1881603&view=diff
==============================================================================
--- spamassassin/trunk/rulesrc/scores/stats-set1 (original)
+++ spamassassin/trunk/rulesrc/scores/stats-set1 Thu Sep 10 03:23:25 2020
@@ -1,40 +1,40 @@
##### WITH NEW RULES AND SCORES #####

# SUMMARY for threshold 5.0:
-# Correctly non-spam: 424032 26.729% (99.613% of non-spam corpus)
-# Correctly spam: 1096085 69.092% (94.430% of spam corpus)
-# False positives: 1649 0.104% (0.387% of nonspam, 310945 weighted)
-# False negatives: 64650 4.075% (5.570% of spam, 118908 weighted)
-# Average score for spam: 16.0 nonspam: -1.4
+# Correctly non-spam: 424058 26.732% (99.620% of non-spam corpus)
+# Correctly spam: 1093780 68.949% (94.236% of spam corpus)
+# False positives: 1619 0.102% (0.380% of nonspam, 306320 weighted)
+# False negatives: 66902 4.217% (5.764% of spam, 123359 weighted)
+# Average score for spam: 15.5 nonspam: -1.4
# Average for false-pos: 6.9 false-neg: 1.8
-# TOTAL: 1586416 100.00%
+# TOTAL: 1586359 100.00%

Reading scores from "tmprules"...
Reading per-message hit stat logs and scores...

# SUMMARY for threshold 5.0:
-# Correctly non-spam: 52852 99.62%
-# Correctly spam: 136985 94.55%
-# False positives: 204 0.38%
-# False negatives: 7894 5.45%
-# TCR(l=50): 8.007019 SpamRecall: 94.551% SpamPrec: 99.851%
+# Correctly non-spam: 52848 99.61%
+# Correctly spam: 136715 94.37%
+# False positives: 207 0.39%
+# False negatives: 8157 5.63%
+# TCR(l=50): 7.827957 SpamRecall: 94.370% SpamPrec: 99.849%

##### WITHOUT NEW RULES AND SCORES #####
Reading scores from "../rules-base"...
Reading per-message hit stat logs and scores...

# SUMMARY for threshold 5.0:
-# Correctly non-spam: 423140 99.40%
-# Correctly spam: 700810 60.38%
-# False positives: 2541 0.60%
-# False negatives: 459925 39.62%
-# TCR(l=50): 1.977486 SpamRecall: 60.376% SpamPrec: 99.639%
+# Correctly non-spam: 423139 99.40%
+# Correctly spam: 700698 60.37%
+# False positives: 2538 0.60%
+# False negatives: 459984 39.63%
+# TCR(l=50): 1.977703 SpamRecall: 60.370% SpamPrec: 99.639%
Reading scores from "../rules-base"...
Reading per-message hit stat logs and scores...

# SUMMARY for threshold 5.0:
-# Correctly non-spam: 52743 99.41%
-# Correctly spam: 87488 60.39%
-# False positives: 313 0.59%
-# False negatives: 57391 39.61%
-# TCR(l=50): 1.983530 SpamRecall: 60.387% SpamPrec: 99.644%
+# Correctly non-spam: 52729 99.39%
+# Correctly spam: 87483 60.39%
+# False positives: 326 0.61%
+# False negatives: 57389 39.61%
+# TCR(l=50): 1.965992 SpamRecall: 60.386% SpamPrec: 99.629%