Mailing List Archive

svn commit: r1914079 [2/2] - in /spamassassin/trunk/rulesrc/scores: 72_scores.cf scores-set0 scores-set1 scores-set2 scores-set3 stats-set0 stats-set1
Modified: spamassassin/trunk/rulesrc/scores/scores-set3
URL: http://svn.apache.org/viewvc/spamassassin/trunk/rulesrc/scores/scores-set3?rev=1914079&r1=1914078&r2=1914079&view=diff
==============================================================================
--- spamassassin/trunk/rulesrc/scores/scores-set3 (original)
+++ spamassassin/trunk/rulesrc/scores/scores-set3 Fri Nov 24 02:42:23 2023
@@ -9,87 +9,87 @@ score AC_HTML_NONSENSE_TAGS 1.9
score AC_POST_EXTRAS 2.499
score ADMITS_SPAM 2.599
score ADVANCE_FEE_2_NEW_MONEY 1.999
-score ADVANCE_FEE_3_NEW 3.267
-score ADVANCE_FEE_3_NEW_MONEY 0.001
-score ADVANCE_FEE_4_NEW_FRM_MNY 0.686
-score ADVANCE_FEE_4_NEW_MONEY 1.654
-score ADVANCE_FEE_5_NEW_FRM_MNY 0.597
-score ADVANCE_FEE_5_NEW_MONEY 2.419
+score ADVANCE_FEE_3_NEW 3.265
+score ADVANCE_FEE_3_NEW_MONEY 1.565
+score ADVANCE_FEE_4_NEW_FRM_MNY 0.902
+score ADVANCE_FEE_4_NEW_MONEY 1.650
+score ADVANCE_FEE_5_NEW_FRM_MNY 0.693
+score ADVANCE_FEE_5_NEW_MONEY 2.555
score AD_PREFS 0.001
score AMAZON_IMG_NOT_RCVD_AMZN 2.499
score AXB_XMAILER_MIMEOLE_OL_024C2 0.001
score BITCOIN_DEADLINE 2.999
-score BITCOIN_EXTORT_01 0.905
-score BITCOIN_EXTORT_02 2.304
-score BITCOIN_MALF_HTML 2.798
-score BITCOIN_ONAN 2.999
-score BITCOIN_PAY_ME 2.282
-score BITCOIN_SPAM_02 0.537
+score BITCOIN_EXTORT_01 1.025
+score BITCOIN_EXTORT_02 2.813
+score BITCOIN_MALF_HTML 2.927
+score BITCOIN_ONAN 2.972
+score BITCOIN_PAY_ME 2.455
+score BITCOIN_SPAM_02 0.426
score BITCOIN_SPAM_04 1.499
score BITCOIN_SPAM_05 0.001
score BITCOIN_SPAM_07 0.001
score BITCOIN_TOEQFM 3.499
score BITCOIN_VISTA 0.001
-score BITCOIN_XPRIO 2.500
-score BITCOIN_YOUR_INFO 1.258
+score BITCOIN_XPRIO 2.499
+score BITCOIN_YOUR_INFO 1.311
score BODY_SINGLE_WORD 0.898
-score BODY_URI_ONLY 2.545
-score BOGUS_MIME_VERSION 2.098
-score CK_HELO_GENERIC 0.250
+score BODY_URI_ONLY 2.541
+score BOGUS_MIME_VERSION 2.197
+score CK_HELO_GENERIC 0.249
score CTE_8BIT_MISMATCH 0.001
-score DEAR_BENEFICIARY 2.243
-score DKIMWL_WL_HIGH -0.088
+score DEAR_BENEFICIARY 2.247
+score DKIMWL_WL_HIGH -0.001
score DKIMWL_WL_MED -0.001 # force non-zero
-score DKIMWL_WL_MEDHI -0.001
+score DKIMWL_WL_MEDHI -0.001 # force non-zero
score END_FUTURE_EMAILS 2.499
score FACEBOOK_IMG_NOT_RCVD_FB 1.999
score FILL_THIS_FORM 0.899
-score FONT_INVIS_DIRECT 0.001
-score FONT_INVIS_LONG_LINE 2.498
+score FONT_INVIS_DIRECT 0.001 # force non-zero
+score FONT_INVIS_LONG_LINE 2.496
score FONT_INVIS_MSGID 0.552
-score FONT_INVIS_POSTEXTRAS 0.756
-score FORGED_SPF_HELO 1.799
+score FONT_INVIS_POSTEXTRAS 0.720
+score FORGED_SPF_HELO 1.699
score FORM_FRAUD_5 2.499
score FREEMAIL_FORGED_FROMDOMAIN 0.250
score FROMSPACE 2.399
-score FROM_ADDR_WS 1.048
+score FROM_ADDR_WS 1.046
score FROM_FMBLA_NEWDOM28 0.001
-score FROM_GOV_DKIM_AU -0.999
+score FROM_GOV_DKIM_AU -0.831
score FROM_IN_TO_AND_SUBJ 1.499
score FROM_MISSPACED 0.001
score FROM_MISSP_DYNIP 2.299
-score FROM_MISSP_EH_MATCH 1.999
+score FROM_MISSP_EH_MATCH 1.807
score FROM_MISSP_FREEMAIL 2.499
-score FROM_MISSP_MSFT 0.522
-score FROM_MISSP_REPLYTO 2.068
-score FROM_MISSP_SPF_FAIL 1.350
+score FROM_MISSP_MSFT 0.520
+score FROM_MISSP_REPLYTO 2.074
+score FROM_MISSP_SPF_FAIL 1.597
score FROM_MISSP_USER 0.001
-score FROM_PAYPAL_SPOOF 0.318
+score FROM_PAYPAL_SPOOF 0.001
score FROM_SUSPICIOUS_NTLD 0.499
-score FROM_SUSPICIOUS_NTLD_FP 0.333
+score FROM_SUSPICIOUS_NTLD_FP 0.338
score FROM_WSP_TRAIL 2.399
-score FSL_BULK_SIG 0.938
+score FSL_BULK_SIG 0.939
score FSL_CTYPE_WIN1251 0.001
score FSL_HAS_TINYURL 1.799
-score FSL_HELO_FAKE 1.386
+score FSL_HELO_FAKE 1.295
score FSL_NEW_HELO_USER 0.001
score FUZZY_BITCOIN 0.001
score FUZZY_WALLET 1.799
score GB_BITCOIN_CP 0.001
score GB_CUSTOM_HTM_URI 1.499
-score GB_FAKE_RF_SHORT 1.149
+score GB_FAKE_RF_SHORT 1.130
score GB_FREEMAIL_DISPTO 0.001
-score GB_HASHBL_BTC 1.530
+score GB_HASHBL_BTC 1.528
score GOOG_REDIR_HTML_ONLY 1.999
score GOOG_STO_IMG_HTML 2.999
-score GOOG_STO_NOIMG_HTML 2.975
+score GOOG_STO_NOIMG_HTML 1.886
score HAS_X_OUTGOING_SPAM_STAT 0.001
score HDRS_LCASE_IMGONLY 0.099
score HDRS_MISSP 2.499
score HDR_ORDER_FTSDMCXX_DIRECT 0.001
score HDR_ORDER_FTSDMCXX_NORDNS 0.001
score HEADER_FROM_DIFFERENT_DOMAINS 0.250
-score HELO_MISC_IP 0.249
+score HELO_MISC_IP 0.250
score HELO_NO_DOMAIN 0.001
score HK_NAME_FM_MR_MRS 1.499
score HK_NAME_MR_MRS 0.999
@@ -97,108 +97,108 @@ score HK_RANDOM_ENVFROM 0.9
score HK_RANDOM_FROM 0.999
score HK_RANDOM_REPLYTO 0.999
score HK_SCAM 1.999
-score HOSTED_IMG_DIRECT_MX 3.156
-score HOSTED_IMG_FREEM 2.614
-score HOSTED_IMG_MULTI_PUB_01 2.999
-score HREF_EMPTY_PHPMAIL 2.499
-score HTML_BADATTR 0.999
-score HTML_ENTITY_ASCII_TINY 2.998
-score HTML_FONT_TINY_NORDNS 1.054
+score HOSTED_IMG_DIRECT_MX 2.950
+score HOSTED_IMG_FREEM 2.617
+score HOSTED_IMG_MULTI_PUB_01 3.000
+score HREF_EMPTY_PHPMAIL 2.500
+score HTML_BADATTR 0.667
+score HTML_ENTITY_ASCII_TINY 2.689
+score HTML_FONT_TINY_NORDNS 1.362
score HTML_SINGLET_MANY 2.499
score HTML_TEXT_INVISIBLE_FONT 1.999
-score HTML_TEXT_INVISIBLE_STYLE 2.210
+score HTML_TEXT_INVISIBLE_STYLE 1.850
score JH_SPAMMY_HEADERS 3.499
-score KHOP_HELO_FCRDNS 0.001
+score KHOP_HELO_FCRDNS 0.001 # force non-zero
score LONGLN_LOW_CONTRAST 2.499
-score LONG_HEX_URI 2.800
-score LONG_IMG_URI 2.999
-score LONG_INVISIBLE_TEXT 2.678
+score LONG_HEX_URI 2.797
+score LONG_IMG_URI 2.939
+score LONG_INVISIBLE_TEXT 2.694
score LOTS_OF_MONEY 0.010
score LOTTO_DEPT 1.999
score MALFORMED_FREEMAIL 3.199
-score MALWARE_NORDNS 2.403
-score MALW_ATTACH 2.399
+score MALWARE_NORDNS 2.742
+score MALW_ATTACH 2.400
score MANY_SPAN_IN_TEXT 2.299
score MANY_SUBDOM 2.299
-score MILLION_HUNDRED 0.001
-score MILLION_USD 0.001
+score MILLION_HUNDRED 0.001 # force non-zero
+score MILLION_USD 0.001 # force non-zero
score MIMEOLE_DIRECT_TO_MX 0.001
-score MIME_NO_TEXT 0.523
+score MIME_NO_TEXT 1.670
score MIXED_ES 2.299
-score MIXED_HREF_CASE 1.999
-score MONEY_ATM_CARD 0.294
-score MONEY_FORM 1.493
+score MIXED_HREF_CASE 2.000
+score MONEY_ATM_CARD 0.493
+score MONEY_FORM 1.400
score MONEY_FORM_SHORT 2.499
-score MONEY_FRAUD_3 1.656
+score MONEY_FRAUD_3 1.803
score MONEY_FRAUD_5 0.001
score MONEY_FRAUD_8 0.001
-score MONEY_FREEMAIL_REPTO 2.220
+score MONEY_FREEMAIL_REPTO 2.088
score MONEY_FROM_MISSP 0.001
score NA_DOLLARS 1.499
-score NICE_REPLY_A -2.933
-score NORDNS_LOW_CONTRAST 1.840
-score NO_FM_NAME_IP_HOSTN 0.036
+score NICE_REPLY_A -1.592
+score NORDNS_LOW_CONTRAST 1.774
+score NO_FM_NAME_IP_HOSTN 0.039
score NSL_RCVD_FROM_USER 0.001
-score NSL_RCVD_HELO_USER 0.339
-score NUMBERONLY_BITCOIN_EXP 1.742
+score NSL_RCVD_HELO_USER 0.407
+score NUMBERONLY_BITCOIN_EXP 1.766
score OBFU_BITCOIN 0.001 # force non-zero
score OBFU_TEXT_ATTACH 1.599
-score ODD_FREEM_REPTO 2.448
+score ODD_FREEM_REPTO 2.447
score PDS_BAD_THREAD_QP_64 0.999
-score PDS_BTC_ID 0.500
+score PDS_BTC_ID 0.499
score PDS_BTC_MSGID 0.001
-score PDS_FRNOM_TODOM_NAKED_TO 1.499
-score PDS_FROM_2_EMAILS 2.579
+score PDS_FRNOM_TODOM_NAKED_TO 1.500
+score PDS_FROM_2_EMAILS 2.577
score PDS_FROM_NAME_TO_DOMAIN 1.999
score PDS_HELO_SPF_FAIL 1.999
score PDS_HP_HELO_NORDNS 0.001
-score PDS_NAKED_TO_NUMERO 1.999
+score PDS_NAKED_TO_NUMERO 1.594
score PHP_SCRIPT 2.499
-score PP_MIME_FAKE_ASCII_TEXT 0.001 # force non-zero
+score PP_MIME_FAKE_ASCII_TEXT 0.001
score RAND_MKTG_HEADER 1.999
score RATWARE_NO_RDNS 0.001
-score RCVD_IN_MSPIKE_H2 -0.001 # force non-zero
-score SCC_BODY_SINGLE_WORD 0.001 # force non-zero
-score SCC_CANSPAM_2 2.999
+score RCVD_IN_MSPIKE_H2 -0.001
+score SCC_BODY_SINGLE_WORD 0.001
+score SCC_CANSPAM_2 2.899
score SCC_ISEMM_LID_1B 1.499
-score SENDGRID_REDIR 1.010
+score SENDGRID_REDIR 1.033
score SHOPIFY_IMG_NOT_RCVD_SFY 2.499
-score SHORTENER_SHORT_IMG 1.395
-score SHORT_SHORTNER 1.999
-score SPOOFED_FREEMAIL 0.001
+score SHORTENER_SHORT_IMG 1.397
+score SHORT_SHORTNER 2.000
+score SPOOFED_FREEMAIL 0.001 # force non-zero
score SPOOFED_FREEMAIL_NO_RDNS 0.001
-score SPOOFED_FREEM_REPTO 0.785
-score STATIC_XPRIO_OLE 1.266
-score STOX_BOUND_090909_B 0.921
+score SPOOFED_FREEM_REPTO 0.827
+score STATIC_XPRIO_OLE 1.265
+score STOX_BOUND_090909_B 0.793
score SUBJ_ATTENTION 0.499
score TEQF_USR_POLITE 1.999
score THIS_AD 1.099
-score TO_EQ_FM_DIRECT_MX 2.499
-score TO_EQ_FM_DOM_SPF_FAIL 0.870
+score TO_EQ_FM_DIRECT_MX 2.500
+score TO_EQ_FM_DOM_SPF_FAIL 0.829
score TO_EQ_FM_SPF_FAIL 0.001
-score TO_IN_SUBJ 0.099
-score TO_NO_BRKTS_FROM_MSSP 2.499
+score TO_IN_SUBJ 0.100
+score TO_NO_BRKTS_FROM_MSSP 2.500
score TO_NO_BRKTS_HTML_IMG 1.999
score TO_NO_BRKTS_HTML_ONLY 1.999
-score TO_NO_BRKTS_MSFT 2.228
+score TO_NO_BRKTS_MSFT 2.233
score TO_NO_BRKTS_NORDNS_HTML 1.999
-score TO_NO_BRKTS_PCNT 1.639
+score TO_NO_BRKTS_PCNT 1.640
score TVD_SPACE_RATIO_MINFP 0.001
score UNDISC_FREEM 2.599
score UNDISC_MONEY 2.799
-score UNICODE_OBFU_ZW_MANY 2.820
-score URI_DOTEDU 1.180
-score URI_GOOGLE_PROXY 2.199
+score UNICODE_OBFU_ZW_MANY 2.821
+score URI_DOTEDU 0.231
+score URI_GOOGLE_PROXY 2.099
score URI_IN_URI_5 3.199
-score URI_PHISH 1.626
-score URI_PHP_REDIR 2.823
+score URI_PHISH 1.627
+score URI_PHP_REDIR 2.818
score URI_TRY_3LD 1.999
score URI_WPADMIN 2.299
-score URI_WP_HACKED_2 2.499
+score URI_WP_HACKED_2 2.500
score VFY_ACCT_NORDNS 2.999
-score VISTA_COST 2.216
+score VISTA_COST 2.383
score VISTA_TONOM_EQ_TOLOC 2.499
-score WORD_INVIS 1.898
+score WORD_INVIS 1.895
score WORD_INVIS_MANY 2.999
score XFER_LOTSA_MONEY 0.001
score XM_RANDOM 2.499
@@ -277,7 +277,6 @@ score GAPPY_SALES_LEADS_FREEM 1.0
score GB_FORGED_MUA_POSTFIX 1.000
score GB_FREEMAIL_DISPTO_NOTFREEM 0.500
score GB_GOOGLE_OBFUR 0.750
-score GB_STORAGE_GOOGLE_EMAIL 1.000
score GOOGLE_DOCS_PHISH 1.000
score GOOGLE_DOCS_PHISH_MANY 1.000
score GOOGLE_DOC_SUSP 1.000

Modified: spamassassin/trunk/rulesrc/scores/stats-set0
URL: http://svn.apache.org/viewvc/spamassassin/trunk/rulesrc/scores/stats-set0?rev=1914079&r1=1914078&r2=1914079&view=diff
==============================================================================
--- spamassassin/trunk/rulesrc/scores/stats-set0 (original)
+++ spamassassin/trunk/rulesrc/scores/stats-set0 Fri Nov 24 02:42:23 2023
@@ -1,40 +1,40 @@
##### WITH NEW RULES AND SCORES #####

# SUMMARY for threshold 5.0:
-# Correctly non-spam: 426795 58.178% (99.318% of non-spam corpus)
-# Correctly spam: 206508 28.150% (67.958% of spam corpus)
-# False positives: 2929 0.399% (0.682% of nonspam, 62003 weighted)
-# False negatives: 97367 13.273% (32.042% of spam, 204023 weighted)
-# Average score for spam: 7.8 nonspam: 0.5
-# Average for false-pos: 6.0 false-neg: 2.1
-# TOTAL: 733599 100.00%
+# Correctly non-spam: 430175 60.867% (99.310% of non-spam corpus)
+# Correctly spam: 184303 26.078% (67.367% of spam corpus)
+# False positives: 2990 0.423% (0.690% of nonspam, 56564 weighted)
+# False negatives: 89277 12.632% (32.633% of spam, 181074 weighted)
+# Average score for spam: 7.6 nonspam: 0.6
+# Average for false-pos: 6.0 false-neg: 2.0
+# TOTAL: 706745 100.00%

Reading scores from "tmprules"...
Reading per-message hit stat logs and scores...

# SUMMARY for threshold 5.0:
-# Correctly non-spam: 53177 99.28%
-# Correctly spam: 24174 63.73%
-# False positives: 384 0.72%
-# False negatives: 13755 36.27%
-# TCR(l=50): 1.150933 SpamRecall: 63.735% SpamPrec: 98.436%
+# Correctly non-spam: 53598 99.30%
+# Correctly spam: 21666 63.36%
+# False positives: 379 0.70%
+# False negatives: 12530 36.64%
+# TCR(l=50): 1.086277 SpamRecall: 63.358% SpamPrec: 98.281%

##### WITHOUT NEW RULES AND SCORES #####
Reading scores from "../rules-base"...
Reading per-message hit stat logs and scores...

# SUMMARY for threshold 5.0:
-# Correctly non-spam: 418555 97.40%
-# Correctly spam: 114338 37.63%
-# False positives: 11169 2.60%
-# False negatives: 189537 62.37%
-# TCR(l=50): 0.406257 SpamRecall: 37.627% SpamPrec: 91.101%
+# Correctly non-spam: 421899 97.40%
+# Correctly spam: 106168 38.81%
+# False positives: 11266 2.60%
+# False negatives: 167412 61.19%
+# TCR(l=50): 0.374402 SpamRecall: 38.807% SpamPrec: 90.407%
Reading scores from "../rules-base"...
Reading per-message hit stat logs and scores...

# SUMMARY for threshold 5.0:
-# Correctly non-spam: 52164 97.39%
-# Correctly spam: 14363 37.87%
-# False positives: 1397 2.61%
-# False negatives: 23566 62.13%
-# TCR(l=50): 0.406023 SpamRecall: 37.868% SpamPrec: 91.136%
+# Correctly non-spam: 52556 97.37%
+# Correctly spam: 13225 38.67%
+# False positives: 1421 2.63%
+# False negatives: 20971 61.33%
+# TCR(l=50): 0.371611 SpamRecall: 38.674% SpamPrec: 90.298%

Modified: spamassassin/trunk/rulesrc/scores/stats-set1
URL: http://svn.apache.org/viewvc/spamassassin/trunk/rulesrc/scores/stats-set1?rev=1914079&r1=1914078&r2=1914079&view=diff
==============================================================================
--- spamassassin/trunk/rulesrc/scores/stats-set1 (original)
+++ spamassassin/trunk/rulesrc/scores/stats-set1 Fri Nov 24 02:42:23 2023
@@ -1,23 +1,23 @@
##### WITH NEW RULES AND SCORES #####

# SUMMARY for threshold 5.0:
-# Correctly non-spam: 401186 85.184% (99.448% of non-spam corpus)
-# Correctly spam: 27276 5.792% (40.378% of spam corpus)
-# False positives: 2227 0.473% (0.552% of nonspam, 23815 weighted)
-# False negatives: 40276 8.552% (59.622% of spam, 45787 weighted)
-# Average score for spam: 6.4 nonspam: -0.9
+# Correctly non-spam: 401176 85.182% (99.445% of non-spam corpus)
+# Correctly spam: 27340 5.805% (40.474% of spam corpus)
+# False positives: 2237 0.475% (0.555% of nonspam, 23905 weighted)
+# False negatives: 40210 8.538% (59.526% of spam, 45524 weighted)
+# Average score for spam: 6.4 nonspam: -0.8
# Average for false-pos: 6.4 false-neg: 1.1
-# TOTAL: 470965 100.00%
+# TOTAL: 470963 100.00%

Reading scores from "tmprules"...
Reading per-message hit stat logs and scores...

# SUMMARY for threshold 5.0:
-# Correctly non-spam: 50093 99.52%
-# Correctly spam: 3445 40.43%
-# False positives: 243 0.48%
-# False negatives: 5076 59.57%
-# TCR(l=50): 0.494659 SpamRecall: 40.430% SpamPrec: 93.411%
+# Correctly non-spam: 50101 99.53%
+# Correctly spam: 3435 40.31%
+# False positives: 235 0.47%
+# False negatives: 5086 59.69%
+# TCR(l=50): 0.506118 SpamRecall: 40.312% SpamPrec: 93.597%

##### WITHOUT NEW RULES AND SCORES #####
Reading scores from "../rules-base"...
@@ -25,16 +25,16 @@ Reading per-message hit stat logs and sc

# SUMMARY for threshold 5.0:
# Correctly non-spam: 402119 99.68%
-# Correctly spam: 15130 22.40%
+# Correctly spam: 15151 22.43%
# False positives: 1294 0.32%
-# False negatives: 52422 77.60%
-# TCR(l=50): 0.576766 SpamRecall: 22.398% SpamPrec: 92.121%
+# False negatives: 52399 77.57%
+# TCR(l=50): 0.576862 SpamRecall: 22.429% SpamPrec: 92.131%
Reading scores from "../rules-base"...
Reading per-message hit stat logs and scores...

# SUMMARY for threshold 5.0:
# Correctly non-spam: 50167 99.66%
-# Correctly spam: 1950 22.88%
+# Correctly spam: 1947 22.85%
# False positives: 169 0.34%
-# False negatives: 6571 77.12%
-# TCR(l=50): 0.567272 SpamRecall: 22.885% SpamPrec: 92.025%
+# False negatives: 6574 77.15%
+# TCR(l=50): 0.567159 SpamRecall: 22.849% SpamPrec: 92.013%