Mailing List Archive

svn commit: r1915099 [2/2] - in /spamassassin/trunk/rulesrc/scores: 72_scores.cf scores-set0 scores-set1 scores-set2 scores-set3 stats-set0 stats-set1
Modified: spamassassin/trunk/rulesrc/scores/scores-set3
URL: http://svn.apache.org/viewvc/spamassassin/trunk/rulesrc/scores/scores-set3?rev=1915099&r1=1915098&r2=1915099&view=diff
==============================================================================
--- spamassassin/trunk/rulesrc/scores/scores-set3 (original)
+++ spamassassin/trunk/rulesrc/scores/scores-set3 Sat Jan 6 02:44:31 2024
@@ -5,192 +5,192 @@ score ACCT_PHISHING_MANY 2.9
score AC_BR_BONANZA 0.001
score AC_DIV_BONANZA 0.001
score AC_HTML_NONSENSE_TAGS 1.997
-score AC_POST_EXTRAS 1.586
+score AC_POST_EXTRAS 1.337
score ADMITS_SPAM 1.697
score ADVANCE_FEE_2_NEW_MONEY 1.997
score ADVANCE_FEE_3_NEW 3.496
-score ADVANCE_FEE_3_NEW_MONEY 0.980
+score ADVANCE_FEE_3_NEW_MONEY 0.938
score ADVANCE_FEE_4_NEW_MONEY 2.397
score ADVANCE_FEE_5_NEW_FRM_MNY 0.001
-score ADVANCE_FEE_5_NEW_MONEY 1.645
-score AD_PREFS 0.192
-score AMAZON_IMG_NOT_RCVD_AMZN 2.498
+score ADVANCE_FEE_5_NEW_MONEY 1.687
+score AD_PREFS 0.016
+score AMAZON_IMG_NOT_RCVD_AMZN 2.497
score AXB_XMAILER_MIMEOLE_OL_024C2 0.001
score AXB_X_FF_SEZ_S 2.996
-score BITCOIN_EXTORT_01 2.321
+score BITCOIN_EXTORT_01 2.005
score BITCOIN_MALF_HTML 0.001
score BITCOIN_SPAM_02 2.497
-score BITCOIN_SPAM_05 2.468
-score BITCOIN_SPAM_07 1.288
-score BITCOIN_SPAM_08 0.188
+score BITCOIN_SPAM_05 2.271
+score BITCOIN_SPAM_07 0.830
+score BITCOIN_SPAM_08 0.473
score BITCOIN_TOEQFM 0.001
score BITCOIN_VISTA 0.001
-score BITCOIN_XPRIO 0.804
+score BITCOIN_XPRIO 0.948
score BITCOIN_YOUR_INFO 2.996
-score BODY_SINGLE_URI 0.037
+score BODY_SINGLE_URI 0.067
score BODY_SINGLE_WORD 0.001
score BODY_URI_ONLY 0.001
-score CK_HELO_GENERIC 0.248
-score CTE_8BIT_MISMATCH 0.001 # force non-zero
+score CK_HELO_GENERIC 0.249
+score CTE_8BIT_MISMATCH 0.001
score DEAR_BENEFICIARY 2.896
-score DKIMWL_WL_HIGH -2.679
+score DKIMWL_WL_HIGH -2.540
score DKIMWL_WL_MED -0.001
score DKIMWL_WL_MEDHI -0.001
-score DYNAMIC_IMGUR 1.391
+score DYNAMIC_IMGUR 2.331
score END_FUTURE_EMAILS 2.497
-score FILL_THIS_FORM 0.075
-score FONT_INVIS_DIRECT 0.001
+score FILL_THIS_FORM 0.071
+score FONT_INVIS_DIRECT 0.001 # force non-zero
score FONT_INVIS_LONG_LINE 2.996
-score FONT_INVIS_MSGID 1.024
-score FONT_INVIS_NORDNS 1.650
-score FONT_INVIS_POSTEXTRAS 2.224
+score FONT_INVIS_MSGID 1.039
+score FONT_INVIS_NORDNS 0.739
+score FONT_INVIS_POSTEXTRAS 2.473
score FORGED_SPF_HELO 3.096
score FORM_FRAUD 0.998
-score FORM_FRAUD_5 1.975
+score FORM_FRAUD_5 0.888
score FREEMAIL_FORGED_FROMDOMAIN 0.248
score FROM_ADDR_WS 2.996
score FROM_FMBLA_NEWDOM28 0.798
-score FROM_GOV_DKIM_AU -0.529
-score FROM_IN_TO_AND_SUBJ 1.012
+score FROM_GOV_DKIM_AU -0.244
+score FROM_IN_TO_AND_SUBJ 0.001
score FROM_MISSPACED 1.997
-score FROM_MISSP_DYNIP 0.433
+score FROM_MISSP_DYNIP 0.434
score FROM_MISSP_EH_MATCH 0.001
-score FROM_MISSP_FREEMAIL 1.488
-score FROM_MISSP_MSFT 1.626
-score FROM_MISSP_REPLYTO 1.390
+score FROM_MISSP_FREEMAIL 1.493
+score FROM_MISSP_MSFT 1.350
+score FROM_MISSP_REPLYTO 1.296
score FROM_MISSP_SPF_FAIL 1.997
-score FROM_MISSP_TO_UNDISC 3.086
+score FROM_MISSP_TO_UNDISC 4.099
score FROM_MISSP_USER 0.001
-score FROM_MISSP_XPRIO 0.953
-score FROM_PAYPAL_SPOOF 0.610
-score FROM_SUSPICIOUS_NTLD 0.498
+score FROM_MISSP_XPRIO 0.938
+score FROM_PAYPAL_SPOOF 0.001
+score FROM_SUSPICIOUS_NTLD 0.499
score FROM_SUSPICIOUS_NTLD_FP 1.997
score FSL_BULK_SIG 0.001
score FSL_CTYPE_WIN1251 0.001
score FSL_NEW_HELO_USER 0.001
-score FUZZY_AMAZON 1.864
-score FUZZY_BITCOIN 0.844
-score FUZZY_IMPORTANT 0.483
+score FUZZY_AMAZON 2.498
+score FUZZY_BITCOIN 1.728
+score FUZZY_IMPORTANT 1.145
score FUZZY_WALLET 1.897
-score GB_BITCOIN_CP 1.270
+score GB_BITCOIN_CP 1.922
score GB_CUSTOM_HTM_URI 1.498
-score GB_FAKE_RF_SHORT 1.142
+score GB_FAKE_RF_SHORT 1.124
score GB_FREEMAIL_DISPTO 0.001
-score GB_HASHBL_BTC 1.349
-score GOOG_REDIR_NORDNS 0.123
+score GB_HASHBL_BTC 1.473
+score GOOG_REDIR_NORDNS 0.115
score GOOG_STO_IMG_HTML 2.996
-score GOOG_STO_NOIMG_HTML 2.999
-score HDRS_LCASE_IMGONLY 0.098
+score GOOG_STO_NOIMG_HTML 2.740
+score HDRS_LCASE_IMGONLY 0.099
score HDRS_MISSP 2.497
score HDR_ORDER_FTSDMCXX_DIRECT 0.001
score HDR_ORDER_FTSDMCXX_NORDNS 0.001
-score HEADER_FROM_DIFFERENT_DOMAINS 0.249
+score HEADER_FROM_DIFFERENT_DOMAINS 0.248
score HELO_MISC_IP 0.248
score HELO_NO_DOMAIN 0.001
score HK_NAME_FM_MR_MRS 1.498
score HK_NAME_MR_MRS 0.998
score HK_RANDOM_ENVFROM 0.998
-score HK_RANDOM_FROM 0.998
-score HK_RANDOM_REPLYTO 0.938
+score HK_RANDOM_FROM 0.999
+score HK_RANDOM_REPLYTO 0.951
score HK_SCAM 1.997
score HOSTED_IMG_DIRECT_MX 3.496
-score HOSTED_IMG_FREEM 3.031
-score HOSTED_IMG_MULTI_PUB_01 2.996
-score HTML_BADATTR 0.998
+score HOSTED_IMG_FREEM 3.011
+score HOSTED_IMG_MULTI_PUB_01 2.997
+score HTML_BADATTR 0.999
score HTML_FONT_TINY_NORDNS 0.001
score HTML_SINGLET_MANY 2.497
-score HTML_TEXT_INVISIBLE_FONT 1.535
-score HTML_TEXT_INVISIBLE_STYLE 1.775
+score HTML_TEXT_INVISIBLE_FONT 1.547
+score HTML_TEXT_INVISIBLE_STYLE 1.789
score JH_SPAMMY_HEADERS 3.496
-score KHOP_HELO_FCRDNS 0.001
+score KHOP_HELO_FCRDNS 0.001 # force non-zero
score LONG_HEX_URI 2.996
score LONG_IMG_URI 2.996
-score LONG_INVISIBLE_TEXT 2.678
+score LONG_INVISIBLE_TEXT 2.694
score LOTS_OF_MONEY 0.010
score LOTTO_DEPT 1.997
score MALFORMED_FREEMAIL 2.297
-score MILLION_HUNDRED 0.001
-score MILLION_USD 0.728
+score MILLION_HUNDRED 0.001 # force non-zero
+score MILLION_USD 0.446
score MIMEOLE_DIRECT_TO_MX 0.001
score MIXED_AREA_CASE 0.001
-score MIXED_CENTER_CASE 1.417
+score MIXED_CENTER_CASE 2.447
score MIXED_ES 2.097
score MIXED_HREF_CASE 1.997
score MIXED_IMG_CASE 0.001
-score MONEY_ATM_CARD 1.709
+score MONEY_ATM_CARD 0.872
score MONEY_FORM 0.001
score MONEY_FORM_SHORT 2.497
-score MONEY_FRAUD_3 1.450
+score MONEY_FRAUD_3 0.884
score MONEY_FRAUD_5 2.596
-score MONEY_FRAUD_8 1.904
-score MONEY_FREEMAIL_REPTO 1.752
+score MONEY_FRAUD_8 0.984
+score MONEY_FREEMAIL_REPTO 1.792
score MONEY_FROM_MISSP 0.001
score NA_DOLLARS 1.498
-score NICE_REPLY_A -1.854
-score NO_FM_NAME_IP_HOSTN 1.245
+score NICE_REPLY_A -2.919
+score NO_FM_NAME_IP_HOSTN 0.472
score NSL_RCVD_FROM_USER 0.001
-score NSL_RCVD_HELO_USER 0.067
-score OBFU_BITCOIN 1.929
+score NSL_RCVD_HELO_USER 0.383
+score OBFU_BITCOIN 1.092
score OBFU_TEXT_ATTACH 1.597
-score PDS_BAD_THREAD_QP_64 0.998
-score PDS_BTC_ID 0.045
-score PDS_BTC_MSGID 0.001 # force non-zero
+score PDS_BAD_THREAD_QP_64 0.999
+score PDS_BTC_ID 0.001 # force non-zero
+score PDS_BTC_MSGID 0.001
score PDS_EMPTYSUBJ_URISHRT 1.498
score PDS_FRNOM_TODOM_DBL_URL 0.001
-score PDS_FRNOM_TODOM_NAKED_TO 0.827
-score PDS_FROM_NAME_TO_DOMAIN 1.469
+score PDS_FRNOM_TODOM_NAKED_TO 1.313
+score PDS_FROM_NAME_TO_DOMAIN 0.990
score PDS_HELO_SPF_FAIL 1.997
score PDS_HP_HELO_NORDNS 0.001
score PDS_NAKED_TO_NUMERO 1.997
score PDS_TINYSUBJ_URISHRT 1.498
-score PHP_SCRIPT 1.297
+score PHP_SCRIPT 1.847
score PP_MIME_FAKE_ASCII_TEXT 0.001
-score RAND_MKTG_HEADER 1.998
-score RATWARE_NO_RDNS 1.835
-score RCVD_IN_MSPIKE_H2 -0.001
+score RAND_MKTG_HEADER 1.997
+score RATWARE_NO_RDNS 1.087
+score RCVD_IN_MSPIKE_H2 -0.001 # force non-zero
score SCC_BODY_SINGLE_WORD 0.001
-score SCC_BODY_URI_ONLY 2.321
-score SCC_CANSPAM_2 3.096
-score SCC_ISEMM_LID_1B 0.875
-score SCC_SPAMMER_ADDR_2 0.001
-score SENDGRID_REDIR 0.325
+score SCC_BODY_URI_ONLY 2.316
+score SCC_CANSPAM_2 3.097
+score SCC_ISEMM_LID_1B 0.937
+score SCC_SPAMMER_ADDR_2 2.491
+score SENDGRID_REDIR 0.341
score SHOPIFY_IMG_NOT_RCVD_SFY 2.497
score SHORTENED_URL_SRC 2.397
score SHORT_SHORTNER 1.997
score SPOOFED_FREEMAIL 0.001
score SPOOFED_FREEMAIL_NO_RDNS 0.001
score SPOOFED_FREEM_REPTO 1.123
-score STATIC_XPRIO_OLE 1.285
-score SUBJ_ATTENTION 0.086
+score STATIC_XPRIO_OLE 1.266
+score SUBJ_ATTENTION 0.499
score THIS_AD 0.598
-score TO_EQ_FM_DIRECT_MX 0.654
-score TO_EQ_FM_DOM_SPF_FAIL 0.619
-score TO_EQ_FM_HTML_ONLY 0.631
-score TO_EQ_FM_SPF_FAIL 0.183
-score TO_IN_SUBJ 0.098
-score TO_NAME_SUBJ_NO_RDNS 1.265
+score TO_EQ_FM_DIRECT_MX 1.245
+score TO_EQ_FM_DOM_SPF_FAIL 0.744
+score TO_EQ_FM_HTML_ONLY 0.815
+score TO_EQ_FM_SPF_FAIL 0.058
+score TO_IN_SUBJ 0.099
+score TO_NAME_SUBJ_NO_RDNS 2.974
score TO_NO_BRKTS_FROM_MSSP 2.497
-score TO_NO_BRKTS_HTML_IMG 1.897
+score TO_NO_BRKTS_HTML_IMG 1.888
score TO_NO_BRKTS_HTML_ONLY 1.997
-score TO_NO_BRKTS_MSFT 2.147
-score TO_NO_BRKTS_NORDNS_HTML 1.336
-score TO_NO_BRKTS_PCNT 2.378
-score TVD_SPACE_RATIO_MINFP 0.163
+score TO_NO_BRKTS_MSFT 2.173
+score TO_NO_BRKTS_NORDNS_HTML 1.419
+score TO_NO_BRKTS_PCNT 2.346
+score TVD_SPACE_RATIO_MINFP 0.157
score UNDISC_FREEM 2.596
score UNDISC_MONEY 2.796
-score UNICODE_OBFU_ZW_MANY 0.475
-score URI_DOTEDU 0.001
-score URI_GOOGLE_PROXY 1.697
+score UNICODE_OBFU_ZW_MANY 0.472
+score URI_DOTEDU 0.834
+score URI_GOOGLE_PROXY 1.698
score URI_PHISH 3.995
score URI_TRY_3LD 1.997
score URI_WP_HACKED 3.496
score URI_WP_HACKED_2 2.497
-score VISTA_TONOM_EQ_TOLOC 2.497
+score VISTA_TONOM_EQ_TOLOC 2.498
score WIKI_IMG 1.897
-score WORD_INVIS 2.044
+score WORD_INVIS 2.048
score WORD_INVIS_MANY 2.996
-score XFER_LOTSA_MONEY 0.001
-score XM_RANDOM 2.497
+score XFER_LOTSA_MONEY 0.001 # force non-zero
+score XM_RANDOM 2.498
score XPRIO 0.001
score AC_FROM_MANY_DOTS 1.000
score AC_SPAMMY_URI_PATTERNS1 1.000
@@ -281,7 +281,6 @@ score GOOG_STO_HTML_PHISH_MANY 1.0
score GOOG_STO_IMG_NOHTML 1.000
score HAS_X_NO_RELAY 1.000
score HAS_X_OUTGOING_SPAM_STAT 1.000
-score HDRS_LCASE 0.100
score HEXHASH_WORD 1.000
score HK_CTE_RAW 1.000
score HK_LOTTO 1.000

Modified: spamassassin/trunk/rulesrc/scores/stats-set0
URL: http://svn.apache.org/viewvc/spamassassin/trunk/rulesrc/scores/stats-set0?rev=1915099&r1=1915098&r2=1915099&view=diff
==============================================================================
--- spamassassin/trunk/rulesrc/scores/stats-set0 (original)
+++ spamassassin/trunk/rulesrc/scores/stats-set0 Sat Jan 6 02:44:31 2024
@@ -1,40 +1,40 @@
##### WITH NEW RULES AND SCORES #####

# SUMMARY for threshold 5.0:
-# Correctly non-spam: 444002 62.012% (99.259% of non-spam corpus)
-# Correctly spam: 187985 26.255% (69.966% of spam corpus)
-# False positives: 3313 0.463% (0.741% of nonspam, 62714 weighted)
-# False negatives: 80696 11.270% (30.034% of spam, 144134 weighted)
-# Average score for spam: 6.9 nonspam: 0.6
-# Average for false-pos: 6.3 false-neg: 1.8
-# TOTAL: 715996 100.00%
+# Correctly non-spam: 442890 63.414% (99.185% of non-spam corpus)
+# Correctly spam: 173995 24.913% (69.078% of spam corpus)
+# False positives: 3639 0.521% (0.815% of nonspam, 63496 weighted)
+# False negatives: 77886 11.152% (30.922% of spam, 132919 weighted)
+# Average score for spam: 6.7 nonspam: 0.6
+# Average for false-pos: 6.2 false-neg: 1.7
+# TOTAL: 698410 100.00%

Reading scores from "tmprules"...
Reading per-message hit stat logs and scores...

# SUMMARY for threshold 5.0:
-# Correctly non-spam: 55392 99.31%
-# Correctly spam: 22070 65.71%
-# False positives: 385 0.69%
-# False negatives: 11517 34.29%
-# TCR(l=50): 1.091657 SpamRecall: 65.710% SpamPrec: 98.285%
+# Correctly non-spam: 55262 99.25%
+# Correctly spam: 20295 64.55%
+# False positives: 418 0.75%
+# False negatives: 11148 35.45%
+# TCR(l=50): 0.981122 SpamRecall: 64.545% SpamPrec: 97.982%

##### WITHOUT NEW RULES AND SCORES #####
Reading scores from "../rules-base"...
Reading per-message hit stat logs and scores...

# SUMMARY for threshold 5.0:
-# Correctly non-spam: 435489 97.36%
-# Correctly spam: 127405 47.42%
-# False positives: 11826 2.64%
-# False negatives: 141276 52.58%
-# TCR(l=50): 0.366762 SpamRecall: 47.419% SpamPrec: 91.506%
+# Correctly non-spam: 434897 97.40%
+# Correctly spam: 119828 47.57%
+# False positives: 11632 2.60%
+# False negatives: 132053 52.43%
+# TCR(l=50): 0.352946 SpamRecall: 47.573% SpamPrec: 91.152%
Reading scores from "../rules-base"...
Reading per-message hit stat logs and scores...

# SUMMARY for threshold 5.0:
-# Correctly non-spam: 54338 97.42%
-# Correctly spam: 15885 47.30%
-# False positives: 1439 2.58%
-# False negatives: 17702 52.70%
-# TCR(l=50): 0.374637 SpamRecall: 47.295% SpamPrec: 91.694%
+# Correctly non-spam: 54211 97.36%
+# Correctly spam: 14964 47.59%
+# False positives: 1469 2.64%
+# False negatives: 16479 52.41%
+# TCR(l=50): 0.349642 SpamRecall: 47.591% SpamPrec: 91.061%

Modified: spamassassin/trunk/rulesrc/scores/stats-set1
URL: http://svn.apache.org/viewvc/spamassassin/trunk/rulesrc/scores/stats-set1?rev=1915099&r1=1915098&r2=1915099&view=diff
==============================================================================
--- spamassassin/trunk/rulesrc/scores/stats-set1 (original)
+++ spamassassin/trunk/rulesrc/scores/stats-set1 Sat Jan 6 02:44:31 2024
@@ -1,12 +1,12 @@
##### WITH NEW RULES AND SCORES #####

# SUMMARY for threshold 5.0:
-# Correctly non-spam: 434897 80.801% (99.334% of non-spam corpus)
-# Correctly spam: 61612 11.447% (61.356% of spam corpus)
-# False positives: 2916 0.542% (0.666% of nonspam, 42941 weighted)
-# False negatives: 38806 7.210% (38.644% of spam, 63763 weighted)
+# Correctly non-spam: 434925 80.806% (99.340% of non-spam corpus)
+# Correctly spam: 61478 11.422% (61.222% of spam corpus)
+# False positives: 2888 0.537% (0.660% of nonspam, 42616 weighted)
+# False negatives: 38940 7.235% (38.778% of spam, 64474 weighted)
# Average score for spam: 7.0 nonspam: -1.6
-# Average for false-pos: 6.4 false-neg: 1.6
+# Average for false-pos: 6.4 false-neg: 1.7
# TOTAL: 538231 100.00%

Reading scores from "tmprules"...
@@ -14,10 +14,10 @@ Reading per-message hit stat logs and sc

# SUMMARY for threshold 5.0:
# Correctly non-spam: 54262 99.39%
-# Correctly spam: 7731 60.94%
+# Correctly spam: 7733 60.95%
# False positives: 331 0.61%
-# False negatives: 4956 39.06%
-# TCR(l=50): 0.589928 SpamRecall: 60.936% SpamPrec: 95.894%
+# False negatives: 4954 39.05%
+# TCR(l=50): 0.589983 SpamRecall: 60.952% SpamPrec: 95.895%

##### WITHOUT NEW RULES AND SCORES #####
Reading scores from "../rules-base"...
@@ -25,16 +25,16 @@ Reading per-message hit stat logs and sc

# SUMMARY for threshold 5.0:
# Correctly non-spam: 436003 99.59%
-# Correctly spam: 20756 20.67%
+# Correctly spam: 20766 20.68%
# False positives: 1810 0.41%
-# False negatives: 79662 79.33%
-# TCR(l=50): 0.590132 SpamRecall: 20.670% SpamPrec: 91.979%
+# False negatives: 79652 79.32%
+# TCR(l=50): 0.590166 SpamRecall: 20.680% SpamPrec: 91.983%
Reading scores from "../rules-base"...
Reading per-message hit stat logs and scores...

# SUMMARY for threshold 5.0:
# Correctly non-spam: 54399 99.64%
-# Correctly spam: 2577 20.31%
+# Correctly spam: 2593 20.44%
# False positives: 194 0.36%
-# False negatives: 10110 79.69%
-# TCR(l=50): 0.640434 SpamRecall: 20.312% SpamPrec: 92.999%
+# False negatives: 10094 79.56%
+# TCR(l=50): 0.640952 SpamRecall: 20.438% SpamPrec: 93.039%