Mailing List Archive

svn commit: r1914644 [2/2] - in /spamassassin/trunk/rulesrc/scores: 72_scores.cf scores-set0 scores-set1 scores-set2 scores-set3 stats-set0 stats-set1
Modified: spamassassin/trunk/rulesrc/scores/scores-set3
URL: http://svn.apache.org/viewvc/spamassassin/trunk/rulesrc/scores/scores-set3?rev=1914644&r1=1914643&r2=1914644&view=diff
==============================================================================
--- spamassassin/trunk/rulesrc/scores/scores-set3 (original)
+++ spamassassin/trunk/rulesrc/scores/scores-set3 Thu Dec 14 02:46:24 2023
@@ -1,208 +1,207 @@
# Using score set 1 logs for revision 1914480 from:
# ham-net-ena-week0.r1914480.log ham-net-ena-week1.r1914480.log ham-net-ena-week2.r1914480.log ham-net-ena-week3.r1914480.log ham-net-ena-week4.r1914480.log ham-net-giovanni-ham.r1914480.log ham-net-giovanni-spammy.r1914480.log ham-net-giovanni-spam.r1914480.log ham-net-grenier.r1914480.log ham-net-hege.r1914480.log ham-net-jhardin.r1914480.log ham-net-llanga.r1914480.log ham-net-mmiroslaw-mails-ham.r1914480.log ham-net-mmiroslaw-mails-spam.r1914480.log ham-net-spamsponge.r1914480.log ham-net-whyscream.r1914480.log spam-net-ena-week0.r1914480.log spam-net-ena-week1.r1914480.log spam-net-ena-week2.r1914480.log spam-net-ena-week3.r1914480.log spam-net-ena-week4.r1914480.log spam-net-giovanni-ham.r1914480.log spam-net-giovanni-spammy.r1914480.log spam-net-giovanni-spam.r1914480.log spam-net-grenier.r1914480.log spam-net-hege.r1914480.log spam-net-jhardin.r1914480.log spam-net-llanga.r1914480.log spam-net-mmiroslaw-mails-ham.r1914480.log spam-net-mmiroslaw-mails-spam.r1914480.log spam-net-spamsponge.r1914480.log spam-net-whyscream.r1914480.log

-score ACCT_PHISHING_MANY 2.999
+score ACCT_PHISHING_MANY 3.000
score AC_BR_BONANZA 0.001
score AC_DIV_BONANZA 0.001
score AC_FROM_MANY_DOTS 2.499
score AC_HTML_NONSENSE_TAGS 1.999
-score AC_POST_EXTRAS 0.313
+score AC_POST_EXTRAS 0.318
score ADMITS_SPAM 2.299
-score ADVANCE_FEE_2_NEW_MONEY 1.681
+score ADVANCE_FEE_2_NEW_MONEY 1.999
score ADVANCE_FEE_3_NEW 3.499
score ADVANCE_FEE_3_NEW_MONEY 0.001
score ADVANCE_FEE_4_NEW 2.199
-score ADVANCE_FEE_4_NEW_MONEY 0.439
+score ADVANCE_FEE_4_NEW_MONEY 0.377
score ADVANCE_FEE_5_NEW_FRM_MNY 0.001
-score ADVANCE_FEE_5_NEW_MONEY 2.612
-score AD_PREFS 0.444
+score ADVANCE_FEE_5_NEW_MONEY 1.332
+score AD_PREFS 0.066
score AXB_XMAILER_MIMEOLE_OL_024C2 0.001
-score BITCOIN_EXTORT_01 1.306
-score BITCOIN_MALF_HTML 0.001 # force non-zero
-score BITCOIN_ONAN 1.912
-score BITCOIN_PAY_ME 1.664
-score BITCOIN_SPAM_02 1.107
+score BITCOIN_EXTORT_01 0.725
+score BITCOIN_MALF_HTML 0.001
+score BITCOIN_ONAN 2.454
+score BITCOIN_PAY_ME 1.149
+score BITCOIN_SPAM_02 1.222
score BITCOIN_SPAM_05 0.001
-score BITCOIN_SPAM_07 0.001
-score BITCOIN_TOEQFM 3.149
+score BITCOIN_SPAM_07 0.369
+score BITCOIN_TOEQFM 3.163
score BITCOIN_VISTA 0.001
-score BITCOIN_XPRIO 0.955
-score BITCOIN_YOUR_INFO 3.000
-score BODY_SINGLE_URI 0.001
+score BITCOIN_XPRIO 1.124
+score BITCOIN_YOUR_INFO 2.999
+score BODY_SINGLE_URI 0.001 # force non-zero
score BODY_SINGLE_WORD 0.001
-score BODY_URI_ONLY 2.269
-score CK_HELO_GENERIC 0.250
+score BODY_URI_ONLY 2.268
+score CK_HELO_GENERIC 0.249
score CTE_8BIT_MISMATCH 0.001
-score DEAR_BENEFICIARY 0.656
+score DEAR_BENEFICIARY 0.602
score DKIMWL_WL_HIGH -0.001
score DKIMWL_WL_MED -0.001 # force non-zero
score DKIMWL_WL_MEDHI -0.001
-score DYNAMIC_IMGUR 2.623
+score DYNAMIC_IMGUR 3.249
score END_FUTURE_EMAILS 2.499
-score FILL_THIS_FORM 0.499
+score FILL_THIS_FORM 0.600
score FONT_INVIS_DIRECT 0.001
score FONT_INVIS_LONG_LINE 3.000
-score FONT_INVIS_MSGID 1.976
-score FONT_INVIS_NORDNS 0.567
+score FONT_INVIS_MSGID 1.905
+score FONT_INVIS_NORDNS 1.292
score FONT_INVIS_POSTEXTRAS 3.499
score FORGED_SPF_HELO 2.799
-score FORM_FRAUD_5 2.671
-score FREEMAIL_FORGED_FROMDOMAIN 0.250
+score FORM_FRAUD_5 2.647
+score FREEMAIL_FORGED_FROMDOMAIN 0.249
score FROM_ADDR_WS 2.999
score FROM_FMBLA_NEWDOM28 0.799
-score FROM_GOV_DKIM_AU -0.141
-score FROM_IN_TO_AND_SUBJ 1.190
+score FROM_GOV_DKIM_AU -0.392
+score FROM_IN_TO_AND_SUBJ 1.191
score FROM_MISSPACED 1.999
score FROM_MISSP_DYNIP 0.001
-score FROM_MISSP_EH_MATCH 1.299
-score FROM_MISSP_FREEMAIL 1.956
-score FROM_MISSP_MSFT 1.648
-score FROM_MISSP_REPLYTO 1.885
-score FROM_MISSP_SPF_FAIL 0.922
-score FROM_MISSP_TO_UNDISC 3.343
-score FROM_MISSP_USER 0.001 # force non-zero
+score FROM_MISSP_EH_MATCH 1.300
+score FROM_MISSP_FREEMAIL 1.952
+score FROM_MISSP_MSFT 1.349
+score FROM_MISSP_REPLYTO 1.882
+score FROM_MISSP_SPF_FAIL 1.034
+score FROM_MISSP_TO_UNDISC 3.324
+score FROM_MISSP_USER 0.001
score FROM_MISSP_XPRIO 2.499
-score FROM_PAYPAL_SPOOF 1.599
+score FROM_PAYPAL_SPOOF 0.531
score FROM_SUSPICIOUS_NTLD 0.500
score FROM_SUSPICIOUS_NTLD_FP 1.999
-score FROM_UNBAL1 2.299
+score FROM_UNBAL1 2.200
score FROM_WSP_TRAIL 2.399
-score FSL_BULK_SIG 2.081
-score FSL_CTYPE_WIN1251 0.438
+score FSL_BULK_SIG 2.074
+score FSL_CTYPE_WIN1251 0.428
score FSL_HAS_TINYURL 2.299
score FSL_NEW_HELO_USER 0.001
score FUZZY_AMAZON 2.499
-score FUZZY_BITCOIN 1.036
+score FUZZY_BITCOIN 1.180
score FUZZY_WALLET 1.899
score GB_BITCOIN_CP 0.001
score GB_CUSTOM_HTM_URI 1.499
-score GB_FAKE_RF_SHORT 1.130
+score GB_FAKE_RF_SHORT 1.127
score GB_FREEMAIL_DISPTO 0.001
-score GB_HASHBL_BTC 0.570
+score GB_HASHBL_BTC 1.038
score GOOG_REDIR_NORDNS 0.001
score GOOG_STO_IMG_HTML 2.999
score GOOG_STO_NOIMG_HTML 2.999
score HAS_X_OUTGOING_SPAM_STAT 0.001
-score HDRS_LCASE_IMGONLY 0.100
+score HDRS_LCASE_IMGONLY 0.099
score HDRS_MISSP 2.499
score HDR_ORDER_FTSDMCXX_DIRECT 0.001
score HDR_ORDER_FTSDMCXX_NORDNS 0.001
-score HEADER_FROM_DIFFERENT_DOMAINS 0.250
-score HELO_MISC_IP 0.249
+score HEADER_FROM_DIFFERENT_DOMAINS 0.249
+score HELO_MISC_IP 0.250
score HELO_NO_DOMAIN 0.001
score HK_NAME_FM_MR_MRS 1.499
-score HK_NAME_MR_MRS 1.000
+score HK_NAME_MR_MRS 0.999
score HK_RANDOM_ENVFROM 0.999
-score HK_RANDOM_FROM 1.000
+score HK_RANDOM_FROM 0.999
score HK_RANDOM_REPLYTO 0.999
score HK_SCAM 1.999
score HOSTED_IMG_DIRECT_MX 3.499
-score HOSTED_IMG_FREEM 3.004
+score HOSTED_IMG_FREEM 3.016
score HOSTED_IMG_MULTI_PUB_01 2.999
-score HTML_BADATTR 0.858
+score HTML_BADATTR 1.000
score HTML_ENTITY_ASCII_TINY 2.999
score HTML_FONT_TINY_NORDNS 0.001
score HTML_SINGLET_MANY 2.499
-score HTML_TEXT_INVISIBLE_FONT 1.677
-score HTML_TEXT_INVISIBLE_STYLE 2.425
+score HTML_TEXT_INVISIBLE_FONT 1.747
+score HTML_TEXT_INVISIBLE_STYLE 2.533
score JH_SPAMMY_HEADERS 3.499
score KHOP_HELO_FCRDNS 0.260
score LONG_HEX_URI 2.999
-score LONG_IMG_URI 2.936
-score LONG_INVISIBLE_TEXT 2.696
+score LONG_IMG_URI 2.941
+score LONG_INVISIBLE_TEXT 2.699
score LOTS_OF_MONEY 0.010
score LOTTO_DEPT 1.999
score MALFORMED_FREEMAIL 2.699
-score MALWARE_NORDNS 0.892
-score MILLION_HUNDRED 0.439
+score MALWARE_NORDNS 0.985
+score MANY_SUBDOM 2.200
+score MILLION_HUNDRED 0.397
score MILLION_USD 1.999
score MIMEOLE_DIRECT_TO_MX 0.001
-score MIME_NO_TEXT 1.999
+score MIME_NO_TEXT 0.602
score MIXED_ES 2.099
score MIXED_HREF_CASE 1.999
-score MONEY_ATM_CARD 0.758
-score MONEY_FORM 0.001 # force non-zero
-score MONEY_FORM_SHORT 1.993
-score MONEY_FRAUD_3 0.001 # force non-zero
-score MONEY_FRAUD_5 1.498
-score MONEY_FRAUD_8 1.522
-score MONEY_FREEMAIL_REPTO 1.321
+score MONEY_ATM_CARD 1.000
+score MONEY_FORM 0.001
+score MONEY_FORM_SHORT 1.893
+score MONEY_FRAUD_3 0.001
+score MONEY_FRAUD_5 1.449
+score MONEY_FRAUD_8 2.233
+score MONEY_FREEMAIL_REPTO 1.316
score MONEY_FROM_MISSP 0.001
-score MONEY_NOHTML 1.209
+score MONEY_NOHTML 1.263
score NA_DOLLARS 1.499
-score NICE_REPLY_A -0.702
-score NORDNS_LOW_CONTRAST 0.001
+score NICE_REPLY_A -2.012
+score NORDNS_LOW_CONTRAST 0.001 # force non-zero
score NO_FM_NAME_IP_HOSTN 0.001
score NSL_RCVD_FROM_USER 0.001
score NSL_RCVD_HELO_USER 0.001
-score OBFU_BITCOIN 1.103
+score OBFU_BITCOIN 0.778
score OBFU_TEXT_ATTACH 1.599
-score ODD_FREEM_REPTO 2.592
+score ODD_FREEM_REPTO 2.597
score PDS_BAD_THREAD_QP_64 0.999
score PDS_BTC_ID 0.499
-score PDS_BTC_MSGID 0.001
+score PDS_BTC_MSGID 0.001 # force non-zero
score PDS_EMPTYSUBJ_URISHRT 1.499
score PDS_FRNOM_TODOM_DBL_URL 0.001
score PDS_FRNOM_TODOM_NAKED_TO 1.499
-score PDS_FROM_2_EMAILS 2.300
score PDS_FROM_NAME_TO_DOMAIN 1.999
score PDS_HELO_SPF_FAIL 1.999
score PDS_HP_HELO_NORDNS 0.001
score PDS_NAKED_TO_NUMERO 1.999
score PDS_OTHER_BAD_TLD 1.999
score PDS_TINYSUBJ_URISHRT 1.499
-score PHP_SCRIPT 2.499
+score PHP_SCRIPT 2.500
score PP_MIME_FAKE_ASCII_TEXT 0.001
score RAND_MKTG_HEADER 1.999
score RATWARE_NO_RDNS 0.001
-score RCVD_IN_MSPIKE_H2 -0.001 # force non-zero
+score RCVD_IN_MSPIKE_H2 -0.001
score SCC_BODY_SINGLE_WORD 0.001
-score SCC_CANSPAM_2 0.696
+score SCC_CANSPAM_2 1.188
score SCC_ISEMM_LID_1B 1.499
-score SENDGRID_REDIR 0.590
+score SENDGRID_REDIR 0.600
score SHOPIFY_IMG_NOT_RCVD_SFY 2.499
score SHORTENED_URL_SRC 2.399
score SHORT_SHORTNER 1.999
score SPOOFED_FREEMAIL 0.001
-score SPOOFED_FREEMAIL_NO_RDNS 0.001
-score SPOOFED_FREEM_REPTO 1.939
-score STATIC_XPRIO_OLE 0.764
-score STOX_BOUND_090909_B 0.001
+score SPOOFED_FREEMAIL_NO_RDNS 0.001 # force non-zero
+score SPOOFED_FREEM_REPTO 1.893
+score STATIC_XPRIO_OLE 0.768
score SUBJ_ATTENTION 0.499
score THIS_AD 0.700
score TONOM_EQ_TOLOC_SHRT_SHRTNER 1.499
score TO_EQ_FM_DIRECT_MX 2.499
-score TO_EQ_FM_DOM_SPF_FAIL 0.054
-score TO_EQ_FM_SPF_FAIL 1.321
+score TO_EQ_FM_DOM_SPF_FAIL 0.478
+score TO_EQ_FM_SPF_FAIL 0.899
score TO_IN_SUBJ 0.099
-score TO_NO_BRKTS_FROM_MSSP 2.500
+score TO_NO_BRKTS_FROM_MSSP 2.499
score TO_NO_BRKTS_HTML_IMG 1.999
score TO_NO_BRKTS_HTML_ONLY 1.999
-score TO_NO_BRKTS_MSFT 2.481
+score TO_NO_BRKTS_MSFT 2.479
score TO_NO_BRKTS_NORDNS_HTML 1.999
-score TO_NO_BRKTS_PCNT 2.215
+score TO_NO_BRKTS_PCNT 2.329
score TVD_SPACE_RATIO_MINFP 0.001 # force non-zero
score UNDISC_FREEM 2.599
-score UNDISC_MONEY 2.799
+score UNDISC_MONEY 2.899
score UNICODE_OBFU_ZW_MANY 2.999
-score URI_DOTEDU 1.999
+score URI_DOTEDU 1.040
score URI_GOOGLE_PROXY 1.699
score URI_IN_URI_5 3.199
score URI_PHISH 3.999
-score URI_PHP_REDIR 2.419
+score URI_PHP_REDIR 2.488
score URI_TRY_3LD 1.999
-score URI_WP_HACKED_2 2.499
+score URI_WP_HACKED_2 2.500
score VFY_ACCT_NORDNS 2.999
score VISTA_COST 2.499
score VISTA_TONOM_EQ_TOLOC 2.499
score WIKI_IMG 1.999
-score WORD_INVIS 1.898
+score WORD_INVIS 1.897
score WORD_INVIS_MANY 2.999
score XFER_LOTSA_MONEY 0.001
-score XM_DIGITS_ONLY 2.407
+score XM_DIGITS_ONLY 2.229
score XM_RANDOM 2.499
score XM_UC_ONLY 2.499
-score XPRIO 0.138
+score XPRIO 0.084
score AC_SPAMMY_URI_PATTERNS1 1.000
score AC_SPAMMY_URI_PATTERNS10 1.000
score AC_SPAMMY_URI_PATTERNS11 1.000

Modified: spamassassin/trunk/rulesrc/scores/stats-set0
URL: http://svn.apache.org/viewvc/spamassassin/trunk/rulesrc/scores/stats-set0?rev=1914644&r1=1914643&r2=1914644&view=diff
==============================================================================
--- spamassassin/trunk/rulesrc/scores/stats-set0 (original)
+++ spamassassin/trunk/rulesrc/scores/stats-set0 Thu Dec 14 02:46:24 2023
@@ -1,40 +1,40 @@
##### WITH NEW RULES AND SCORES #####

# SUMMARY for threshold 5.0:
-# Correctly non-spam: 454891 62.796% (99.153% of non-spam corpus)
-# Correctly spam: 165147 22.798% (62.175% of spam corpus)
-# False positives: 3884 0.536% (0.847% of nonspam, 73576 weighted)
-# False negatives: 100471 13.870% (37.825% of spam, 203450 weighted)
-# Average score for spam: 6.5 nonspam: 0.7
-# Average for false-pos: 6.5 false-neg: 2.0
-# TOTAL: 724393 100.00%
+# Correctly non-spam: 455062 62.774% (99.188% of non-spam corpus)
+# Correctly spam: 163975 22.620% (61.615% of spam corpus)
+# False positives: 3726 0.514% (0.812% of nonspam, 71550 weighted)
+# False negatives: 102153 14.092% (38.385% of spam, 210470 weighted)
+# Average score for spam: 6.5 nonspam: 0.6
+# Average for false-pos: 6.6 false-neg: 2.1
+# TOTAL: 724916 100.00%

Reading scores from "tmprules"...
Reading per-message hit stat logs and scores...

# SUMMARY for threshold 5.0:
-# Correctly non-spam: 56747 99.19%
-# Correctly spam: 20323 61.16%
-# False positives: 466 0.81%
-# False negatives: 12907 38.84%
-# TCR(l=50): 0.917778 SpamRecall: 61.159% SpamPrec: 97.758%
+# Correctly non-spam: 56727 99.15%
+# Correctly spam: 20350 61.13%
+# False positives: 488 0.85%
+# False negatives: 12939 38.87%
+# TCR(l=50): 0.891534 SpamRecall: 61.131% SpamPrec: 97.658%

##### WITHOUT NEW RULES AND SCORES #####
Reading scores from "../rules-base"...
Reading per-message hit stat logs and scores...

# SUMMARY for threshold 5.0:
-# Correctly non-spam: 446456 97.32%
-# Correctly spam: 108948 41.02%
-# False positives: 12318 2.68%
-# False negatives: 156670 58.98%
-# TCR(l=50): 0.343811 SpamRecall: 41.017% SpamPrec: 89.842%
+# Correctly non-spam: 446241 97.27%
+# Correctly spam: 108793 40.88%
+# False positives: 12547 2.73%
+# False negatives: 157335 59.12%
+# TCR(l=50): 0.339153 SpamRecall: 40.880% SpamPrec: 89.660%
Reading scores from "../rules-base"...
Reading per-message hit stat logs and scores...

# SUMMARY for threshold 5.0:
-# Correctly non-spam: 55624 97.22%
-# Correctly spam: 13610 40.96%
-# False positives: 1589 2.78%
-# False negatives: 19620 59.04%
-# TCR(l=50): 0.335419 SpamRecall: 40.957% SpamPrec: 89.545%
+# Correctly non-spam: 55533 97.06%
+# Correctly spam: 13537 40.67%
+# False positives: 1682 2.94%
+# False negatives: 19752 59.33%
+# TCR(l=50): 0.320543 SpamRecall: 40.665% SpamPrec: 88.948%

Modified: spamassassin/trunk/rulesrc/scores/stats-set1
URL: http://svn.apache.org/viewvc/spamassassin/trunk/rulesrc/scores/stats-set1?rev=1914644&r1=1914643&r2=1914644&view=diff
==============================================================================
--- spamassassin/trunk/rulesrc/scores/stats-set1 (original)
+++ spamassassin/trunk/rulesrc/scores/stats-set1 Thu Dec 14 02:46:24 2023
@@ -1,10 +1,10 @@
##### WITH NEW RULES AND SCORES #####

# SUMMARY for threshold 5.0:
-# Correctly non-spam: 430772 85.340% (99.397% of non-spam corpus)
-# Correctly spam: 26817 5.313% (37.568% of spam corpus)
-# False positives: 2615 0.518% (0.603% of nonspam, 30304 weighted)
-# False negatives: 44566 8.829% (62.432% of spam, 67994 weighted)
+# Correctly non-spam: 430764 85.339% (99.395% of non-spam corpus)
+# Correctly spam: 26806 5.311% (37.552% of spam corpus)
+# False positives: 2623 0.520% (0.605% of nonspam, 30355 weighted)
+# False negatives: 44577 8.831% (62.448% of spam, 67988 weighted)
# Average score for spam: 5.5 nonspam: -0.9
# Average for false-pos: 7.0 false-neg: 1.5
# TOTAL: 504770 100.00%
@@ -13,11 +13,11 @@ Reading scores from "tmprules"...
Reading per-message hit stat logs and scores...

# SUMMARY for threshold 5.0:
-# Correctly non-spam: 53676 99.38%
-# Correctly spam: 3410 37.90%
-# False positives: 333 0.62%
-# False negatives: 5588 62.10%
-# TCR(l=50): 0.404623 SpamRecall: 37.897% SpamPrec: 91.103%
+# Correctly non-spam: 53681 99.39%
+# Correctly spam: 3406 37.85%
+# False positives: 328 0.61%
+# False negatives: 5592 62.15%
+# TCR(l=50): 0.409149 SpamRecall: 37.853% SpamPrec: 91.216%

##### WITHOUT NEW RULES AND SCORES #####
Reading scores from "../rules-base"...
@@ -25,16 +25,16 @@ Reading per-message hit stat logs and sc

# SUMMARY for threshold 5.0:
# Correctly non-spam: 431752 99.62%
-# Correctly spam: 13735 19.24%
+# Correctly spam: 13717 19.22%
# False positives: 1635 0.38%
-# False negatives: 57648 80.76%
-# TCR(l=50): 0.512081 SpamRecall: 19.241% SpamPrec: 89.362%
+# False negatives: 57666 80.78%
+# TCR(l=50): 0.512014 SpamRecall: 19.216% SpamPrec: 89.350%
Reading scores from "../rules-base"...
Reading per-message hit stat logs and scores...

# SUMMARY for threshold 5.0:
# Correctly non-spam: 53807 99.63%
-# Correctly spam: 1748 19.43%
+# Correctly spam: 1750 19.45%
# False positives: 202 0.37%
-# False negatives: 7250 80.57%
-# TCR(l=50): 0.518617 SpamRecall: 19.427% SpamPrec: 89.641%
+# False negatives: 7248 80.55%
+# TCR(l=50): 0.518677 SpamRecall: 19.449% SpamPrec: 89.652%