Mailing List Archive

svn commit: r1877462 [2/2] - in /spamassassin/trunk/rulesrc/scores: 72_scores.cf scores-set0 scores-set1 scores-set2 scores-set3 stats-set0 stats-set1
Modified: spamassassin/trunk/rulesrc/scores/scores-set3
URL: http://svn.apache.org/viewvc/spamassassin/trunk/rulesrc/scores/scores-set3?rev=1877462&r1=1877461&r2=1877462&view=diff
==============================================================================
--- spamassassin/trunk/rulesrc/scores/scores-set3 (original)
+++ spamassassin/trunk/rulesrc/scores/scores-set3 Thu May 7 06:18:20 2020
@@ -4,194 +4,190 @@
score AC_BR_BONANZA 0.001
score AC_DIV_BONANZA 0.001
score AC_FROM_MANY_DOTS 0.001
-score ADMITS_SPAM 1.493
score ADVANCE_FEE_2_NEW_MONEY 1.999
-score ADVANCE_FEE_3_NEW 3.468
-score ADVANCE_FEE_3_NEW_MONEY 2.212
+score ADVANCE_FEE_3_NEW 3.467
+score ADVANCE_FEE_3_NEW_MONEY 2.177
score ADVANCE_FEE_4_NEW_MONEY 0.001
-score ADVANCE_FEE_5_NEW 2.603
-score AD_PREFS 0.274
+score ADVANCE_FEE_5_NEW 2.899
+score AD_PREFS 0.107
score AXB_XMAILER_MIMEOLE_OL_024C2 0.001
-score BITCOIN_EXTORT_01 2.499
-score BITCOIN_SPAM_01 1.144
-score BITCOIN_SPAM_02 2.056
+score BITCOIN_EXTORT_01 3.064
+score BITCOIN_SPAM_01 1.009
+score BITCOIN_SPAM_02 2.483
score BITCOIN_SPAM_03 2.499
-score BITCOIN_SPAM_05 1.681
-score BITCOIN_SPAM_07 3.500
+score BITCOIN_SPAM_05 2.020
+score BITCOIN_SPAM_07 3.499
score BITCOIN_SPAM_09 0.001
-score BODY_SINGLE_URI 0.001
+score BODY_SINGLE_URI 0.581
score BODY_SINGLE_WORD 0.001
-score BODY_URI_ONLY 1.000
-score CK_HELO_DYNAMIC_SPLIT_IP 1.500
-score CK_HELO_GENERIC 0.250
+score BODY_URI_ONLY 0.999
+score CK_HELO_DYNAMIC_SPLIT_IP 1.499
+score CK_HELO_GENERIC 0.249
score CTE_8BIT_MISMATCH 0.999
-score CTYPE_NULL 2.598
+score CTYPE_NULL 2.597
score DEAR_BENEFICIARY 0.001
-score DKIMWL_BL 2.512
+score DKIMWL_BL 2.518
score DKIMWL_WL_HIGH -0.001
score DKIMWL_WL_MED -0.001
-score DKIMWL_WL_MEDHI -0.001 # force non-zero
+score DKIMWL_WL_MEDHI -0.001
score DX_TEXT_03 0.899
score END_FUTURE_EMAILS 2.499
score FILL_THIS_FORM 0.001
-score FORGED_RELAY_MUA_TO_MX 3.500
-score FORGED_SPF_HELO 1.757
-score FORM_FRAUD_5 0.001
+score FORGED_RELAY_MUA_TO_MX 3.519
+score FORGED_SPF_HELO 1.867
+score FORM_FRAUD_5 0.001 # force non-zero
score FREEMAIL_FORGED_FROMDOMAIN 0.250
score FROM_2_EMAILS_SHORT 0.001
-score FROM_ADDR_WS 2.999
-score FROM_FMBLA_NEWDOM 1.500
+score FROM_ADDR_WS 3.000
+score FROM_FMBLA_NEWDOM 1.499
score FROM_FMBLA_NEWDOM14 0.999
score FROM_FMBLA_NEWDOM28 0.799
score FROM_GOV_DKIM_AU -0.001
-score FROM_GOV_SPOOF 0.568
+score FROM_GOV_SPOOF 0.569
score FROM_MISSPACED 0.001
score FROM_MISSP_DYNIP 3.699
score FROM_MISSP_EH_MATCH 0.001
score FROM_MISSP_FREEMAIL 0.001
score FROM_MISSP_MSFT 0.001
-score FROM_MISSP_PHISH 1.245
-score FROM_MISSP_REPLYTO 2.295
+score FROM_MISSP_PHISH 1.243
+score FROM_MISSP_REPLYTO 2.394
score FROM_MISSP_SPF_FAIL 0.001
-score FROM_MISSP_TO_UNDISC 2.620
score FROM_MISSP_USER 0.001
score FROM_MISSP_XPRIO 0.001
-score FROM_NTLD_REPLY_FREEMAIL 0.001 # force non-zero
+score FROM_NTLD_REPLY_FREEMAIL 0.001
score FROM_PAYPAL_SPOOF 0.001
score FROM_SUSPICIOUS_NTLD 0.499
score FROM_SUSPICIOUS_NTLD_FP 0.001
-score FSL_BULK_SIG 0.001
+score FSL_BULK_SIG 0.001 # force non-zero
score FSL_CTYPE_WIN1251 0.001
score FSL_NEW_HELO_USER 0.001
score FUZZY_BITCOIN 0.001
-score FUZZY_SECURITY 1.089
+score FUZZY_SECURITY 1.060
score FUZZY_WALLET 0.001
score GB_BITCOIN_CP 2.999
score GB_BITCOIN_NH 0.001
-score GB_FREEMAIL_DISPTO 0.499
-score GB_GOOGLE_OBFUS 0.749
+score GB_FREEMAIL_DISPTO 0.500
+score GB_GOOGLE_OBFUS 0.455
score HDRS_LCASE 0.100
-score HDRS_LCASE_IMGONLY 0.099
-score HDR_ORDER_FTSDMCXX_DIRECT 0.001 # force non-zero
-score HDR_ORDER_FTSDMCXX_NORDNS 0.657
+score HDRS_LCASE_IMGONLY 0.100
+score HDR_ORDER_FTSDMCXX_DIRECT 0.001
+score HDR_ORDER_FTSDMCXX_NORDNS 1.145
score HEADER_FROM_DIFFERENT_DOMAINS 0.250
-score HELO_MISC_IP 0.001 # force non-zero
+score HELO_MISC_IP 0.001
score HELO_NO_DOMAIN 0.001
score HEXHASH_WORD 2.999
-score HK_NAME_FROM 0.999
score HK_NAME_MR_MRS 0.999
score HK_RANDOM_FROM 0.999
score HK_RANDOM_REPLYTO 0.999
-score HK_RCVD_IP_MULTICAST 0.421
-score HK_SCAM 1.254
-score HOSTED_IMG_DIRECT_MX 2.024
+score HK_RCVD_IP_MULTICAST 0.105
+score HK_SCAM 1.433
+score HOSTED_IMG_DIRECT_MX 2.753
score HTML_OFF_PAGE 0.001
-score HTML_SINGLET_MANY 1.636
-score HTML_TEXT_INVISIBLE_STYLE 1.719
+score HTML_SINGLET_MANY 1.554
+score HTML_TEXT_INVISIBLE_STYLE 1.644
score IMG_ONLY_FM_DOM_INFO 2.499
-score KB_FORGED_MOZ4 4.164
-score KHOP_FAKE_EBAY 0.483
-score KHOP_HELO_FCRDNS 0.276
+score KB_FORGED_MOZ4 4.299
+score KHOP_FAKE_EBAY 0.476
+score KHOP_HELO_FCRDNS 0.275
score LIST_PARTIAL_SHORT_MSG 2.499
-score LIST_PRTL_SAME_USER 0.543
+score LIST_PRTL_SAME_USER 0.735
score LONG_HEX_URI 1.617
-score LONG_IMG_URI 0.001
+score LONG_IMG_URI 0.001 # force non-zero
score LOTS_OF_MONEY 0.010
score MALF_HTML_B64 3.499
-score MANY_SPAN_IN_TEXT 3.629
+score MANY_SPAN_IN_TEXT 3.699
score MAY_BE_FORGED 0.001
-score MILLION_HUNDRED 0.936
+score MILLION_HUNDRED 0.802
score MIMEOLE_DIRECT_TO_MX 0.001
score MIME_NO_TEXT 1.999
-score MONEY_FORM_SHORT 0.001 # force non-zero
-score MONEY_FRAUD_3 1.039
-score MONEY_FRAUD_5 0.836
-score MONEY_FRAUD_8 0.001 # force non-zero
+score MONEY_FORM_SHORT 0.001
+score MONEY_FRAUD_3 1.032
+score MONEY_FRAUD_5 1.002
+score MONEY_FRAUD_8 0.001
score MONEY_FROM_41 1.999
score MONEY_FROM_MISSP 1.999
-score MSM_PRIO_REPTO 2.409
-score NORDNS_LOW_CONTRAST 1.994
-score NO_FM_NAME_IP_HOSTN 1.689
-score NSL_RCVD_FROM_USER 0.001 # force non-zero
-score NSL_RCVD_HELO_USER 2.299
-score NUMBERONLY_BITCOIN_EXP 0.398
-score OBFU_BITCOIN 1.999
-score PDS_BTC_ID 0.500
-score PDS_BTC_MSGID 0.999
+score MSM_PRIO_REPTO 2.176
+score NORDNS_LOW_CONTRAST 2.069
+score NO_FM_NAME_IP_HOSTN 1.246
+score NSL_RCVD_FROM_USER 0.001
+score NSL_RCVD_HELO_USER 2.361
+score NUMBERONLY_BITCOIN_EXP 1.999
+score OBFU_BITCOIN 1.434
+score PDS_BTC_ID 0.499
+score PDS_BTC_MSGID 1.000
score PDS_EMPTYSUBJ_URISHRT 0.001
score PDS_FREEMAIL_REPLYTO_URISHRT 0.001
-score PDS_FRNOM_TODOM_NAKED_TO 1.499
-score PDS_FROM_2_EMAILS 1.599
+score PDS_FRNOM_TODOM_NAKED_TO 1.500
+score PDS_FROM_2_EMAILS 0.921
score PDS_FROM_NAME_TO_DOMAIN 1.000
score PDS_HELO_SPF_FAIL 1.999
score PDS_HP_HELO_NORDNS 0.001
-score PDS_NAKED_TO_NUMERO 1.075
+score PDS_NAKED_TO_NUMERO 1.524
score PDS_NO_FULL_NAME_SPOOFED_URL 0.749
score PDS_OTHER_BAD_TLD 1.999
-score PDS_SHORTFWD_URISHRT 1.499
-score PDS_SHORT_SPOOFED_URL 2.000
-score PDS_TINYSUBJ_URISHRT 0.469
-score PDS_TONAME_EQ_TOLOCAL_FREEM_FORGE 1.391
+score PDS_SHORTFWD_URISHRT 0.785
+score PDS_SHORT_SPOOFED_URL 1.999
+score PDS_TINYSUBJ_URISHRT 0.001
+score PDS_TONAME_EQ_TOLOCAL_FREEM_FORGE 0.812
score PDS_TONAME_EQ_TOLOCAL_HDRS_LCASE 1.999
score PDS_TONAME_EQ_TOLOCAL_SHORT 1.999
score PDS_TONAME_EQ_TOLOCAL_VSHORT 0.999
score PDS_TO_EQ_FROM_NAME 0.001
score PHP_ORIG_SCRIPT 2.499
-score PP_MIME_FAKE_ASCII_TEXT 1.000
+score PP_MIME_FAKE_ASCII_TEXT 0.722
score RATWARE_NO_RDNS 0.001
score RCVD_IN_MSPIKE_H2 -0.001
-score RDNS_NUM_TLD_ATCHNX 0.474
-score RDNS_NUM_TLD_XM 0.362
-score RISK_FREE 1.606
-score SCRIPT_GIBBERISH 1.686
-score SERGIO_SUBJECT_PORN014 4.199
-score SERGIO_SUBJECT_VIAGRA01 0.001
-score SHOPIFY_IMG_NOT_RCVD_SFY 2.499
-score SHORTENER_SHORT_IMG 0.001
-score SHORT_IMG_SUSP_NTLD 0.860
-score SHORT_SHORTNER 1.999
+score RDNS_NUM_TLD_ATCHNX 0.088
+score RDNS_NUM_TLD_XM 2.999
+score RISK_FREE 3.099
+score SCRIPT_GIBBERISH 1.682
+score SERGIO_SUBJECT_PORN014 1.505
+score SERGIO_SUBJECT_VIAGRA01 0.001 # force non-zero
+score SHOPIFY_IMG_NOT_RCVD_SFY 2.500
+score SHORTENER_SHORT_IMG 1.360
+score SHORT_IMG_SUSP_NTLD 1.200
+score SHORT_SHORTNER 1.973
score SINGLETS_LOW_CONTRAST 0.001
score SPOOFED_FREEMAIL 1.999
score SPOOFED_FREEMAIL_NO_RDNS 0.001
-score SPOOFED_FREEM_REPTO 0.718
+score SPOOFED_FREEM_REPTO 0.703
score STATIC_XPRIO_OLE 0.001
score STOCK_LOW_CONTRAST 2.499
-score STOX_BOUND_090909_B 2.443
+score STOX_BOUND_090909_B 2.017
score SUBJ_OBFU_PUNCT_FEW 0.749
score SUBJ_OBFU_PUNCT_MANY 1.546
-score THIS_AD 0.197
-score THIS_IS_ADV_SUSP_NTLD 1.493
-score TONOM_EQ_TOLOC_SHRT_PSHRTNER 0.001
-score TONOM_EQ_TOLOC_SHRT_SHRTNER 0.001
-score TO_EQ_FM_DIRECT_MX 2.500
-score TO_EQ_FM_DOM_HTML_IMG 0.274
-score TO_EQ_FM_DOM_HTML_ONLY 1.594
-score TO_EQ_FM_DOM_SPF_FAIL 0.001
-score TO_EQ_FM_HTML_ONLY 1.299
-score TO_EQ_FM_SPF_FAIL 1.161
-score TO_IN_SUBJ 0.100
-score TO_NAME_SUBJ_NO_RDNS 2.262
-score TO_NO_BRKTS_FROM_MSSP 2.500
-score TO_NO_BRKTS_HTML_IMG 1.338
+score THIS_AD 0.195
+score THIS_IS_ADV_SUSP_NTLD 1.499
+score TONOM_EQ_TOLOC_SHRT_PSHRTNER 0.266
+score TONOM_EQ_TOLOC_SHRT_SHRTNER 0.791
+score TO_EQ_FM_DIRECT_MX 1.430
+score TO_EQ_FM_DOM_HTML_IMG 0.001 # force non-zero
+score TO_EQ_FM_DOM_HTML_ONLY 1.021
+score TO_EQ_FM_DOM_SPF_FAIL 0.823
+score TO_EQ_FM_HTML_ONLY 0.001
+score TO_EQ_FM_SPF_FAIL 0.719
+score TO_IN_SUBJ 0.099
+score TO_NAME_SUBJ_NO_RDNS 2.259
+score TO_NO_BRKTS_FROM_MSSP 2.499
+score TO_NO_BRKTS_HTML_IMG 1.994
score TO_NO_BRKTS_HTML_ONLY 1.999
-score TO_NO_BRKTS_MSFT 1.498
-score TO_NO_BRKTS_NORDNS_HTML 1.422
-score TO_NO_BRKTS_PCNT 2.375
+score TO_NO_BRKTS_MSFT 1.499
+score TO_NO_BRKTS_NORDNS_HTML 1.607
+score TO_NO_BRKTS_PCNT 2.365
score TVD_SPACE_ENCODED 0.001
score TVD_SPACE_RATIO_MINFP 2.499
score UNICODE_OBFU_ASC 2.499
-score UPGRADE_MAILBOX 1.528
-score UPPERCASE_URI 1.208
-score URI_GOOGLE_PROXY 2.499
+score UPGRADE_MAILBOX 1.457
+score URI_GOOGLE_PROXY 2.399
score URI_IMG_WP_REDIR 2.999
score URI_ONLY_MSGID_MALF 1.999
-score URI_PHISH 2.600
+score URI_PHISH 2.599
score URI_PHP_REDIR 3.499
-score URI_TRY_3LD 1.999
-score URI_WPADMIN 2.699
+score URI_TRY_3LD 2.000
+score URI_WPADMIN 2.700
score URI_WP_DIRINDEX 3.499
-score URI_WP_HACKED 2.300
-score URI_WP_HACKED_2 2.500
+score URI_WP_HACKED 3.499
+score URI_WP_HACKED_2 2.499
score XPRIO_SHORT_SUBJ 2.499
score XPRIO_URL_SHORTNER 0.999
score AC_HTML_NONSENSE_TAGS 1.000
@@ -279,7 +275,6 @@ score MANY_HDRS_LCASE 0.1
score MONERO_EXTORT_01 1.000
score NEWEGG_IMG_NOT_RCVD_NEGG 1.000
score OFFER_ONLY_AMERICA 1.000
-score PDS_DBL_URL_TNB_RUNON 1.000
score PHOTO_EDITING_DIRECT 1.000
score PHOTO_EDITING_FREEM 1.000
score PHP_NOVER_MUA 1.000

Modified: spamassassin/trunk/rulesrc/scores/stats-set0
URL: http://svn.apache.org/viewvc/spamassassin/trunk/rulesrc/scores/stats-set0?rev=1877462&r1=1877461&r2=1877462&view=diff
==============================================================================
--- spamassassin/trunk/rulesrc/scores/stats-set0 (original)
+++ spamassassin/trunk/rulesrc/scores/stats-set0 Thu May 7 06:18:20 2020
@@ -1,40 +1,40 @@
##### WITH NEW RULES AND SCORES #####

# SUMMARY for threshold 5.0:
-# Correctly non-spam: 907343 44.969% (99.539% of non-spam corpus)
-# Correctly spam: 534006 26.466% (48.276% of spam corpus)
-# False positives: 4201 0.208% (0.461% of nonspam, 146431 weighted)
-# False negatives: 572148 28.356% (51.724% of spam, 1258091 weighted)
-# Average score for spam: 5.8 nonspam: 0.6
-# Average for false-pos: 5.7 false-neg: 2.2
-# TOTAL: 2017698 100.00%
+# Correctly non-spam: 900779 43.689% (99.581% of non-spam corpus)
+# Correctly spam: 534245 25.911% (46.166% of spam corpus)
+# False positives: 3794 0.184% (0.419% of nonspam, 140717 weighted)
+# False negatives: 622992 30.216% (53.834% of spam, 1362632 weighted)
+# Average score for spam: 5.5 nonspam: 0.6
+# Average for false-pos: 5.8 false-neg: 2.2
+# TOTAL: 2061810 100.00%

Reading scores from "tmprules"...
Reading per-message hit stat logs and scores...

# SUMMARY for threshold 5.0:
-# Correctly non-spam: 113131 99.44%
-# Correctly spam: 66519 48.20%
-# False positives: 635 0.56%
-# False negatives: 71491 51.80%
-# TCR(l=50): 1.336775 SpamRecall: 48.199% SpamPrec: 99.054%
+# Correctly non-spam: 112456 99.58%
+# Correctly spam: 66816 46.25%
+# False positives: 469 0.42%
+# False negatives: 77659 53.75%
+# TCR(l=50): 1.428903 SpamRecall: 46.247% SpamPrec: 99.303%

##### WITHOUT NEW RULES AND SCORES #####
Reading scores from "../rules-base"...
Reading per-message hit stat logs and scores...

# SUMMARY for threshold 5.0:
-# Correctly non-spam: 898274 98.54%
-# Correctly spam: 371538 33.59%
-# False positives: 13270 1.46%
-# False negatives: 734616 66.41%
-# TCR(l=50): 0.791175 SpamRecall: 33.588% SpamPrec: 96.552%
+# Correctly non-spam: 891364 98.54%
+# Correctly spam: 373943 32.31%
+# False positives: 13209 1.46%
+# False negatives: 783294 67.69%
+# TCR(l=50): 0.801553 SpamRecall: 32.313% SpamPrec: 96.588%
Reading scores from "../rules-base"...
Reading per-message hit stat logs and scores...

# SUMMARY for threshold 5.0:
-# Correctly non-spam: 112100 98.54%
-# Correctly spam: 46361 33.59%
-# False positives: 1666 1.46%
-# False negatives: 91649 66.41%
-# TCR(l=50): 0.788858 SpamRecall: 33.592% SpamPrec: 96.531%
+# Correctly non-spam: 111300 98.56%
+# Correctly spam: 46570 32.23%
+# False positives: 1625 1.44%
+# False negatives: 97905 67.77%
+# TCR(l=50): 0.806425 SpamRecall: 32.234% SpamPrec: 96.628%

Modified: spamassassin/trunk/rulesrc/scores/stats-set1
URL: http://svn.apache.org/viewvc/spamassassin/trunk/rulesrc/scores/stats-set1?rev=1877462&r1=1877461&r2=1877462&view=diff
==============================================================================
--- spamassassin/trunk/rulesrc/scores/stats-set1 (original)
+++ spamassassin/trunk/rulesrc/scores/stats-set1 Thu May 7 06:18:20 2020
@@ -1,40 +1,40 @@
##### WITH NEW RULES AND SCORES #####

# SUMMARY for threshold 5.0:
-# Correctly non-spam: 865799 47.639% (97.901% of non-spam corpus)
-# Correctly spam: 641144 35.278% (68.715% of spam corpus)
-# False positives: 18563 1.021% (2.099% of nonspam, 1235908 weighted)
-# False negatives: 291899 16.061% (31.285% of spam, 992189 weighted)
-# Average score for spam: 11.1 nonspam: -1.8
-# Average for false-pos: 6.3 false-neg: 3.4
-# TOTAL: 1817405 100.00%
+# Correctly non-spam: 872901 48.031% (98.705% of non-spam corpus)
+# Correctly spam: 639086 35.165% (68.496% of spam corpus)
+# False positives: 11451 0.630% (1.295% of nonspam, 861388 weighted)
+# False negatives: 293943 16.174% (31.504% of spam, 1001999 weighted)
+# Average score for spam: 11.1 nonspam: -1.9
+# Average for false-pos: 7.1 false-neg: 3.4
+# TOTAL: 1817381 100.00%

Reading scores from "tmprules"...
Reading per-message hit stat logs and scores...

# SUMMARY for threshold 5.0:
-# Correctly non-spam: 108043 97.88%
-# Correctly spam: 80234 68.90%
-# False positives: 2344 2.12%
-# False negatives: 36215 31.10%
-# TCR(l=50): 0.759046 SpamRecall: 68.901% SpamPrec: 97.161%
+# Correctly non-spam: 108908 98.66%
+# Correctly spam: 80164 68.84%
+# False positives: 1478 1.34%
+# False negatives: 36280 31.16%
+# TCR(l=50): 1.056852 SpamRecall: 68.843% SpamPrec: 98.190%

##### WITHOUT NEW RULES AND SCORES #####
Reading scores from "../rules-base"...
Reading per-message hit stat logs and scores...

# SUMMARY for threshold 5.0:
-# Correctly non-spam: 880842 99.60%
-# Correctly spam: 423724 45.41%
+# Correctly non-spam: 880832 99.60%
+# Correctly spam: 423648 45.41%
# False positives: 3520 0.40%
-# False negatives: 509319 54.59%
-# TCR(l=50): 1.361473 SpamRecall: 45.413% SpamPrec: 99.176%
+# False negatives: 509381 54.59%
+# TCR(l=50): 1.361329 SpamRecall: 45.406% SpamPrec: 99.176%
Reading scores from "../rules-base"...
Reading per-message hit stat logs and scores...

# SUMMARY for threshold 5.0:
-# Correctly non-spam: 109945 99.60%
-# Correctly spam: 53142 45.64%
-# False positives: 442 0.40%
-# False negatives: 63307 54.36%
-# TCR(l=50): 1.363460 SpamRecall: 45.635% SpamPrec: 99.175%
+# Correctly non-spam: 109932 99.59%
+# Correctly spam: 53187 45.68%
+# False positives: 454 0.41%
+# False negatives: 63257 54.32%
+# TCR(l=50): 1.354677 SpamRecall: 45.676% SpamPrec: 99.154%