You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@spamassassin.apache.org by sp...@apache.org on 2020/09/26 03:25:10 UTC
svn commit: r1882031 [2/2] - in /spamassassin/trunk/rulesrc/scores:
72_scores.cf scores-set0 scores-set1 scores-set2 scores-set3 stats-set0
stats-set1
Modified: spamassassin/trunk/rulesrc/scores/scores-set3
URL: http://svn.apache.org/viewvc/spamassassin/trunk/rulesrc/scores/scores-set3?rev=1882031&r1=1882030&r2=1882031&view=diff
==============================================================================
--- spamassassin/trunk/rulesrc/scores/scores-set3 (original)
+++ spamassassin/trunk/rulesrc/scores/scores-set3 Sat Sep 26 03:25:10 2020
@@ -3,190 +3,190 @@
score AC_BR_BONANZA 0.001
score AC_DIV_BONANZA 0.001
-score AC_FROM_MANY_DOTS 2.027
+score AC_FROM_MANY_DOTS 1.906
score AC_HTML_NONSENSE_TAGS 1.997
score AC_POST_EXTRAS 0.001
-score ADMITS_SPAM 0.001
+score ADMITS_SPAM 0.156
score ADVANCE_FEE_2_NEW_MONEY 1.997
-score ADVANCE_FEE_3_NEW_MONEY 2.696
-score ADVANCE_FEE_4_NEW_MONEY 2.198
+score ADVANCE_FEE_3_NEW_MONEY 1.477
+score ADVANCE_FEE_4_NEW_MONEY 2.197
score ADVANCE_FEE_5_NEW 2.896
-score AMAZON_IMG_NOT_RCVD_AMZN 0.301
+score AMAZON_IMG_NOT_RCVD_AMZN 0.993
score AXB_XMAILER_MIMEOLE_OL_024C2 0.001
-score BITCOIN_DEADLINE 2.996
-score BITCOIN_EXTORT_01 4.712
+score BITCOIN_DEADLINE 2.843
+score BITCOIN_EXTORT_01 4.766
score BITCOIN_MALF_HTML 3.496
-score BITCOIN_SPAM_02 2.038
+score BITCOIN_SPAM_02 1.532
score BITCOIN_SPAM_04 1.498
-score BITCOIN_SPAM_05 1.749
+score BITCOIN_SPAM_05 2.076
score BITCOIN_XPRIO 2.497
-score BITCOIN_YOUR_INFO 0.615
+score BITCOIN_YOUR_INFO 0.577
score BODY_URI_ONLY 0.001
score BOGUS_MIME_VERSION 3.496
-score CK_HELO_DYNAMIC_SPLIT_IP 0.593
+score CK_HELO_DYNAMIC_SPLIT_IP 0.314
score CK_HELO_GENERIC 0.248
-score CTE_8BIT_MISMATCH 0.998
-score CTYPE_NULL 2.394
+score CTE_8BIT_MISMATCH 0.999
+score CTYPE_NULL 2.621
score DKIMWL_BL 2.996
-score DKIMWL_WL_HIGH -1.199
-score DKIMWL_WL_MED -0.001
+score DKIMWL_WL_HIGH -1.200
+score DKIMWL_WL_MED -0.001 # force non-zero
score DOTGOV_IMAGE 2.996
score DSN_NO_MIMEVERSION 1.997
score DX_TEXT_03 0.898
-score END_FUTURE_EMAILS 1.048
-score FILL_THIS_FORM 0.455
+score END_FUTURE_EMAILS 1.044
+score FILL_THIS_FORM 1.394
score FONT_INVIS_DIRECT 0.001
score FONT_INVIS_DOTGOV 0.001
-score FONT_INVIS_LONG_LINE 0.009
+score FONT_INVIS_LONG_LINE 0.010
score FONT_INVIS_MSGID 0.001
-score FONT_INVIS_POSTEXTRAS 2.019
+score FONT_INVIS_POSTEXTRAS 3.415
score FORGED_RELAY_MUA_TO_MX 3.995
-score FORGED_SPF_HELO 1.997
-score FORM_FRAUD 0.999
-score FORM_FRAUD_5 2.896
+score FORGED_SPF_HELO 2.097
+score FORM_FRAUD 0.998
+score FORM_FRAUD_5 2.996
score FOUND_YOU 3.246
-score FREEMAIL_FORGED_FROMDOMAIN 0.001
-score FROM_2_EMAILS_SHORT 0.729
-score FROM_ADDR_WS 2.996
+score FREEMAIL_FORGED_FROMDOMAIN 0.001 # force non-zero
+score FROM_2_EMAILS_SHORT 0.631
+score FROM_ADDR_WS 2.816
score FROM_FMBLA_NEWDOM 1.498
-score FROM_FMBLA_NEWDOM14 0.998
+score FROM_FMBLA_NEWDOM14 0.999
score FROM_FMBLA_NEWDOM28 0.798
-score FROM_GOV_DKIM_AU -0.001
+score FROM_GOV_DKIM_AU -0.998
score FROM_GOV_SPOOF 0.998
score FROM_MISSPACED 0.001
score FROM_MISSP_DYNIP 1.660
score FROM_MISSP_EH_MATCH 0.001
-score FROM_MISSP_FREEMAIL 2.305
+score FROM_MISSP_FREEMAIL 0.651
score FROM_MISSP_MSFT 0.001
-score FROM_MISSP_REPLYTO 0.001
-score FROM_MISSP_SPF_FAIL 1.999
-score FROM_MISSP_TO_UNDISC 0.322
+score FROM_MISSP_REPLYTO 0.001 # force non-zero
+score FROM_MISSP_SPF_FAIL 1.997
+score FROM_MISSP_TO_UNDISC 1.596
score FROM_MISSP_USER 0.001
score FROM_MISSP_XPRIO 0.001
score FROM_NAME_EQ_TO_G_DRIVE 0.001
score FROM_NTLD_REPLY_FREEMAIL 0.001
score FROM_SUSPICIOUS_NTLD 0.498
-score FROM_SUSPICIOUS_NTLD_FP 1.156
-score FROM_UNBAL1 2.186
-score FROM_WORDY 1.970
+score FROM_SUSPICIOUS_NTLD_FP 1.075
+score FROM_UNBAL1 2.381
+score FROM_WORDY 2.092
score FSL_BULK_SIG 0.001
score FSL_CTYPE_WIN1251 0.001
score FSL_NEW_HELO_USER 0.001
-score FSL_THIS_IS_ADV 0.647
+score FSL_THIS_IS_ADV 0.487
score GB_FREEMAIL_DISPTO 0.001
score GB_GOOGLE_OBFUS 0.748
-score HDRS_LCASE 0.098
+score HDRS_LCASE 0.099
score HDRS_LCASE_IMGONLY 0.099
-score HDR_ORDER_FTSDMCXX_DIRECT 0.810
-score HDR_ORDER_FTSDMCXX_NORDNS 0.723
-score HEADER_FROM_DIFFERENT_DOMAINS 0.248
-score HELO_MISC_IP 0.027
+score HDR_ORDER_FTSDMCXX_DIRECT 0.821
+score HDR_ORDER_FTSDMCXX_NORDNS 0.581
+score HEADER_FROM_DIFFERENT_DOMAINS 0.249
+score HELO_MISC_IP 0.149
score HELO_NO_DOMAIN 0.001
score HK_RANDOM_FROM 0.001
score HK_RANDOM_REPLYTO 0.998
-score HK_SCAM 1.100
-score HOSTED_IMG_DIRECT_MX 1.584
+score HK_SCAM 0.897
+score HOSTED_IMG_DIRECT_MX 2.116
score HTML_OFF_PAGE 0.001
-score HTML_SINGLET_MANY 0.973
+score HTML_SINGLET_MANY 0.001
score HTML_TEXT_INVISIBLE_FONT 2.996
-score HTML_TEXT_INVISIBLE_STYLE 2.982
+score HTML_TEXT_INVISIBLE_STYLE 2.744
score IMG_ONLY_FM_DOM_INFO 2.497
-score KB_FORGED_MOZ4 2.963
-score KHOP_FAKE_EBAY 0.473
-score KHOP_HELO_FCRDNS 0.275
-score LH_URI_DOM_IN_PATH 2.175
-score LIST_PRTL_SAME_USER 0.456
-score LONG_HEX_URI 1.686
-score LONG_IMG_URI 0.919
-score LONG_INVISIBLE_TEXT 1.849
+score KB_FORGED_MOZ4 2.470
+score KHOP_FAKE_EBAY 0.228
+score KHOP_HELO_FCRDNS 0.274
+score LH_URI_DOM_IN_PATH 2.331
+score LIST_PRTL_SAME_USER 0.978
+score LONG_HEX_URI 1.580
+score LONG_IMG_URI 1.738
+score LONG_INVISIBLE_TEXT 1.850
score LOTS_OF_MONEY 0.010
-score MANY_SPAN_IN_TEXT 1.435
-score MILLION_HUNDRED 0.536
-score MIMEOLE_DIRECT_TO_MX 0.001
+score MANY_SPAN_IN_TEXT 1.436
+score MILLION_HUNDRED 0.535
+score MIMEOLE_DIRECT_TO_MX 0.001 # force non-zero
score MIME_NO_TEXT 0.001
score MIXED_ES 2.696
-score MONEY_FORM_SHORT 1.513
-score MONEY_FRAUD_3 0.870
-score MONEY_FRAUD_5 0.488
-score MONEY_FRAUD_8 0.771
+score MONEY_FORM_SHORT 0.001
+score MONEY_FRAUD_3 0.873
+score MONEY_FRAUD_5 1.036
+score MONEY_FRAUD_8 1.983
score MONEY_FROM_MISSP 1.997
-score MSM_PRIO_REPTO 2.272
-score NICE_REPLY_A -0.238
-score NORDNS_LOW_CONTRAST 1.056
+score MSM_PRIO_REPTO 2.168
+score NICE_REPLY_A -0.213
+score NORDNS_LOW_CONTRAST 1.132
score NO_FM_NAME_IP_HOSTN 0.001
score NSL_RCVD_FROM_USER 0.001
-score NSL_RCVD_HELO_USER 1.710
-score PDS_BTC_ID 0.499
-score PDS_BTC_MSGID 0.001 # force non-zero
-score PDS_EMPTYSUBJ_URISHRT 0.001
+score NSL_RCVD_HELO_USER 1.415
+score PDS_BTC_ID 0.498
+score PDS_BTC_MSGID 0.001
+score PDS_EMPTYSUBJ_URISHRT 0.161
score PDS_FREEMAIL_REPLYTO_URISHRT 1.498
score PDS_FRNOM_TODOM_NAKED_TO 1.498
-score PDS_FROM_2_EMAILS 1.997
+score PDS_FROM_2_EMAILS 2.097
score PDS_FROM_NAME_TO_DOMAIN 0.998
score PDS_NAKED_TO_NUMERO 1.997
-score PDS_SHORTFWD_URISHRT 1.223
-score PDS_TINYSUBJ_URISHRT 1.272
-score PDS_TONAME_EQ_TOLOCAL_FREEM_FORGE 1.496
+score PDS_SHORTFWD_URISHRT 1.498
+score PDS_TINYSUBJ_URISHRT 1.270
+score PDS_TONAME_EQ_TOLOCAL_FREEM_FORGE 0.971
score PDS_TONAME_EQ_TOLOCAL_HDRS_LCASE 1.997
score PDS_TONAME_EQ_TOLOCAL_VSHORT 0.998
score PDS_TO_EQ_FROM_NAME 0.001
score PHP_ORIG_SCRIPT 2.497
score PP_MIME_FAKE_ASCII_TEXT 0.998
-score RATWARE_NO_RDNS 1.354
+score RATWARE_NO_RDNS 1.668
score RCVD_IN_MSPIKE_H2 -0.001
score RISK_FREE 2.896
-score SENDGRID_REDIR 1.499
-score SENDGRID_REDIR_PHISH 3.454
-score SERGIO_SUBJECT_VIAGRA01 2.622
+score SENDGRID_REDIR 1.498
+score SENDGRID_REDIR_PHISH 3.499
+score SERGIO_SUBJECT_VIAGRA01 2.628
score SHORTENED_URL_SRC 2.996
-score SHORTENER_SHORT_IMG 0.287
-score SHORT_BODY_G_DRIVE_DYN 0.519
+score SHORTENER_SHORT_IMG 0.009
+score SHORT_BODY_G_DRIVE_DYN 0.545
score SHORT_SHORTNER 1.997
score SINGLETS_LOW_CONTRAST 0.001
score SPOOFED_FREEMAIL 1.997
-score SPOOFED_FREEMAIL_NO_RDNS 0.274
-score SPOOFED_FREEM_REPTO 1.975
-score SPOOFED_FREEM_REPTO_CHN 0.630
+score SPOOFED_FREEMAIL_NO_RDNS 0.527
+score SPOOFED_FREEM_REPTO 1.995
+score SPOOFED_FREEM_REPTO_CHN 2.477
score STATIC_XPRIO_OLE 1.997
-score STOCK_LOW_CONTRAST 0.212
+score STOCK_LOW_CONTRAST 0.190
score SUBJ_OBFU_PUNCT_FEW 0.748
score SUBJ_OBFU_PUNCT_MANY 1.747
-score SUSP_UTF8_WORD_COMBO 0.462
+score SUSP_UTF8_WORD_COMBO 0.389
score SUSP_UTF8_WORD_FROM 1.997
score SUSP_UTF8_WORD_SUBJ 1.997
score THIS_AD 1.398
-score TONOM_EQ_TOLOC_SHRT_SHRTNER 1.315
-score TO_EQ_FM_DOM_HTML_IMG 0.632
-score TO_EQ_FM_DOM_HTML_ONLY 1.701
+score TONOM_EQ_TOLOC_SHRT_SHRTNER 1.266
+score TO_EQ_FM_DOM_HTML_IMG 0.267
+score TO_EQ_FM_DOM_HTML_ONLY 1.603
score TO_EQ_FM_DOM_SPF_FAIL 0.001
-score TO_EQ_FM_HTML_ONLY 0.829
-score TO_EQ_FM_SPF_FAIL 1.824
-score TO_IN_SUBJ 0.098
+score TO_EQ_FM_HTML_ONLY 0.772
+score TO_EQ_FM_SPF_FAIL 1.732
+score TO_IN_SUBJ 0.099
score TO_NO_BRKTS_FROM_MSSP 2.497
-score TO_NO_BRKTS_HTML_IMG 1.787
-score TO_NO_BRKTS_HTML_ONLY 1.998
-score TO_NO_BRKTS_MSFT 2.335
+score TO_NO_BRKTS_HTML_IMG 1.785
+score TO_NO_BRKTS_HTML_ONLY 1.997
+score TO_NO_BRKTS_MSFT 2.326
score TO_NO_BRKTS_NORDNS_HTML 1.997
-score TVD_RCVD_SPACE_BRACKET 4.299
+score TVD_RCVD_SPACE_BRACKET 4.138
score TVD_SPACE_ENCODED 0.001
score TVD_SPACE_RATIO_MINFP 0.001
-score UPGRADE_MAILBOX 1.797
+score UPGRADE_MAILBOX 1.897
score URI_DOTEDU 0.001
score URI_DOTEDU_ENTITY 2.996
-score URI_DOTEDU_LONG 0.001 # force non-zero
-score URI_GOOGLE_PROXY 0.375
+score URI_DOTEDU_LONG 0.001
+score URI_GOOGLE_PROXY 0.212
score URI_IMG_WP_REDIR 2.996
-score URI_IN_URI_10 1.290
-score URI_IN_URI_5 2.557
-score URI_ONLY_MSGID_MALF 0.860
-score URI_PHISH 3.151
+score URI_IN_URI_10 2.342
+score URI_IN_URI_5 2.211
+score URI_ONLY_MSGID_MALF 0.932
+score URI_PHISH 3.095
score URI_PHP_REDIR 3.496
-score URI_TRY_3LD 1.995
+score URI_TRY_3LD 1.707
score URI_WPADMIN 2.696
-score URI_WP_DIRINDEX 2.820
+score URI_WP_DIRINDEX 2.666
score URI_WP_HACKED 3.496
-score URI_WP_HACKED_2 2.497
-score XPRIO_SHORT_SUBJ 1.445
+score URI_WP_HACKED_2 2.498
+score XPRIO_SHORT_SUBJ 1.444
score AC_SPAMMY_URI_PATTERNS1 1.000
score AC_SPAMMY_URI_PATTERNS10 1.000
score AC_SPAMMY_URI_PATTERNS11 1.000
Modified: spamassassin/trunk/rulesrc/scores/stats-set0
URL: http://svn.apache.org/viewvc/spamassassin/trunk/rulesrc/scores/stats-set0?rev=1882031&r1=1882030&r2=1882031&view=diff
==============================================================================
--- spamassassin/trunk/rulesrc/scores/stats-set0 (original)
+++ spamassassin/trunk/rulesrc/scores/stats-set0 Sat Sep 26 03:25:10 2020
@@ -1,40 +1,40 @@
##### WITH NEW RULES AND SCORES #####
# SUMMARY for threshold 5.0:
-# Correctly non-spam: 849841 50.787% (99.480% of non-spam corpus)
-# Correctly spam: 667031 39.862% (81.439% of spam corpus)
-# False positives: 4441 0.265% (0.520% of nonspam, 140468 weighted)
-# False negatives: 152020 9.085% (18.561% of spam, 387374 weighted)
-# Average score for spam: 8.5 nonspam: 0.5
-# Average for false-pos: 6.6 false-neg: 2.5
-# TOTAL: 1673333 100.00%
+# Correctly non-spam: 851368 52.911% (99.595% of non-spam corpus)
+# Correctly spam: 607320 37.744% (80.521% of spam corpus)
+# False positives: 3463 0.215% (0.405% of nonspam, 107634 weighted)
+# False negatives: 146920 9.131% (19.479% of spam, 371661 weighted)
+# Average score for spam: 8.7 nonspam: 0.5
+# Average for false-pos: 7.0 false-neg: 2.5
+# TOTAL: 1609071 100.00%
Reading scores from "tmprules"...
Reading per-message hit stat logs and scores...
# SUMMARY for threshold 5.0:
-# Correctly non-spam: 106022 99.50%
-# Correctly spam: 83349 81.61%
-# False positives: 531 0.50%
-# False negatives: 18778 18.39%
-# TCR(l=50): 2.253067 SpamRecall: 81.613% SpamPrec: 99.367%
+# Correctly non-spam: 106025 99.43%
+# Correctly spam: 75843 80.65%
+# False positives: 605 0.57%
+# False negatives: 18192 19.35%
+# TCR(l=50): 1.941187 SpamRecall: 80.654% SpamPrec: 99.209%
##### WITHOUT NEW RULES AND SCORES #####
Reading scores from "../rules-base"...
Reading per-message hit stat logs and scores...
# SUMMARY for threshold 5.0:
-# Correctly non-spam: 845709 99.00%
-# Correctly spam: 267015 32.60%
-# False positives: 8573 1.00%
-# False negatives: 552036 67.40%
-# TCR(l=50): 0.835182 SpamRecall: 32.601% SpamPrec: 96.889%
+# Correctly non-spam: 846280 99.00%
+# Correctly spam: 246418 32.67%
+# False positives: 8551 1.00%
+# False negatives: 507822 67.33%
+# TCR(l=50): 0.806353 SpamRecall: 32.671% SpamPrec: 96.646%
Reading scores from "../rules-base"...
Reading per-message hit stat logs and scores...
# SUMMARY for threshold 5.0:
-# Correctly non-spam: 105489 99.00%
-# Correctly spam: 33230 32.54%
-# False positives: 1064 1.00%
-# False negatives: 68897 67.46%
-# TCR(l=50): 0.836442 SpamRecall: 32.538% SpamPrec: 96.897%
+# Correctly non-spam: 105554 98.99%
+# Correctly spam: 30506 32.44%
+# False positives: 1076 1.01%
+# False negatives: 63529 67.56%
+# TCR(l=50): 0.801464 SpamRecall: 32.441% SpamPrec: 96.593%
Modified: spamassassin/trunk/rulesrc/scores/stats-set1
URL: http://svn.apache.org/viewvc/spamassassin/trunk/rulesrc/scores/stats-set1?rev=1882031&r1=1882030&r2=1882031&view=diff
==============================================================================
--- spamassassin/trunk/rulesrc/scores/stats-set1 (original)
+++ spamassassin/trunk/rulesrc/scores/stats-set1 Sat Sep 26 03:25:10 2020
@@ -1,40 +1,40 @@
##### WITH NEW RULES AND SCORES #####
# SUMMARY for threshold 5.0:
-# Correctly non-spam: 852983 45.003% (99.667% of non-spam corpus)
-# Correctly spam: 974384 51.408% (93.729% of spam corpus)
-# False positives: 2849 0.150% (0.333% of nonspam, 269580 weighted)
-# False negatives: 65191 3.439% (6.271% of spam, 134585 weighted)
+# Correctly non-spam: 853130 45.012% (99.685% of non-spam corpus)
+# Correctly spam: 975154 51.450% (93.810% of spam corpus)
+# False positives: 2699 0.142% (0.315% of nonspam, 261186 weighted)
+# False negatives: 64342 3.395% (6.190% of spam, 130938 weighted)
# Average score for spam: 14.3 nonspam: -1.4
-# Average for false-pos: 7.8 false-neg: 2.1
-# TOTAL: 1895407 100.00%
+# Average for false-pos: 8.0 false-neg: 2.0
+# TOTAL: 1895325 100.00%
Reading scores from "tmprules"...
Reading per-message hit stat logs and scores...
# SUMMARY for threshold 5.0:
-# Correctly non-spam: 106375 99.64%
-# Correctly spam: 121871 93.91%
-# False positives: 387 0.36%
-# False negatives: 7904 6.09%
-# TCR(l=50): 4.761686 SpamRecall: 93.909% SpamPrec: 99.683%
+# Correctly non-spam: 106370 99.63%
+# Correctly spam: 121814 93.87%
+# False positives: 392 0.37%
+# False negatives: 7948 6.13%
+# TCR(l=50): 4.710396 SpamRecall: 93.875% SpamPrec: 99.679%
##### WITHOUT NEW RULES AND SCORES #####
Reading scores from "../rules-base"...
Reading per-message hit stat logs and scores...
# SUMMARY for threshold 5.0:
-# Correctly non-spam: 852518 99.61%
-# Correctly spam: 605835 58.28%
-# False positives: 3314 0.39%
-# False negatives: 433740 41.72%
-# TCR(l=50): 1.734244 SpamRecall: 58.277% SpamPrec: 99.456%
+# Correctly non-spam: 852494 99.61%
+# Correctly spam: 605998 58.30%
+# False positives: 3335 0.39%
+# False negatives: 433498 41.70%
+# TCR(l=50): 1.731778 SpamRecall: 58.297% SpamPrec: 99.453%
Reading scores from "../rules-base"...
Reading per-message hit stat logs and scores...
# SUMMARY for threshold 5.0:
-# Correctly non-spam: 106336 99.60%
-# Correctly spam: 75626 58.27%
-# False positives: 426 0.40%
-# False negatives: 54149 41.73%
-# TCR(l=50): 1.720036 SpamRecall: 58.275% SpamPrec: 99.440%
+# Correctly non-spam: 106365 99.63%
+# Correctly spam: 75532 58.21%
+# False positives: 397 0.37%
+# False negatives: 54230 41.79%
+# TCR(l=50): 1.751647 SpamRecall: 58.208% SpamPrec: 99.477%