You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@spamassassin.apache.org by sp...@apache.org on 2023/05/11 02:40:12 UTC
svn commit: r1909735 [2/2] - in /spamassassin/trunk/rulesrc/scores: 72_scores.cf scores-set0 scores-set1 scores-set2 scores-set3 stats-set0 stats-set1
Modified: spamassassin/trunk/rulesrc/scores/scores-set3
URL: http://svn.apache.org/viewvc/spamassassin/trunk/rulesrc/scores/scores-set3?rev=1909735&r1=1909734&r2=1909735&view=diff
==============================================================================
--- spamassassin/trunk/rulesrc/scores/scores-set3 (original)
+++ spamassassin/trunk/rulesrc/scores/scores-set3 Thu May 11 02:40:12 2023
@@ -1,196 +1,197 @@
# Using score set 1 logs for revision 1909647 from:
# ham-net-ena-week0.r1909647.log ham-net-ena-week1.r1909647.log ham-net-ena-week2.r1909647.log ham-net-ena-week3.r1909647.log ham-net-ena-week4.r1909647.log ham-net-giovanni-ham.r1909647.log ham-net-giovanni-spammy.r1909647.log ham-net-giovanni-spam.r1909647.log ham-net-grenier.r1909647.log ham-net-hege.r1909647.log ham-net-jhardin.r1909647.log ham-net-llanga.r1909647.log ham-net-mmiroslaw-mails-ham.r1909647.log ham-net-mmiroslaw-mails-spam.r1909647.log ham-net-spamsponge.r1909647.log ham-net-thendrikx.r1909647.log spam-net-ena-week0.r1909647.log spam-net-ena-week1.r1909647.log spam-net-ena-week2.r1909647.log spam-net-ena-week3.r1909647.log spam-net-ena-week4.r1909647.log spam-net-giovanni-ham.r1909647.log spam-net-giovanni-spammy.r1909647.log spam-net-giovanni-spam.r1909647.log spam-net-grenier.r1909647.log spam-net-hege.r1909647.log spam-net-jhardin.r1909647.log spam-net-llanga.r1909647.log spam-net-mmiroslaw-mails-ham.r1909647.log spam-net-mmiroslaw-mails-spam.r1909647.log spam-net-spamsponge.r1909647.log spam-net-thendrikx.r1909647.log
-score ACCT_PHISHING_MANY 3.000
+score ACCT_PHISHING_MANY 2.999
score AC_BR_BONANZA 0.001
score AC_DIV_BONANZA 0.001
score AC_FROM_MANY_DOTS 2.999
-score AC_HTML_NONSENSE_TAGS 1.915
+score AC_HTML_NONSENSE_TAGS 1.916
score ADMITS_SPAM 0.001
-score ADVANCE_FEE_2_NEW_MONEY 1.999
+score ADVANCE_FEE_2_NEW_MONEY 2.000
score ADVANCE_FEE_3_NEW 3.499
-score ADVANCE_FEE_3_NEW_FRM_MNY 0.544
+score ADVANCE_FEE_3_NEW_FRM_MNY 0.601
score ADVANCE_FEE_3_NEW_MONEY 2.299
score ADVANCE_FEE_4_NEW_FRM_MNY 0.001
-score ADVANCE_FEE_4_NEW_MONEY 2.243
-score ADVANCE_FEE_5_NEW_FRM_MNY 0.892
+score ADVANCE_FEE_4_NEW_MONEY 2.399
+score ADVANCE_FEE_5_NEW_FRM_MNY 1.212
score ADVANCE_FEE_5_NEW_MONEY 0.001
-score AD_PREFS 0.469
+score AD_PREFS 0.430
score AMAZON_IMG_NOT_RCVD_AMZN 0.001
score AXB_XMAILER_MIMEOLE_OL_024C2 0.001
score BITCOIN_DEADLINE 2.999
-score BITCOIN_MALF_HTML 1.483
-score BITCOIN_MALWARE 2.234
+score BITCOIN_MALF_HTML 1.494
+score BITCOIN_MALWARE 1.977
score BITCOIN_OBFU_SUBJ 1.765
-score BITCOIN_SPAM_02 1.535
+score BITCOIN_SPAM_02 2.303
score BITCOIN_SPAM_07 3.499
-score BITCOIN_XPRIO 2.300
-score BITCOIN_YOUR_INFO 2.839
-score BODY_SINGLE_URI 0.465
+score BITCOIN_XPRIO 2.197
+score BITCOIN_YOUR_INFO 2.532
+score BODY_SINGLE_URI 0.425
score BODY_SINGLE_WORD 0.001
-score BODY_URI_ONLY 2.026
+score BODY_URI_ONLY 2.066
score CK_HELO_GENERIC 0.249
-score CTE_8BIT_MISMATCH 0.001
-score DATE_IN_FUTURE_Q_PLUS 2.400
-score DEAR_BENEFICIARY 1.666
+score CTE_8BIT_MISMATCH 0.001 # force non-zero
+score DATE_IN_FUTURE_Q_PLUS 2.399
+score DEAR_BENEFICIARY 2.538
score DKIMWL_WL_HIGH -0.001
score DKIMWL_WL_MED -0.001 # force non-zero
score DKIMWL_WL_MEDHI -0.001
score END_FUTURE_EMAILS 2.499
-score FILL_THIS_FORM 0.599
+score FILL_THIS_FORM 0.600
score FONT_INVIS_DIRECT 0.001
score FONT_INVIS_LONG_LINE 2.999
-score FONT_INVIS_MSGID 0.880
-score FONT_INVIS_POSTEXTRAS 0.914
-score FORGED_SPF_HELO 1.800
+score FONT_INVIS_MSGID 0.911
+score FONT_INVIS_POSTEXTRAS 0.752
+score FORGED_SPF_HELO 1.799
score FORM_FRAUD 0.999
score FORM_FRAUD_5 0.001
-score FREEMAIL_FORGED_FROMDOMAIN 0.250
+score FREEMAIL_FORGED_FROMDOMAIN 0.249
score FROM_ADDR_WS 2.999
-score FROM_FMBLA_NEWDOM14 0.001 # force non-zero
+score FROM_FMBLA_NEWDOM14 0.001
score FROM_FMBLA_NEWDOM28 0.799
-score FROM_GOV_DKIM_AU -0.435
+score FROM_GOV_DKIM_AU -0.206
score FROM_IN_TO_AND_SUBJ 1.799
-score FROM_MISSPACED 0.540
-score FROM_MISSP_EH_MATCH 1.853
-score FROM_MISSP_FREEMAIL 2.696
+score FROM_MISSPACED 0.458
+score FROM_MISSP_EH_MATCH 1.935
+score FROM_MISSP_FREEMAIL 2.614
score FROM_MISSP_MSFT 0.001
-score FROM_MISSP_REPLYTO 2.143
-score FROM_MISSP_SPF_FAIL 0.001
+score FROM_MISSP_REPLYTO 2.146
+score FROM_MISSP_SPF_FAIL 0.001 # force non-zero
score FROM_MISSP_USER 0.001
-score FROM_PAYPAL_SPOOF 0.001
-score FROM_SUSPICIOUS_NTLD 0.191
-score FROM_SUSPICIOUS_NTLD_FP 2.000
+score FROM_PAYPAL_SPOOF 0.965
+score FROM_SUSPICIOUS_NTLD 0.190
+score FROM_SUSPICIOUS_NTLD_FP 1.999
score FSL_BULK_SIG 0.001
score FSL_CTYPE_WIN1251 0.001
-score FSL_NEW_HELO_USER 0.001
-score FUZZY_AMAZON 0.001
+score FSL_NEW_HELO_USER 0.001 # force non-zero
+score FUZZY_AMAZON 0.001 # force non-zero
score GB_CUSTOM_HTM_URI 0.835
-score GB_FAKE_RF_SHORT 1.999
+score GB_FAKE_RF_SHORT 2.000
score GB_FREEMAIL_DISPTO 0.001
-score GB_GOOGLE_TRANSL 0.589
-score GB_HASHBL_BTC 4.902
+score GB_GOOGLE_TRANSL 0.587
+score GB_HASHBL_BTC 4.699
score GOOG_REDIR_HTML_ONLY 1.999
score GOOG_REDIR_NORDNS 2.899
-score GOOG_STO_NOIMG_HTML 2.950
-score HAS_X_OUTGOING_SPAM_STAT 0.794
-score HDRS_MISSP 0.778
+score GOOG_STO_NOIMG_HTML 2.946
+score HAS_X_OUTGOING_SPAM_STAT 0.797
+score HDRS_MISSP 0.768
score HDR_ORDER_FTSDMCXX_DIRECT 0.001
-score HDR_ORDER_FTSDMCXX_NORDNS 0.001 # force non-zero
-score HEADER_FROM_DIFFERENT_DOMAINS 0.249
-score HELO_NO_DOMAIN 0.001
+score HDR_ORDER_FTSDMCXX_NORDNS 0.001
+score HEADER_FROM_DIFFERENT_DOMAINS 0.250
+score HELO_NO_DOMAIN 0.006
score HK_NAME_MR_MRS 0.999
score HK_RANDOM_ENVFROM 0.001
score HK_RANDOM_FROM 0.001
score HK_RANDOM_REPLYTO 0.999
-score HK_SCAM 0.416
+score HK_SCAM 0.428
score HOSTED_IMG_DIRECT_MX 0.001
-score HOSTED_IMG_FREEM 2.088
+score HOSTED_IMG_FREEM 2.079
score HTML_FONT_TINY_NORDNS 0.001
score HTML_OFF_PAGE 0.001
-score HTML_TAG_BALANCE_CENTER 2.521
-score HTML_TEXT_INVISIBLE_FONT 1.500
-score HTML_TEXT_INVISIBLE_STYLE 0.001 # force non-zero
-score JH_SPAMMY_HEADERS 3.499
+score HTML_TAG_BALANCE_CENTER 2.494
+score HTML_TEXT_INVISIBLE_FONT 1.514
+score HTML_TEXT_INVISIBLE_STYLE 0.001
+score JH_SPAMMY_HEADERS 3.500
score KHOP_HELO_FCRDNS 0.001
-score LONG_HEX_URI 2.999
-score LONG_IMG_URI 0.001 # force non-zero
-score LONG_INVISIBLE_TEXT 1.826
+score LONG_HEX_URI 3.000
+score LONG_IMG_URI 0.001
+score LONG_INVISIBLE_TEXT 1.827
score LOTS_OF_MONEY 0.010
-score MALWARE_NORDNS 0.776
-score MALWARE_PASSWORD 0.428
+score MALWARE_NORDNS 3.238
+score MALWARE_PASSWORD 1.251
score MANY_SPAN_IN_TEXT 2.199
score MILLION_HUNDRED 0.001
-score MILLION_USD 1.999
-score MIMEOLE_DIRECT_TO_MX 0.001
+score MILLION_USD 1.046
+score MIMEOLE_DIRECT_TO_MX 0.001 # force non-zero
score MIME_NO_TEXT 1.999
-score MIXED_CENTER_CASE 2.492
-score MIXED_ES 0.772
-score MIXED_HREF_CASE 0.690
-score MONEY_ATM_CARD 0.001
+score MIXED_CENTER_CASE 2.218
+score MIXED_ES 0.768
+score MIXED_HREF_CASE 1.790
+score MONEY_ATM_CARD 1.874
score MONEY_FORM 0.001
score MONEY_FORM_SHORT 0.001
score MONEY_FRAUD_3 0.001
-score MONEY_FRAUD_5 2.263
-score MONEY_FRAUD_8 0.012
-score MONEY_FREEMAIL_REPTO 2.132
+score MONEY_FRAUD_5 2.261
+score MONEY_FRAUD_8 0.001
+score MONEY_FREEMAIL_REPTO 2.136
score MONEY_FROM_MISSP 0.001
-score MSMAIL_PRI_ABNORMAL 1.280
+score MSMAIL_PRI_ABNORMAL 0.302
score NA_DOLLARS 0.495
-score NICE_REPLY_A -3.251
+score NICE_REPLY_A -2.124
score NO_FM_NAME_IP_HOSTN 0.001
score NSL_RCVD_FROM_USER 0.001
-score NSL_RCVD_HELO_USER 0.001
-score OBFU_TEXT_ATTACH 0.935
-score PDS_BAD_THREAD_QP_64 1.000
-score PDS_BTC_ID 0.001
-score PDS_BTC_MSGID 0.438
-score PDS_EMPTYSUBJ_URISHRT 0.783
-score PDS_FRNOM_TODOM_DBL_URL 1.499
+score NSL_RCVD_HELO_USER 0.001 # force non-zero
+score OBFU_TEXT_ATTACH 0.540
+score PDS_BAD_THREAD_QP_64 0.999
+score PDS_BTC_ID 0.203
+score PDS_BTC_MSGID 0.999
+score PDS_EMPTYSUBJ_URISHRT 0.824
+score PDS_FRNOM_TODOM_DBL_URL 1.421
score PDS_FRNOM_TODOM_NAKED_TO 1.499
-score PDS_FROM_2_EMAILS_SHRTNER 1.312
+score PDS_FROM_2_EMAILS_SHRTNER 1.177
score PDS_FROM_NAME_TO_DOMAIN 1.999
-score PDS_HELO_SPF_FAIL 0.001
+score PDS_HELO_SPF_FAIL 1.069
score PDS_NO_FULL_NAME_SPOOFED_URL 0.749
score PDS_SHORT_SPOOFED_URL 1.999
score PDS_TINYSUBJ_URISHRT 1.499
score PDS_TONAME_EQ_TOLOCAL_FREEM_FORGE 0.001
-score PHP_SCRIPT 2.499
+score PHP_SCRIPT 2.500
score POSSIBLE_AMAZON_PHISH_02 2.299
-score POSSIBLE_GMAIL_PHISHER 1.590
+score POSSIBLE_GMAIL_PHISHER 2.238
score PP_MIME_FAKE_ASCII_TEXT 0.001
-score RAND_HEADER_MANY 1.969
-score RAND_MKTG_HEADER 1.999
+score RAND_HEADER_MANY 1.966
+score RAND_MKTG_HEADER 2.000
score RATWARE_NO_RDNS 0.001
score RCVD_IN_MSPIKE_H2 -0.001 # force non-zero
-score SCC_BODY_SINGLE_WORD 0.001
+score SCC_BODY_SINGLE_WORD 0.001 # force non-zero
score SCC_ISEMM_LID_1B 1.499
-score SENDGRID_REDIR 0.790
+score SENDGRID_REDIR 0.789
score SERGIO_SUBJECT_VIAGRA01 0.001
score SHOPIFY_IMG_NOT_RCVD_SFY 2.499
score SHORT_SHORTNER 1.999
score SPOOFED_FREEMAIL 0.001 # force non-zero
score SPOOFED_FREEMAIL_NO_RDNS 0.001
-score SPOOFED_FREEM_REPTO 0.001 # force non-zero
+score SPOOFED_FREEM_REPTO 0.001
score SPOOF_GMAIL_MID 0.001
-score STATIC_XPRIO_OLE 1.861
-score STOX_BOUND_090909_B 3.202
-score SUSP_UTF8_WORD_COMBO 1.464
-score SUSP_UTF8_WORD_SUBJ 1.899
+score STATIC_XPRIO_OLE 1.862
+score STOX_BOUND_090909_B 1.877
+score SUSP_UTF8_WORD_COMBO 1.458
+score SUSP_UTF8_WORD_SUBJ 1.900
score THIS_AD 0.799
-score TONOM_EQ_TOLOC_SHRT_SHRTNER 0.401
-score TO_EQ_FM_DIRECT_MX 0.254
+score TONOM_EQ_TOLOC_SHRT_SHRTNER 0.396
+score TO_EQ_FM_DIRECT_MX 0.246
+score TO_EQ_FM_DOM_HTML_ONLY 1.823
score TO_EQ_FM_DOM_SPF_FAIL 0.001
score TO_EQ_FM_SPF_FAIL 0.001
score TO_IN_SUBJ 0.099
score TO_NAME_SUBJ_NO_RDNS 2.999
-score TO_NO_BRKTS_FROM_MSSP 2.500
+score TO_NO_BRKTS_FROM_MSSP 2.499
score TO_NO_BRKTS_HTML_IMG 1.999
score TO_NO_BRKTS_HTML_ONLY 1.999
score TO_NO_BRKTS_MSFT 0.001
-score TO_NO_BRKTS_NORDNS_HTML 1.822
+score TO_NO_BRKTS_NORDNS_HTML 1.824
score TO_NO_BRKTS_PCNT 2.499
score TR_JS_REDIRECTION_0 2.199
score TVD_SPACE_ENCODED 0.001
-score TVD_SPACE_RATIO_MINFP 0.001
+score TVD_SPACE_RATIO_MINFP 0.001 # force non-zero
score UNDISC_FREEM 2.699
score UNDISC_MONEY 2.899
score UNICODE_OBFU_ASC 2.499
score URI_DOTEDU 1.999
-score URI_GOOGLE_PROXY 2.400
+score URI_GOOGLE_PROXY 2.399
score URI_MALWARE_BH 0.999
-score URI_ONLY_MSGID_MALF 0.419
-score URI_PHISH 3.797
+score URI_ONLY_MSGID_MALF 1.243
+score URI_PHISH 3.625
score URI_TRY_3LD 1.999
-score URI_WP_HACKED 0.769
-score URI_WP_HACKED_2 2.499
+score URI_WP_HACKED 0.770
+score URI_WP_HACKED_2 2.500
score VFY_ACCT_NORDNS 0.001
-score WORD_INVIS 0.809
+score WORD_INVIS 0.807
score WORD_INVIS_MANY 2.999
score XFER_LOTSA_MONEY 0.001 # force non-zero
score XM_RANDOM 0.001
score XPRIO 0.001
-score YOU_INHERIT 1.682
+score YOU_INHERIT 0.266
score AC_POST_EXTRAS 1.000
score AC_SPAMMY_URI_PATTERNS1 1.000
score AC_SPAMMY_URI_PATTERNS10 1.000
@@ -280,6 +281,7 @@ score GOOG_STO_HTML_PHISH_MANY 1.0
score GOOG_STO_IMG_HTML 1.000
score GOOG_STO_IMG_NOHTML 1.000
score HAS_X_NO_RELAY 1.000
+score HDRS_LCASE 0.100
score HEXHASH_WORD 1.000
score HK_CTE_RAW 1.000
score HK_LOTTO 1.000
Modified: spamassassin/trunk/rulesrc/scores/stats-set0
URL: http://svn.apache.org/viewvc/spamassassin/trunk/rulesrc/scores/stats-set0?rev=1909735&r1=1909734&r2=1909735&view=diff
==============================================================================
--- spamassassin/trunk/rulesrc/scores/stats-set0 (original)
+++ spamassassin/trunk/rulesrc/scores/stats-set0 Thu May 11 02:40:12 2023
@@ -1,40 +1,40 @@
##### WITH NEW RULES AND SCORES #####
# SUMMARY for threshold 5.0:
-# Correctly non-spam: 341130 80.292% (99.361% of non-spam corpus)
-# Correctly spam: 48245 11.355% (59.168% of spam corpus)
-# False positives: 2194 0.516% (0.639% of nonspam, 17170 weighted)
-# False negatives: 33294 7.836% (40.832% of spam, 51688 weighted)
-# Average score for spam: 9.4 nonspam: 0.5
-# Average for false-pos: 6.6 false-neg: 1.6
-# TOTAL: 424863 100.00%
+# Correctly non-spam: 346810 80.594% (99.391% of non-spam corpus)
+# Correctly spam: 49033 11.395% (60.251% of spam corpus)
+# False positives: 2126 0.494% (0.609% of nonspam, 16574 weighted)
+# False negatives: 32348 7.517% (39.749% of spam, 48728 weighted)
+# Average score for spam: 9.3 nonspam: 0.7
+# Average for false-pos: 6.7 false-neg: 1.5
+# TOTAL: 430317 100.00%
Reading scores from "tmprules"...
Reading per-message hit stat logs and scores...
# SUMMARY for threshold 5.0:
-# Correctly non-spam: 42557 99.43%
-# Correctly spam: 5969 57.95%
-# False positives: 246 0.57%
-# False negatives: 4332 42.05%
-# TCR(l=50): 0.619348 SpamRecall: 57.946% SpamPrec: 96.042%
+# Correctly non-spam: 43222 99.38%
+# Correctly spam: 6130 59.64%
+# False positives: 269 0.62%
+# False negatives: 4148 40.36%
+# TCR(l=50): 0.584044 SpamRecall: 59.642% SpamPrec: 95.796%
##### WITHOUT NEW RULES AND SCORES #####
Reading scores from "../rules-base"...
Reading per-message hit stat logs and scores...
# SUMMARY for threshold 5.0:
-# Correctly non-spam: 335958 97.85%
-# Correctly spam: 45323 55.58%
-# False positives: 7366 2.15%
-# False negatives: 36216 44.42%
-# TCR(l=50): 0.201572 SpamRecall: 55.584% SpamPrec: 86.020%
+# Correctly non-spam: 341485 97.86%
+# Correctly spam: 46616 57.28%
+# False positives: 7451 2.14%
+# False negatives: 34765 42.72%
+# TCR(l=50): 0.199799 SpamRecall: 57.281% SpamPrec: 86.219%
Reading scores from "../rules-base"...
Reading per-message hit stat logs and scores...
# SUMMARY for threshold 5.0:
-# Correctly non-spam: 41898 97.89%
-# Correctly spam: 5734 55.66%
-# False positives: 905 2.11%
-# False negatives: 4567 44.34%
-# TCR(l=50): 0.206777 SpamRecall: 55.664% SpamPrec: 86.368%
+# Correctly non-spam: 42552 97.84%
+# Correctly spam: 5925 57.65%
+# False positives: 939 2.16%
+# False negatives: 4353 42.35%
+# TCR(l=50): 0.200339 SpamRecall: 57.647% SpamPrec: 86.320%
Modified: spamassassin/trunk/rulesrc/scores/stats-set1
URL: http://svn.apache.org/viewvc/spamassassin/trunk/rulesrc/scores/stats-set1?rev=1909735&r1=1909734&r2=1909735&view=diff
==============================================================================
--- spamassassin/trunk/rulesrc/scores/stats-set1 (original)
+++ spamassassin/trunk/rulesrc/scores/stats-set1 Thu May 11 02:40:12 2023
@@ -1,23 +1,23 @@
##### WITH NEW RULES AND SCORES #####
# SUMMARY for threshold 5.0:
-# Correctly non-spam: 312576 77.843% (98.900% of non-spam corpus)
-# Correctly spam: 56636 14.104% (66.245% of spam corpus)
-# False positives: 3475 0.865% (1.100% of nonspam, 107565 weighted)
-# False negatives: 28859 7.187% (33.755% of spam, 50396 weighted)
-# Average score for spam: 13.5 nonspam: -0.4
-# Average for false-pos: 11.4 false-neg: 1.7
+# Correctly non-spam: 312603 77.850% (98.909% of non-spam corpus)
+# Correctly spam: 56675 14.114% (66.290% of spam corpus)
+# False positives: 3448 0.859% (1.091% of nonspam, 107224 weighted)
+# False negatives: 28820 7.177% (33.710% of spam, 50279 weighted)
+# Average score for spam: 13.1 nonspam: -0.3
+# Average for false-pos: 11.5 false-neg: 1.7
# TOTAL: 401546 100.00%
Reading scores from "tmprules"...
Reading per-message hit stat logs and scores...
# SUMMARY for threshold 5.0:
-# Correctly non-spam: 38979 98.89%
-# Correctly spam: 7112 65.96%
-# False positives: 436 1.11%
-# False negatives: 3670 34.04%
-# TCR(l=50): 0.423322 SpamRecall: 65.962% SpamPrec: 94.224%
+# Correctly non-spam: 38978 98.89%
+# Correctly spam: 7116 66.00%
+# False positives: 437 1.11%
+# False negatives: 3666 34.00%
+# TCR(l=50): 0.422558 SpamRecall: 65.999% SpamPrec: 94.214%
##### WITHOUT NEW RULES AND SCORES #####
Reading scores from "../rules-base"...