You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@spamassassin.apache.org by sp...@apache.org on 2023/05/16 02:41:27 UTC
svn commit: r1909851 [2/2] - in /spamassassin/trunk/rulesrc/scores: 72_scores.cf scores-set0 scores-set1 scores-set2 scores-set3 stats-set0 stats-set1
Modified: spamassassin/trunk/rulesrc/scores/scores-set3
URL: http://svn.apache.org/viewvc/spamassassin/trunk/rulesrc/scores/scores-set3?rev=1909851&r1=1909850&r2=1909851&view=diff
==============================================================================
--- spamassassin/trunk/rulesrc/scores/scores-set3 (original)
+++ spamassassin/trunk/rulesrc/scores/scores-set3 Tue May 16 02:41:27 2023
@@ -1,181 +1,180 @@
# Using score set 1 logs for revision 1909791 from:
# ham-net-ena-week0.r1909791.log ham-net-ena-week1.r1909791.log ham-net-ena-week2.r1909791.log ham-net-ena-week3.r1909791.log ham-net-ena-week4.r1909791.log ham-net-giovanni-ham.r1909791.log ham-net-giovanni-spammy.r1909791.log ham-net-giovanni-spam.r1909791.log ham-net-grenier.r1909791.log ham-net-hege.r1909791.log ham-net-jhardin.r1909791.log ham-net-llanga.r1909791.log ham-net-mmiroslaw-mails-ham.r1909791.log ham-net-mmiroslaw-mails-spam.r1909791.log ham-net-spamsponge.r1909791.log ham-net-thendrikx.r1909791.log ham-net-tsz-spam-corpus.r1909791.log spam-net-ena-week0.r1909791.log spam-net-ena-week1.r1909791.log spam-net-ena-week2.r1909791.log spam-net-ena-week3.r1909791.log spam-net-ena-week4.r1909791.log spam-net-giovanni-ham.r1909791.log spam-net-giovanni-spammy.r1909791.log spam-net-giovanni-spam.r1909791.log spam-net-grenier.r1909791.log spam-net-hege.r1909791.log spam-net-jhardin.r1909791.log spam-net-llanga.r1909791.log spam-net-mmiroslaw-mails-ham.r1909791.log spam-net-mmiroslaw-mails-spam.r1909791.log spam-net-spamsponge.r1909791.log spam-net-thendrikx.r1909791.log spam-net-tsz-spam-corpus.r1909791.log
-score ACCT_PHISHING_MANY 2.999
+score ACCT_PHISHING_MANY 3.000
score AC_BR_BONANZA 0.001 # force non-zero
score AC_DIV_BONANZA 0.001
score AC_FROM_MANY_DOTS 2.999
score AC_HTML_NONSENSE_TAGS 1.999
score ADMITS_SPAM 0.001
score ADVANCE_FEE_2_NEW_MONEY 1.999
-score ADVANCE_FEE_3_NEW_FRM_MNY 1.054
+score ADVANCE_FEE_3_NEW_FRM_MNY 1.209
score ADVANCE_FEE_3_NEW_MONEY 2.399
-score ADVANCE_FEE_4_NEW_MONEY 1.284
-score ADVANCE_FEE_5_NEW_FRM_MNY 2.150
+score ADVANCE_FEE_4_NEW_MONEY 1.280
+score ADVANCE_FEE_5_NEW_FRM_MNY 0.140
score ADVANCE_FEE_5_NEW_MONEY 0.001
-score AD_PREFS 0.326
+score AD_PREFS 0.218
score AMAZON_IMG_NOT_RCVD_AMZN 0.001 # force non-zero
score AXB_XMAILER_MIMEOLE_OL_024C2 0.001
score BIGNUM_EMAILS_FREEM 1.724
-score BITCOIN_DEADLINE 3.000
-score BITCOIN_EXTORT_01 3.988
-score BITCOIN_MALF_HTML 2.500
-score BITCOIN_MALWARE 2.029
-score BITCOIN_SPAM_02 2.500
-score BITCOIN_SPAM_07 2.346
-score BITCOIN_XPRIO 1.256
+score BITCOIN_DEADLINE 1.905
+score BITCOIN_EXTORT_01 3.995
+score BITCOIN_MALF_HTML 3.342
+score BITCOIN_MALWARE 1.223
+score BITCOIN_SPAM_02 2.499
+score BITCOIN_SPAM_07 1.504
+score BITCOIN_XPRIO 0.374
score BITCOIN_YOUR_INFO 2.999
-score BODY_SINGLE_URI 0.317
+score BODY_SINGLE_URI 0.414
score BODY_SINGLE_WORD 0.001
-score BODY_URI_ONLY 1.529
+score BODY_URI_ONLY 1.521
score CK_HELO_GENERIC 0.249
score CTE_8BIT_MISMATCH 0.001
-score DATE_IN_FUTURE_Q_PLUS 2.699
-score DEAR_BENEFICIARY 1.710
+score DATE_IN_FUTURE_Q_PLUS 2.700
+score DEAR_BENEFICIARY 0.001
score DKIMWL_WL_HIGH -0.001
score DKIMWL_WL_MED -0.001 # force non-zero
-score DKIMWL_WL_MEDHI -0.001
+score DKIMWL_WL_MEDHI -0.001 # force non-zero
score DSN_NO_MIMEVERSION 0.001
score ENCRYPTED_MESSAGE -0.999
-score END_FUTURE_EMAILS 2.499
+score END_FUTURE_EMAILS 2.500
score FAKE_REPLY_A1 0.001
-score FAKE_REPLY_B 0.001
+score FAKE_REPLY_B 0.001 # force non-zero
score FILL_THIS_FORM 0.499
score FONT_INVIS_DIRECT 0.001
score FONT_INVIS_LONG_LINE 2.999
-score FONT_INVIS_MSGID 0.339
-score FONT_INVIS_POSTEXTRAS 0.754
-score FORGED_SPF_HELO 0.752
-score FORM_FRAUD 0.999
+score FONT_INVIS_MSGID 0.003
+score FONT_INVIS_POSTEXTRAS 0.560
+score FORGED_SPF_HELO 0.755
+score FORM_FRAUD 1.000
score FORM_FRAUD_5 0.001
score FREEMAIL_FORGED_FROMDOMAIN 0.249
-score FROM_ADDR_WS 2.126
+score FROM_ADDR_WS 2.128
score FROM_FMBLA_NEWDOM28 0.799
-score FROM_GOV_DKIM_AU -0.594
+score FROM_GOV_DKIM_AU -0.136
score FROM_IN_TO_AND_SUBJ 1.899
-score FROM_MISSPACED 1.032
-score FROM_MISSP_EH_MATCH 1.549
+score FROM_MISSPACED 0.907
+score FROM_MISSP_EH_MATCH 1.560
score FROM_MISSP_FREEMAIL 2.999
-score FROM_MISSP_MSFT 0.001
-score FROM_MISSP_REPLYTO 2.144
+score FROM_MISSP_MSFT 0.001 # force non-zero
+score FROM_MISSP_REPLYTO 2.141
score FROM_MISSP_SPF_FAIL 0.001
score FROM_MISSP_USER 0.001
-score FROM_PAYPAL_SPOOF 1.478
-score FROM_SUSPICIOUS_NTLD 0.191
+score FROM_PAYPAL_SPOOF 0.678
+score FROM_SUSPICIOUS_NTLD 0.192
score FROM_SUSPICIOUS_NTLD_FP 1.999
-score FSL_BULK_SIG 0.001
-score FSL_CTYPE_WIN1251 0.001 # force non-zero
-score FSL_NEW_HELO_USER 0.001 # force non-zero
+score FSL_BULK_SIG 0.001 # force non-zero
+score FSL_CTYPE_WIN1251 0.001
+score FSL_NEW_HELO_USER 0.001
score FUZZY_AMAZON 0.001
score GB_CUSTOM_HTM_URI 1.499
-score GB_FAKE_RF_SHORT 1.999
+score GB_FAKE_RF_SHORT 2.000
score GB_FREEMAIL_DISPTO 0.001
score GB_GOOGLE_TRANSL 0.749
-score GB_HASHBL_BTC 4.579
-score GOOG_MALWARE_DNLD 1.894
+score GB_HASHBL_BTC 4.707
+score GOOG_MALWARE_DNLD 1.738
score GOOG_REDIR_HTML_ONLY 1.999
score GOOG_REDIR_NORDNS 3.099
-score GOOG_STO_NOIMG_HTML 2.947
-score HAS_X_OUTGOING_SPAM_STAT 0.798
-score HDRS_MISSP 0.727
+score GOOG_STO_NOIMG_HTML 2.951
+score HAS_X_OUTGOING_SPAM_STAT 0.794
+score HDRS_MISSP 0.722
score HDR_ORDER_FTSDMCXX_DIRECT 0.001
score HDR_ORDER_FTSDMCXX_NORDNS 0.001
-score HEADER_FROM_DIFFERENT_DOMAINS 0.249
-score HELO_NO_DOMAIN 0.164
+score HEADER_FROM_DIFFERENT_DOMAINS 0.250
+score HELO_NO_DOMAIN 0.169
score HK_NAME_MR_MRS 0.999
-score HK_RANDOM_ENVFROM 0.001 # force non-zero
+score HK_RANDOM_ENVFROM 0.001
score HK_RANDOM_FROM 0.001
score HK_RANDOM_REPLYTO 0.999
score HK_SCAM 0.001
-score HOSTED_IMG_DIRECT_MX 0.001 # force non-zero
+score HOSTED_IMG_DIRECT_MX 0.001
score HOSTED_IMG_FREEM 0.001
-score HOSTED_IMG_MULTI_PUB_01 2.999
+score HOSTED_IMG_MULTI_PUB_01 3.000
score HTML_ENTITY_ASCII 2.999
-score HTML_ENTITY_ASCII_TINY 2.975
+score HTML_ENTITY_ASCII_TINY 2.999
score HTML_OFF_PAGE 0.001
-score HTML_TAG_BALANCE_CENTER 2.785
-score HTML_TEXT_INVISIBLE_FONT 1.549
-score HTML_TEXT_INVISIBLE_STYLE 1.390
+score HTML_TAG_BALANCE_CENTER 2.798
+score HTML_TEXT_INVISIBLE_FONT 1.780
+score HTML_TEXT_INVISIBLE_STYLE 1.384
score JH_SPAMMY_HEADERS 3.499
score KHOP_HELO_FCRDNS 0.001
score LONG_HEX_URI 2.999
-score LONG_IMG_URI 0.001
-score LONG_INVISIBLE_TEXT 1.828
+score LONG_IMG_URI 0.001 # force non-zero
+score LONG_INVISIBLE_TEXT 1.831
score LOTS_OF_MONEY 0.010
-score MALWARE_NORDNS 3.376
-score MALWARE_PASSWORD 0.956
+score MALWARE_NORDNS 3.095
+score MALWARE_PASSWORD 1.673
score MILLION_HUNDRED 0.001
score MILLION_USD 1.999
score MIMEOLE_DIRECT_TO_MX 0.001
score MIME_NO_TEXT 1.999
-score MIXED_CENTER_CASE 1.288
-score MIXED_ES 1.699
-score MONEY_ATM_CARD 1.570
+score MIXED_CENTER_CASE 1.318
+score MIXED_ES 1.700
+score MONEY_ATM_CARD 1.046
score MONEY_FORM 0.001
score MONEY_FORM_SHORT 0.001
-score MONEY_FRAUD_3 0.285
+score MONEY_FRAUD_3 0.292
score MONEY_FRAUD_5 2.699
score MONEY_FRAUD_8 0.001
-score MONEY_FREEMAIL_REPTO 2.236
+score MONEY_FREEMAIL_REPTO 2.235
score MONEY_FROM_MISSP 0.001
-score MSMAIL_PRI_ABNORMAL 0.540
+score MSMAIL_PRI_ABNORMAL 1.496
score NA_DOLLARS 0.001
-score NICE_REPLY_A -3.811
+score NICE_REPLY_A -2.666
score NO_FM_NAME_IP_HOSTN 0.001
score NSL_RCVD_FROM_USER 0.001
score NSL_RCVD_HELO_USER 0.001
-score OBFU_TEXT_ATTACH 0.571
+score OBFU_TEXT_ATTACH 0.719
score PDS_BAD_THREAD_QP_64 0.999
score PDS_BRAND_SUBJ_NAKED_TO 0.999
-score PDS_BTC_ID 0.322
-score PDS_BTC_MSGID 0.739
-score PDS_EMPTYSUBJ_URISHRT 1.181
+score PDS_BTC_ID 0.194
+score PDS_BTC_MSGID 0.341
+score PDS_EMPTYSUBJ_URISHRT 1.082
score PDS_FRNOM_TODOM_DBL_URL 1.499
-score PDS_FRNOM_TODOM_NAKED_TO 1.458
-score PDS_FROM_2_EMAILS_SHRTNER 0.980
-score PDS_FROM_NAME_TO_DOMAIN 1.950
-score PDS_NO_FULL_NAME_SPOOFED_URL 0.750
+score PDS_FRNOM_TODOM_NAKED_TO 1.470
+score PDS_FROM_2_EMAILS_SHRTNER 0.172
+score PDS_FROM_NAME_TO_DOMAIN 1.937
+score PDS_NO_FULL_NAME_SPOOFED_URL 0.749
score PDS_SHORT_SPOOFED_URL 1.999
-score PDS_TINYSUBJ_URISHRT 1.499
+score PDS_TINYSUBJ_URISHRT 1.500
score PDS_TONAME_EQ_TOLOCAL_FREEM_FORGE 0.001
-score PHISH_ATTACH 2.300
-score PHP_ORIG_SCRIPT 1.872
-score PHP_SCRIPT 2.500
+score PHISH_ATTACH 2.299
+score PHP_ORIG_SCRIPT 1.878
+score PHP_SCRIPT 2.499
score POSSIBLE_GMAIL_PHISHER 2.799
score PP_MIME_FAKE_ASCII_TEXT 0.001
-score RAND_HEADER_MANY 1.278
+score RAND_HEADER_MANY 1.418
score RAND_MKTG_HEADER 1.999
-score RATWARE_NO_RDNS 0.200
+score RATWARE_NO_RDNS 0.201
score RCVD_IN_MSPIKE_H2 -0.001
score SCC_BODY_SINGLE_WORD 0.001
-score SCC_ISEMM_LID_1B 1.499
+score SCC_ISEMM_LID_1B 1.500
score SENDGRID_REDIR 1.068
score SERGIO_SUBJECT_VIAGRA01 0.001
score SHOPIFY_IMG_NOT_RCVD_SFY 2.499
score SHORT_SHORTNER 1.999
score SPOOFED_FREEMAIL 0.001
score SPOOFED_FREEMAIL_NO_RDNS 0.001
-score SPOOFED_FREEM_REPTO 0.001
-score SPOOF_GMAIL_MID 0.001 # force non-zero
-score STATIC_XPRIO_OLE 1.661
+score SPOOFED_FREEM_REPTO 0.001 # force non-zero
+score SPOOF_GMAIL_MID 0.001
+score STATIC_XPRIO_OLE 1.662
score SUSP_UTF8_WORD_COMBO 2.999
score SUSP_UTF8_WORD_SUBJ 0.001
score THIS_AD 0.899
-score TONOM_EQ_TOLOC_SHRT_SHRTNER 0.149
-score TO_EQ_FM_DIRECT_MX 0.001 # force non-zero
+score TONOM_EQ_TOLOC_SHRT_SHRTNER 0.151
+score TO_EQ_FM_DIRECT_MX 0.001
score TO_EQ_FM_DOM_SPF_FAIL 0.001
-score TO_EQ_FM_HTML_ONLY 1.899
-score TO_EQ_FM_SPF_FAIL 0.001 # force non-zero
+score TO_EQ_FM_SPF_FAIL 0.001
score TO_IN_SUBJ 0.100
score TO_NAME_SUBJ_NO_RDNS 2.999
-score TO_NO_BRKTS_FROM_MSSP 2.314
+score TO_NO_BRKTS_FROM_MSSP 2.428
score TO_NO_BRKTS_HTML_IMG 1.999
score TO_NO_BRKTS_HTML_ONLY 1.999
score TO_NO_BRKTS_MSFT 0.001
-score TO_NO_BRKTS_NORDNS_HTML 2.000
+score TO_NO_BRKTS_NORDNS_HTML 1.999
score TO_NO_BRKTS_PCNT 2.500
score TR_JS_REDIRECTION_0 2.299
-score TVD_PH_SUBJ_META 2.899
+score TVD_PH_SUBJ_META 2.900
score TVD_SPACE_RATIO_MINFP 0.001
score UNDISC_FREEM 2.699
score UNDISC_MONEY 2.699
@@ -184,18 +183,18 @@ score URI_DOTEDU 1.9
score URI_GOOGLE_PROXY 2.599
score URI_MALWARE_BH 0.999
score URI_ONLY_MSGID_MALF 1.999
-score URI_PHISH 3.995
+score URI_PHISH 3.993
score URI_TRY_3LD 1.999
-score URI_WP_HACKED 1.792
+score URI_WP_HACKED 1.649
score URI_WP_HACKED_2 2.499
score VFY_ACCT_NORDNS 0.001
-score WORD_INVIS 1.604
+score WORD_INVIS 1.941
score WORD_INVIS_MANY 2.999
score XFER_LOTSA_MONEY 0.001
-score XM_RANDOM 0.001 # force non-zero
+score XM_RANDOM 0.001
score XPRIO 0.001
-score YOUR_PERMISSION 2.451
-score YOU_INHERIT 1.584
+score YOUR_PERMISSION 2.480
+score YOU_INHERIT 1.519
score AC_POST_EXTRAS 1.000
score AC_SPAMMY_URI_PATTERNS1 1.000
score AC_SPAMMY_URI_PATTERNS10 1.000
@@ -301,7 +300,6 @@ score JH_SPAMMY_PATTERN02 1.0
score LINKEDIN_IMG_NOT_RCVD_LNKN 1.000
score LIST_PRTL_PUMPDUMP 1.000
score LIST_PRTL_SAME_USER 1.000
-score LOTTO_AGENT 1.000
score LUCRATIVE 1.000
score MALF_HTML_B64 1.000
score MIXED_AREA_CASE 1.000
@@ -322,13 +320,11 @@ score ODD_FREEM_REPTO 1.0
score PDS_DBL_URL_TNB_RUNON 1.000
score PDS_HELO_SPF_FAIL 1.000
score PDS_PHPEXP_BOT 1.000
-score PDS_PHP_EVAL 1.000
score PDS_SHORTFWD_URISHRT 1.000
score PDS_TONAME_EQ_TOLOCAL_HDRS_LCASE 1.000
score PHISH_AZURE_CLOUDAPP 3.500
score PHISH_FBASEAPP 1.000
score PHP_NOVER_MUA 1.000
-score PHP_ORIG_SCRIPT_EVAL 1.000
score PHP_SCRIPT_MUA 1.000
score PP_TOO_MUCH_UNICODE02 0.500
score PP_TOO_MUCH_UNICODE05 1.000
Modified: spamassassin/trunk/rulesrc/scores/stats-set0
URL: http://svn.apache.org/viewvc/spamassassin/trunk/rulesrc/scores/stats-set0?rev=1909851&r1=1909850&r2=1909851&view=diff
==============================================================================
--- spamassassin/trunk/rulesrc/scores/stats-set0 (original)
+++ spamassassin/trunk/rulesrc/scores/stats-set0 Tue May 16 02:41:27 2023
@@ -1,40 +1,40 @@
##### WITH NEW RULES AND SCORES #####
# SUMMARY for threshold 5.0:
-# Correctly non-spam: 363697 76.716% (99.414% of non-spam corpus)
-# Correctly spam: 72022 15.192% (66.537% of spam corpus)
-# False positives: 2142 0.452% (0.586% of nonspam, 21137 weighted)
-# False negatives: 36221 7.640% (33.463% of spam, 55252 weighted)
-# Average score for spam: 10.6 nonspam: 0.6
-# Average for false-pos: 6.7 false-neg: 1.5
-# TOTAL: 474082 100.00%
+# Correctly non-spam: 365161 74.633% (99.353% of non-spam corpus)
+# Correctly spam: 78889 16.124% (64.802% of spam corpus)
+# False positives: 2379 0.486% (0.647% of nonspam, 27032 weighted)
+# False negatives: 42849 8.758% (35.198% of spam, 70159 weighted)
+# Average score for spam: 10.5 nonspam: 0.7
+# Average for false-pos: 6.9 false-neg: 1.6
+# TOTAL: 489278 100.00%
Reading scores from "tmprules"...
Reading per-message hit stat logs and scores...
# SUMMARY for threshold 5.0:
-# Correctly non-spam: 45325 99.39%
-# Correctly spam: 9011 65.94%
-# False positives: 279 0.61%
-# False negatives: 4654 34.06%
-# TCR(l=50): 0.734519 SpamRecall: 65.942% SpamPrec: 96.997%
+# Correctly non-spam: 45540 99.44%
+# Correctly spam: 9857 64.45%
+# False positives: 256 0.56%
+# False negatives: 5437 35.55%
+# TCR(l=50): 0.838625 SpamRecall: 64.450% SpamPrec: 97.469%
##### WITHOUT NEW RULES AND SCORES #####
Reading scores from "../rules-base"...
Reading per-message hit stat logs and scores...
# SUMMARY for threshold 5.0:
-# Correctly non-spam: 358096 97.88%
-# Correctly spam: 63428 58.60%
-# False positives: 7743 2.12%
-# False negatives: 44815 41.40%
-# TCR(l=50): 0.250583 SpamRecall: 58.598% SpamPrec: 89.121%
+# Correctly non-spam: 359676 97.86%
+# Correctly spam: 67451 55.41%
+# False positives: 7864 2.14%
+# False negatives: 54287 44.59%
+# TCR(l=50): 0.272048 SpamRecall: 55.407% SpamPrec: 89.559%
Reading scores from "../rules-base"...
Reading per-message hit stat logs and scores...
# SUMMARY for threshold 5.0:
-# Correctly non-spam: 44558 97.71%
-# Correctly spam: 8045 58.87%
-# False positives: 1046 2.29%
-# False negatives: 5620 41.13%
-# TCR(l=50): 0.235929 SpamRecall: 58.873% SpamPrec: 88.494%
+# Correctly non-spam: 44796 97.82%
+# Correctly spam: 8495 55.54%
+# False positives: 1000 2.18%
+# False negatives: 6799 44.46%
+# TCR(l=50): 0.269265 SpamRecall: 55.545% SpamPrec: 89.468%
Modified: spamassassin/trunk/rulesrc/scores/stats-set1
URL: http://svn.apache.org/viewvc/spamassassin/trunk/rulesrc/scores/stats-set1?rev=1909851&r1=1909850&r2=1909851&view=diff
==============================================================================
--- spamassassin/trunk/rulesrc/scores/stats-set1 (original)
+++ spamassassin/trunk/rulesrc/scores/stats-set1 Tue May 16 02:41:27 2023
@@ -1,12 +1,12 @@
##### WITH NEW RULES AND SCORES #####
# SUMMARY for threshold 5.0:
-# Correctly non-spam: 360126 77.840% (99.004% of non-spam corpus)
-# Correctly spam: 65835 14.230% (66.567% of spam corpus)
-# False positives: 3622 0.783% (0.996% of nonspam, 115634 weighted)
-# False negatives: 33065 7.147% (33.433% of spam, 54969 weighted)
-# Average score for spam: 13.8 nonspam: -0.3
-# Average for false-pos: 11.7 false-neg: 1.7
+# Correctly non-spam: 360112 77.837% (99.000% of non-spam corpus)
+# Correctly spam: 66068 14.280% (66.803% of spam corpus)
+# False positives: 3636 0.786% (1.000% of nonspam, 115820 weighted)
+# False negatives: 32832 7.097% (33.197% of spam, 53725 weighted)
+# Average score for spam: 14.0 nonspam: -0.3
+# Average for false-pos: 11.7 false-neg: 1.6
# TOTAL: 462648 100.00%
Reading scores from "tmprules"...
@@ -14,10 +14,10 @@ Reading per-message hit stat logs and sc
# SUMMARY for threshold 5.0:
# Correctly non-spam: 44928 99.08%
-# Correctly spam: 8220 65.85%
+# Correctly spam: 8258 66.15%
# False positives: 417 0.92%
-# False negatives: 4263 34.15%
-# TCR(l=50): 0.497073 SpamRecall: 65.850% SpamPrec: 95.172%
+# False negatives: 4225 33.85%
+# TCR(l=50): 0.497827 SpamRecall: 66.154% SpamPrec: 95.193%
##### WITHOUT NEW RULES AND SCORES #####
Reading scores from "../rules-base"...