You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@spamassassin.apache.org by sp...@apache.org on 2023/05/11 02:40:12 UTC

svn commit: r1909735 [2/2] - in /spamassassin/trunk/rulesrc/scores: 72_scores.cf scores-set0 scores-set1 scores-set2 scores-set3 stats-set0 stats-set1

Modified: spamassassin/trunk/rulesrc/scores/scores-set3
URL: http://svn.apache.org/viewvc/spamassassin/trunk/rulesrc/scores/scores-set3?rev=1909735&r1=1909734&r2=1909735&view=diff
==============================================================================
--- spamassassin/trunk/rulesrc/scores/scores-set3 (original)
+++ spamassassin/trunk/rulesrc/scores/scores-set3 Thu May 11 02:40:12 2023
@@ -1,196 +1,197 @@
 # Using score set 1 logs for revision 1909647 from:
 # ham-net-ena-week0.r1909647.log ham-net-ena-week1.r1909647.log ham-net-ena-week2.r1909647.log ham-net-ena-week3.r1909647.log ham-net-ena-week4.r1909647.log ham-net-giovanni-ham.r1909647.log ham-net-giovanni-spammy.r1909647.log ham-net-giovanni-spam.r1909647.log ham-net-grenier.r1909647.log ham-net-hege.r1909647.log ham-net-jhardin.r1909647.log ham-net-llanga.r1909647.log ham-net-mmiroslaw-mails-ham.r1909647.log ham-net-mmiroslaw-mails-spam.r1909647.log ham-net-spamsponge.r1909647.log ham-net-thendrikx.r1909647.log spam-net-ena-week0.r1909647.log spam-net-ena-week1.r1909647.log spam-net-ena-week2.r1909647.log spam-net-ena-week3.r1909647.log spam-net-ena-week4.r1909647.log spam-net-giovanni-ham.r1909647.log spam-net-giovanni-spammy.r1909647.log spam-net-giovanni-spam.r1909647.log spam-net-grenier.r1909647.log spam-net-hege.r1909647.log spam-net-jhardin.r1909647.log spam-net-llanga.r1909647.log spam-net-mmiroslaw-mails-ham.r1909647.log spam-net-mmiroslaw-mails-spam.r1909647.log spam-net-spamsponge.r1909647.log spam-net-thendrikx.r1909647.log
 
-score ACCT_PHISHING_MANY             3.000
+score ACCT_PHISHING_MANY             2.999
 score AC_BR_BONANZA                  0.001
 score AC_DIV_BONANZA                 0.001
 score AC_FROM_MANY_DOTS              2.999
-score AC_HTML_NONSENSE_TAGS          1.915
+score AC_HTML_NONSENSE_TAGS          1.916
 score ADMITS_SPAM                    0.001
-score ADVANCE_FEE_2_NEW_MONEY        1.999
+score ADVANCE_FEE_2_NEW_MONEY        2.000
 score ADVANCE_FEE_3_NEW              3.499
-score ADVANCE_FEE_3_NEW_FRM_MNY      0.544
+score ADVANCE_FEE_3_NEW_FRM_MNY      0.601
 score ADVANCE_FEE_3_NEW_MONEY        2.299
 score ADVANCE_FEE_4_NEW_FRM_MNY      0.001
-score ADVANCE_FEE_4_NEW_MONEY        2.243
-score ADVANCE_FEE_5_NEW_FRM_MNY      0.892
+score ADVANCE_FEE_4_NEW_MONEY        2.399
+score ADVANCE_FEE_5_NEW_FRM_MNY      1.212
 score ADVANCE_FEE_5_NEW_MONEY        0.001
-score AD_PREFS                       0.469
+score AD_PREFS                       0.430
 score AMAZON_IMG_NOT_RCVD_AMZN       0.001
 score AXB_XMAILER_MIMEOLE_OL_024C2   0.001
 score BITCOIN_DEADLINE               2.999
-score BITCOIN_MALF_HTML              1.483
-score BITCOIN_MALWARE                2.234
+score BITCOIN_MALF_HTML              1.494
+score BITCOIN_MALWARE                1.977
 score BITCOIN_OBFU_SUBJ              1.765
-score BITCOIN_SPAM_02                1.535
+score BITCOIN_SPAM_02                2.303
 score BITCOIN_SPAM_07                3.499
-score BITCOIN_XPRIO                  2.300
-score BITCOIN_YOUR_INFO              2.839
-score BODY_SINGLE_URI                0.465
+score BITCOIN_XPRIO                  2.197
+score BITCOIN_YOUR_INFO              2.532
+score BODY_SINGLE_URI                0.425
 score BODY_SINGLE_WORD               0.001
-score BODY_URI_ONLY                  2.026
+score BODY_URI_ONLY                  2.066
 score CK_HELO_GENERIC                0.249
-score CTE_8BIT_MISMATCH              0.001
-score DATE_IN_FUTURE_Q_PLUS          2.400
-score DEAR_BENEFICIARY               1.666
+score CTE_8BIT_MISMATCH              0.001 # force non-zero
+score DATE_IN_FUTURE_Q_PLUS          2.399
+score DEAR_BENEFICIARY               2.538
 score DKIMWL_WL_HIGH                 -0.001
 score DKIMWL_WL_MED                  -0.001 # force non-zero
 score DKIMWL_WL_MEDHI                -0.001
 score END_FUTURE_EMAILS              2.499
-score FILL_THIS_FORM                 0.599
+score FILL_THIS_FORM                 0.600
 score FONT_INVIS_DIRECT              0.001
 score FONT_INVIS_LONG_LINE           2.999
-score FONT_INVIS_MSGID               0.880
-score FONT_INVIS_POSTEXTRAS          0.914
-score FORGED_SPF_HELO                1.800
+score FONT_INVIS_MSGID               0.911
+score FONT_INVIS_POSTEXTRAS          0.752
+score FORGED_SPF_HELO                1.799
 score FORM_FRAUD                     0.999
 score FORM_FRAUD_5                   0.001
-score FREEMAIL_FORGED_FROMDOMAIN     0.250
+score FREEMAIL_FORGED_FROMDOMAIN     0.249
 score FROM_ADDR_WS                   2.999
-score FROM_FMBLA_NEWDOM14            0.001 # force non-zero
+score FROM_FMBLA_NEWDOM14            0.001
 score FROM_FMBLA_NEWDOM28            0.799
-score FROM_GOV_DKIM_AU               -0.435
+score FROM_GOV_DKIM_AU               -0.206
 score FROM_IN_TO_AND_SUBJ            1.799
-score FROM_MISSPACED                 0.540
-score FROM_MISSP_EH_MATCH            1.853
-score FROM_MISSP_FREEMAIL            2.696
+score FROM_MISSPACED                 0.458
+score FROM_MISSP_EH_MATCH            1.935
+score FROM_MISSP_FREEMAIL            2.614
 score FROM_MISSP_MSFT                0.001
-score FROM_MISSP_REPLYTO             2.143
-score FROM_MISSP_SPF_FAIL            0.001
+score FROM_MISSP_REPLYTO             2.146
+score FROM_MISSP_SPF_FAIL            0.001 # force non-zero
 score FROM_MISSP_USER                0.001
-score FROM_PAYPAL_SPOOF              0.001
-score FROM_SUSPICIOUS_NTLD           0.191
-score FROM_SUSPICIOUS_NTLD_FP        2.000
+score FROM_PAYPAL_SPOOF              0.965
+score FROM_SUSPICIOUS_NTLD           0.190
+score FROM_SUSPICIOUS_NTLD_FP        1.999
 score FSL_BULK_SIG                   0.001
 score FSL_CTYPE_WIN1251              0.001
-score FSL_NEW_HELO_USER              0.001
-score FUZZY_AMAZON                   0.001
+score FSL_NEW_HELO_USER              0.001 # force non-zero
+score FUZZY_AMAZON                   0.001 # force non-zero
 score GB_CUSTOM_HTM_URI              0.835
-score GB_FAKE_RF_SHORT               1.999
+score GB_FAKE_RF_SHORT               2.000
 score GB_FREEMAIL_DISPTO             0.001
-score GB_GOOGLE_TRANSL               0.589
-score GB_HASHBL_BTC                  4.902
+score GB_GOOGLE_TRANSL               0.587
+score GB_HASHBL_BTC                  4.699
 score GOOG_REDIR_HTML_ONLY           1.999
 score GOOG_REDIR_NORDNS              2.899
-score GOOG_STO_NOIMG_HTML            2.950
-score HAS_X_OUTGOING_SPAM_STAT       0.794
-score HDRS_MISSP                     0.778
+score GOOG_STO_NOIMG_HTML            2.946
+score HAS_X_OUTGOING_SPAM_STAT       0.797
+score HDRS_MISSP                     0.768
 score HDR_ORDER_FTSDMCXX_DIRECT      0.001
-score HDR_ORDER_FTSDMCXX_NORDNS      0.001 # force non-zero
-score HEADER_FROM_DIFFERENT_DOMAINS  0.249
-score HELO_NO_DOMAIN                 0.001
+score HDR_ORDER_FTSDMCXX_NORDNS      0.001
+score HEADER_FROM_DIFFERENT_DOMAINS  0.250
+score HELO_NO_DOMAIN                 0.006
 score HK_NAME_MR_MRS                 0.999
 score HK_RANDOM_ENVFROM              0.001
 score HK_RANDOM_FROM                 0.001
 score HK_RANDOM_REPLYTO              0.999
-score HK_SCAM                        0.416
+score HK_SCAM                        0.428
 score HOSTED_IMG_DIRECT_MX           0.001
-score HOSTED_IMG_FREEM               2.088
+score HOSTED_IMG_FREEM               2.079
 score HTML_FONT_TINY_NORDNS          0.001
 score HTML_OFF_PAGE                  0.001
-score HTML_TAG_BALANCE_CENTER        2.521
-score HTML_TEXT_INVISIBLE_FONT       1.500
-score HTML_TEXT_INVISIBLE_STYLE      0.001 # force non-zero
-score JH_SPAMMY_HEADERS              3.499
+score HTML_TAG_BALANCE_CENTER        2.494
+score HTML_TEXT_INVISIBLE_FONT       1.514
+score HTML_TEXT_INVISIBLE_STYLE      0.001
+score JH_SPAMMY_HEADERS              3.500
 score KHOP_HELO_FCRDNS               0.001
-score LONG_HEX_URI                   2.999
-score LONG_IMG_URI                   0.001 # force non-zero
-score LONG_INVISIBLE_TEXT            1.826
+score LONG_HEX_URI                   3.000
+score LONG_IMG_URI                   0.001
+score LONG_INVISIBLE_TEXT            1.827
 score LOTS_OF_MONEY                  0.010
-score MALWARE_NORDNS                 0.776
-score MALWARE_PASSWORD               0.428
+score MALWARE_NORDNS                 3.238
+score MALWARE_PASSWORD               1.251
 score MANY_SPAN_IN_TEXT              2.199
 score MILLION_HUNDRED                0.001
-score MILLION_USD                    1.999
-score MIMEOLE_DIRECT_TO_MX           0.001
+score MILLION_USD                    1.046
+score MIMEOLE_DIRECT_TO_MX           0.001 # force non-zero
 score MIME_NO_TEXT                   1.999
-score MIXED_CENTER_CASE              2.492
-score MIXED_ES                       0.772
-score MIXED_HREF_CASE                0.690
-score MONEY_ATM_CARD                 0.001
+score MIXED_CENTER_CASE              2.218
+score MIXED_ES                       0.768
+score MIXED_HREF_CASE                1.790
+score MONEY_ATM_CARD                 1.874
 score MONEY_FORM                     0.001
 score MONEY_FORM_SHORT               0.001
 score MONEY_FRAUD_3                  0.001
-score MONEY_FRAUD_5                  2.263
-score MONEY_FRAUD_8                  0.012
-score MONEY_FREEMAIL_REPTO           2.132
+score MONEY_FRAUD_5                  2.261
+score MONEY_FRAUD_8                  0.001
+score MONEY_FREEMAIL_REPTO           2.136
 score MONEY_FROM_MISSP               0.001
-score MSMAIL_PRI_ABNORMAL            1.280
+score MSMAIL_PRI_ABNORMAL            0.302
 score NA_DOLLARS                     0.495
-score NICE_REPLY_A                   -3.251
+score NICE_REPLY_A                   -2.124
 score NO_FM_NAME_IP_HOSTN            0.001
 score NSL_RCVD_FROM_USER             0.001
-score NSL_RCVD_HELO_USER             0.001
-score OBFU_TEXT_ATTACH               0.935
-score PDS_BAD_THREAD_QP_64           1.000
-score PDS_BTC_ID                     0.001
-score PDS_BTC_MSGID                  0.438
-score PDS_EMPTYSUBJ_URISHRT          0.783
-score PDS_FRNOM_TODOM_DBL_URL        1.499
+score NSL_RCVD_HELO_USER             0.001 # force non-zero
+score OBFU_TEXT_ATTACH               0.540
+score PDS_BAD_THREAD_QP_64           0.999
+score PDS_BTC_ID                     0.203
+score PDS_BTC_MSGID                  0.999
+score PDS_EMPTYSUBJ_URISHRT          0.824
+score PDS_FRNOM_TODOM_DBL_URL        1.421
 score PDS_FRNOM_TODOM_NAKED_TO       1.499
-score PDS_FROM_2_EMAILS_SHRTNER      1.312
+score PDS_FROM_2_EMAILS_SHRTNER      1.177
 score PDS_FROM_NAME_TO_DOMAIN        1.999
-score PDS_HELO_SPF_FAIL              0.001
+score PDS_HELO_SPF_FAIL              1.069
 score PDS_NO_FULL_NAME_SPOOFED_URL   0.749
 score PDS_SHORT_SPOOFED_URL          1.999
 score PDS_TINYSUBJ_URISHRT           1.499
 score PDS_TONAME_EQ_TOLOCAL_FREEM_FORGE 0.001
-score PHP_SCRIPT                     2.499
+score PHP_SCRIPT                     2.500
 score POSSIBLE_AMAZON_PHISH_02       2.299
-score POSSIBLE_GMAIL_PHISHER         1.590
+score POSSIBLE_GMAIL_PHISHER         2.238
 score PP_MIME_FAKE_ASCII_TEXT        0.001
-score RAND_HEADER_MANY               1.969
-score RAND_MKTG_HEADER               1.999
+score RAND_HEADER_MANY               1.966
+score RAND_MKTG_HEADER               2.000
 score RATWARE_NO_RDNS                0.001
 score RCVD_IN_MSPIKE_H2              -0.001 # force non-zero
-score SCC_BODY_SINGLE_WORD           0.001
+score SCC_BODY_SINGLE_WORD           0.001 # force non-zero
 score SCC_ISEMM_LID_1B               1.499
-score SENDGRID_REDIR                 0.790
+score SENDGRID_REDIR                 0.789
 score SERGIO_SUBJECT_VIAGRA01        0.001
 score SHOPIFY_IMG_NOT_RCVD_SFY       2.499
 score SHORT_SHORTNER                 1.999
 score SPOOFED_FREEMAIL               0.001 # force non-zero
 score SPOOFED_FREEMAIL_NO_RDNS       0.001
-score SPOOFED_FREEM_REPTO            0.001 # force non-zero
+score SPOOFED_FREEM_REPTO            0.001
 score SPOOF_GMAIL_MID                0.001
-score STATIC_XPRIO_OLE               1.861
-score STOX_BOUND_090909_B            3.202
-score SUSP_UTF8_WORD_COMBO           1.464
-score SUSP_UTF8_WORD_SUBJ            1.899
+score STATIC_XPRIO_OLE               1.862
+score STOX_BOUND_090909_B            1.877
+score SUSP_UTF8_WORD_COMBO           1.458
+score SUSP_UTF8_WORD_SUBJ            1.900
 score THIS_AD                        0.799
-score TONOM_EQ_TOLOC_SHRT_SHRTNER    0.401
-score TO_EQ_FM_DIRECT_MX             0.254
+score TONOM_EQ_TOLOC_SHRT_SHRTNER    0.396
+score TO_EQ_FM_DIRECT_MX             0.246
+score TO_EQ_FM_DOM_HTML_ONLY         1.823
 score TO_EQ_FM_DOM_SPF_FAIL          0.001
 score TO_EQ_FM_SPF_FAIL              0.001
 score TO_IN_SUBJ                     0.099
 score TO_NAME_SUBJ_NO_RDNS           2.999
-score TO_NO_BRKTS_FROM_MSSP          2.500
+score TO_NO_BRKTS_FROM_MSSP          2.499
 score TO_NO_BRKTS_HTML_IMG           1.999
 score TO_NO_BRKTS_HTML_ONLY          1.999
 score TO_NO_BRKTS_MSFT               0.001
-score TO_NO_BRKTS_NORDNS_HTML        1.822
+score TO_NO_BRKTS_NORDNS_HTML        1.824
 score TO_NO_BRKTS_PCNT               2.499
 score TR_JS_REDIRECTION_0            2.199
 score TVD_SPACE_ENCODED              0.001
-score TVD_SPACE_RATIO_MINFP          0.001
+score TVD_SPACE_RATIO_MINFP          0.001 # force non-zero
 score UNDISC_FREEM                   2.699
 score UNDISC_MONEY                   2.899
 score UNICODE_OBFU_ASC               2.499
 score URI_DOTEDU                     1.999
-score URI_GOOGLE_PROXY               2.400
+score URI_GOOGLE_PROXY               2.399
 score URI_MALWARE_BH                 0.999
-score URI_ONLY_MSGID_MALF            0.419
-score URI_PHISH                      3.797
+score URI_ONLY_MSGID_MALF            1.243
+score URI_PHISH                      3.625
 score URI_TRY_3LD                    1.999
-score URI_WP_HACKED                  0.769
-score URI_WP_HACKED_2                2.499
+score URI_WP_HACKED                  0.770
+score URI_WP_HACKED_2                2.500
 score VFY_ACCT_NORDNS                0.001
-score WORD_INVIS                     0.809
+score WORD_INVIS                     0.807
 score WORD_INVIS_MANY                2.999
 score XFER_LOTSA_MONEY               0.001 # force non-zero
 score XM_RANDOM                      0.001
 score XPRIO                          0.001
-score YOU_INHERIT                    1.682
+score YOU_INHERIT                    0.266
 score AC_POST_EXTRAS                 1.000
 score AC_SPAMMY_URI_PATTERNS1        1.000
 score AC_SPAMMY_URI_PATTERNS10       1.000
@@ -280,6 +281,7 @@ score GOOG_STO_HTML_PHISH_MANY       1.0
 score GOOG_STO_IMG_HTML              1.000
 score GOOG_STO_IMG_NOHTML            1.000
 score HAS_X_NO_RELAY                 1.000
+score HDRS_LCASE                     0.100
 score HEXHASH_WORD                   1.000
 score HK_CTE_RAW                     1.000
 score HK_LOTTO                       1.000

Modified: spamassassin/trunk/rulesrc/scores/stats-set0
URL: http://svn.apache.org/viewvc/spamassassin/trunk/rulesrc/scores/stats-set0?rev=1909735&r1=1909734&r2=1909735&view=diff
==============================================================================
--- spamassassin/trunk/rulesrc/scores/stats-set0 (original)
+++ spamassassin/trunk/rulesrc/scores/stats-set0 Thu May 11 02:40:12 2023
@@ -1,40 +1,40 @@
 ##### WITH NEW RULES AND SCORES #####
 
 # SUMMARY for threshold 5.0:
-# Correctly non-spam: 341130  80.292%  (99.361% of non-spam corpus)
-# Correctly spam:      48245  11.355%  (59.168% of spam corpus)
-# False positives:      2194  0.516%  (0.639% of nonspam,  17170 weighted)
-# False negatives:     33294  7.836%  (40.832% of spam,  51688 weighted)
-# Average score for spam:  9.4    nonspam: 0.5
-# Average for false-pos:   6.6  false-neg: 1.6
-# TOTAL:              424863  100.00%
+# Correctly non-spam: 346810  80.594%  (99.391% of non-spam corpus)
+# Correctly spam:      49033  11.395%  (60.251% of spam corpus)
+# False positives:      2126  0.494%  (0.609% of nonspam,  16574 weighted)
+# False negatives:     32348  7.517%  (39.749% of spam,  48728 weighted)
+# Average score for spam:  9.3    nonspam: 0.7
+# Average for false-pos:   6.7  false-neg: 1.5
+# TOTAL:              430317  100.00%
 
 Reading scores from "tmprules"...
 Reading per-message hit stat logs and scores...
 
 # SUMMARY for threshold 5.0:
-# Correctly non-spam:  42557  99.43%
-# Correctly spam:       5969  57.95%
-# False positives:       246  0.57%
-# False negatives:      4332  42.05%
-# TCR(l=50): 0.619348  SpamRecall: 57.946%  SpamPrec: 96.042%
+# Correctly non-spam:  43222  99.38%
+# Correctly spam:       6130  59.64%
+# False positives:       269  0.62%
+# False negatives:      4148  40.36%
+# TCR(l=50): 0.584044  SpamRecall: 59.642%  SpamPrec: 95.796%
 
 ##### WITHOUT NEW RULES AND SCORES #####
 Reading scores from "../rules-base"...
 Reading per-message hit stat logs and scores...
 
 # SUMMARY for threshold 5.0:
-# Correctly non-spam: 335958  97.85%
-# Correctly spam:      45323  55.58%
-# False positives:      7366  2.15%
-# False negatives:     36216  44.42%
-# TCR(l=50): 0.201572  SpamRecall: 55.584%  SpamPrec: 86.020%
+# Correctly non-spam: 341485  97.86%
+# Correctly spam:      46616  57.28%
+# False positives:      7451  2.14%
+# False negatives:     34765  42.72%
+# TCR(l=50): 0.199799  SpamRecall: 57.281%  SpamPrec: 86.219%
 Reading scores from "../rules-base"...
 Reading per-message hit stat logs and scores...
 
 # SUMMARY for threshold 5.0:
-# Correctly non-spam:  41898  97.89%
-# Correctly spam:       5734  55.66%
-# False positives:       905  2.11%
-# False negatives:      4567  44.34%
-# TCR(l=50): 0.206777  SpamRecall: 55.664%  SpamPrec: 86.368%
+# Correctly non-spam:  42552  97.84%
+# Correctly spam:       5925  57.65%
+# False positives:       939  2.16%
+# False negatives:      4353  42.35%
+# TCR(l=50): 0.200339  SpamRecall: 57.647%  SpamPrec: 86.320%

Modified: spamassassin/trunk/rulesrc/scores/stats-set1
URL: http://svn.apache.org/viewvc/spamassassin/trunk/rulesrc/scores/stats-set1?rev=1909735&r1=1909734&r2=1909735&view=diff
==============================================================================
--- spamassassin/trunk/rulesrc/scores/stats-set1 (original)
+++ spamassassin/trunk/rulesrc/scores/stats-set1 Thu May 11 02:40:12 2023
@@ -1,23 +1,23 @@
 ##### WITH NEW RULES AND SCORES #####
 
 # SUMMARY for threshold 5.0:
-# Correctly non-spam: 312576  77.843%  (98.900% of non-spam corpus)
-# Correctly spam:      56636  14.104%  (66.245% of spam corpus)
-# False positives:      3475  0.865%  (1.100% of nonspam, 107565 weighted)
-# False negatives:     28859  7.187%  (33.755% of spam,  50396 weighted)
-# Average score for spam:  13.5    nonspam: -0.4
-# Average for false-pos:   11.4  false-neg: 1.7
+# Correctly non-spam: 312603  77.850%  (98.909% of non-spam corpus)
+# Correctly spam:      56675  14.114%  (66.290% of spam corpus)
+# False positives:      3448  0.859%  (1.091% of nonspam, 107224 weighted)
+# False negatives:     28820  7.177%  (33.710% of spam,  50279 weighted)
+# Average score for spam:  13.1    nonspam: -0.3
+# Average for false-pos:   11.5  false-neg: 1.7
 # TOTAL:              401546  100.00%
 
 Reading scores from "tmprules"...
 Reading per-message hit stat logs and scores...
 
 # SUMMARY for threshold 5.0:
-# Correctly non-spam:  38979  98.89%
-# Correctly spam:       7112  65.96%
-# False positives:       436  1.11%
-# False negatives:      3670  34.04%
-# TCR(l=50): 0.423322  SpamRecall: 65.962%  SpamPrec: 94.224%
+# Correctly non-spam:  38978  98.89%
+# Correctly spam:       7116  66.00%
+# False positives:       437  1.11%
+# False negatives:      3666  34.00%
+# TCR(l=50): 0.422558  SpamRecall: 65.999%  SpamPrec: 94.214%
 
 ##### WITHOUT NEW RULES AND SCORES #####
 Reading scores from "../rules-base"...