You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@spamassassin.apache.org by sp...@apache.org on 2023/02/03 02:40:09 UTC

svn commit: r1907229 [2/2] - in /spamassassin/trunk/rulesrc/scores: 72_scores.cf scores-set0 scores-set1 scores-set2 scores-set3 stats-set0 stats-set1

Modified: spamassassin/trunk/rulesrc/scores/scores-set3
URL: http://svn.apache.org/viewvc/spamassassin/trunk/rulesrc/scores/scores-set3?rev=1907229&r1=1907228&r2=1907229&view=diff
==============================================================================
--- spamassassin/trunk/rulesrc/scores/scores-set3 (original)
+++ spamassassin/trunk/rulesrc/scores/scores-set3 Fri Feb  3 02:40:09 2023
@@ -3,180 +3,181 @@
 
 score AC_BR_BONANZA                  0.001
 score AC_DIV_BONANZA                 0.001
-score AC_FROM_MANY_DOTS              2.707
+score AC_FROM_MANY_DOTS              1.804
 score AC_HTML_NONSENSE_TAGS          1.999
-score ADMITS_SPAM                    0.001
-score ADVANCE_FEE_2_NEW_FRM_MNY      1.507
+score ADMITS_SPAM                    0.001 # force non-zero
+score ADVANCE_FEE_2_NEW_FRM_MNY      2.022
 score ADVANCE_FEE_2_NEW_MONEY        1.999
 score ADVANCE_FEE_3_NEW              3.499
-score ADVANCE_FEE_3_NEW_MONEY        2.291
+score ADVANCE_FEE_3_NEW_MONEY        2.345
 score ADVANCE_FEE_4_NEW              2.599
-score ADVANCE_FEE_4_NEW_FRM_MNY      0.552
-score ADVANCE_FEE_4_NEW_MONEY        1.582
+score ADVANCE_FEE_4_NEW_FRM_MNY      0.001
+score ADVANCE_FEE_4_NEW_MONEY        1.739
 score ADVANCE_FEE_5_NEW_FRM_MNY      0.001
-score ADVANCE_FEE_5_NEW_MONEY        0.749
-score AD_PREFS                       0.415
+score ADVANCE_FEE_5_NEW_MONEY        0.934
+score AD_PREFS                       0.390
 score AMAZON_IMG_NOT_RCVD_AMZN       0.001
 score AXB_XMAILER_MIMEOLE_OL_024C2   0.001 # force non-zero
-score BIGNUM_EMAILS_FREEM            2.127
-score BIGNUM_EMAILS_MANY             3.000
+score BIGNUM_EMAILS_FREEM            2.810
+score BIGNUM_EMAILS_MANY             2.999
 score BITCOIN_DEADLINE               2.517
-score BITCOIN_EXTORT_01              1.645
-score BITCOIN_MALF_HTML              1.491
-score BITCOIN_MALWARE                2.483
-score BITCOIN_OBFU_SUBJ              0.973
-score BITCOIN_SPAM_02                1.454
-score BITCOIN_SPAM_05                0.915
+score BITCOIN_EXTORT_01              1.355
+score BITCOIN_MALF_HTML              0.730
+score BITCOIN_MALWARE                1.866
+score BITCOIN_OBFU_SUBJ              0.088
+score BITCOIN_SPAM_02                1.397
+score BITCOIN_SPAM_05                1.461
 score BITCOIN_SPAM_09                1.499
-score BITCOIN_XPRIO                  0.575
+score BITCOIN_XPRIO                  0.001
 score BITCOIN_YOUR_INFO              2.999
-score BODY_URI_ONLY                  2.378
-score CK_HELO_GENERIC                0.249
+score BODY_URI_ONLY                  2.379
+score CK_HELO_GENERIC                0.250
 score CONTENT_AFTER_HTML_WEAK        1.499
 score CTE_8BIT_MISMATCH              0.001
-score DEAR_BENEFICIARY               1.200
-score DEAR_EMAIL_USER                1.997
-score DKIMWL_WL_HIGH                 -0.001
-score DKIMWL_WL_MED                  -0.001
+score DEAR_BENEFICIARY               1.201
+score DEAR_EMAIL_USER                1.830
+score DKIMWL_WL_HIGH                 -0.001 # force non-zero
+score DKIMWL_WL_MED                  -0.001 # force non-zero
 score DKIMWL_WL_MEDHI                -0.001
 score DX_TEXT_03                     1.799
 score ENCRYPTED_MESSAGE              -0.999
 score END_FUTURE_EMAILS              2.499
 score FILL_THIS_FORM                 0.001
-score FONT_INVIS_DIRECT              0.001
+score FONT_INVIS_DIRECT              0.001 # force non-zero
 score FONT_INVIS_LONG_LINE           2.999
-score FONT_INVIS_MSGID               2.202
+score FONT_INVIS_MSGID               2.066
 score FONT_INVIS_POSTEXTRAS          0.001
-score FORGED_SPF_HELO                1.355
+score FORGED_SPF_HELO                1.354
 score FORM_FRAUD                     1.000
-score FORM_FRAUD_3                   1.347
-score FORM_FRAUD_5                   0.673
-score FREEMAIL_FORGED_FROMDOMAIN     0.250
-score FROM_2_EMAILS_SHORT            2.452
-score FROM_ADDR_WS                   3.000
+score FORM_FRAUD_3                   2.015
+score FORM_FRAUD_5                   1.539
+score FREEMAIL_FORGED_FROMDOMAIN     0.249
+score FROM_2_EMAILS_SHORT            2.397
+score FROM_ADDR_WS                   2.999
 score FROM_FMBLA_NEWDOM              0.001
 score FROM_FMBLA_NEWDOM28            0.799
 score FROM_GOV_DKIM_AU               -0.999
 score FROM_MISSP_EH_MATCH            1.999
-score FROM_MISSP_REPLYTO             0.001 # force non-zero
+score FROM_MISSP_REPLYTO             0.001
 score FROM_MISSP_SPF_FAIL            1.999
-score FROM_MULTI_NORDNS              0.713
-score FROM_PAYPAL_SPOOF              0.937
-score FROM_SUSPICIOUS_NTLD           0.500
-score FROM_SUSPICIOUS_NTLD_FP        1.999
-score FSL_BULK_SIG                   0.001
+score FROM_MULTI_NORDNS              0.067
+score FROM_PAYPAL_SPOOF              0.854
+score FROM_SUSPICIOUS_NTLD           0.499
+score FROM_SUSPICIOUS_NTLD_FP        2.000
+score FSL_BULK_SIG                   0.001 # force non-zero
 score FSL_NEW_HELO_USER              0.001
 score FUZZY_AMAZON                   0.001
-score FUZZY_CLICK_HERE               2.228
+score FUZZY_CLICK_HERE               2.978
 score FUZZY_UNSUBSCRIBE              3.099
-score GB_CUSTOM_HTM_URI              0.392
-score GB_FAKE_RF_SHORT               0.826
-score GB_FREEMAIL_DISPTO             0.001 # force non-zero
-score GB_HASHBL_BTC                  2.019
+score GB_CUSTOM_HTM_URI              0.037
+score GB_FAKE_RF_SHORT               0.820
+score GB_FREEMAIL_DISPTO             0.001
+score GB_HASHBL_BTC                  2.494
 score GOOG_REDIR_NORDNS              2.799
-score GOOG_STO_IMG_HTML              1.883
-score GOOG_STO_NOIMG_HTML            2.949
-score HAS_X_OUTGOING_SPAM_STAT       0.795
-score HDRS_LCASE_IMGONLY             0.099
-score HDRS_MISSP                     1.400
+score GOOG_STO_IMG_HTML              2.702
+score GOOG_STO_NOIMG_HTML            2.950
+score HAS_X_OUTGOING_SPAM_STAT       0.796
+score HDRS_LCASE_IMGONLY             0.100
+score HDRS_MISSP                     1.397
 score HDR_ORDER_FTSDMCXX_DIRECT      0.001
-score HDR_ORDER_FTSDMCXX_NORDNS      0.001
+score HDR_ORDER_FTSDMCXX_NORDNS      0.001 # force non-zero
 score HEADER_FROM_DIFFERENT_DOMAINS  0.250
-score HELO_NO_DOMAIN                 0.001
+score HELO_NO_DOMAIN                 0.001 # force non-zero
 score HK_LOTTO                       0.999
 score HK_RANDOM_ENVFROM              0.001
-score HK_RANDOM_FROM                 1.000
-score HK_RANDOM_REPLYTO              0.999
+score HK_RANDOM_FROM                 0.999
+score HK_RANDOM_REPLYTO              1.000
 score HK_SCAM                        1.999
-score HOSTED_IMG_DIRECT_MX           0.001 # force non-zero
-score HOSTED_IMG_FREEM               2.188
+score HOSTED_IMG_DIRECT_MX           0.001
+score HOSTED_IMG_FREEM               2.192
 score HOSTED_IMG_MULTI_PUB_01        2.999
 score HTML_OFF_PAGE                  0.001
 score HTML_TAG_BALANCE_CENTER        3.599
-score HTML_TEXT_INVISIBLE_FONT       0.250
-score HTML_TEXT_INVISIBLE_STYLE      2.801
+score HTML_TEXT_INVISIBLE_FONT       0.386
+score HTML_TEXT_INVISIBLE_STYLE      2.802
 score JH_SPAMMY_HEADERS              3.499
-score KHOP_HELO_FCRDNS               0.001 # force non-zero
-score LONG_HEX_URI                   2.658
+score KHOP_HELO_FCRDNS               0.001
+score LONG_HEX_URI                   2.666
 score LONG_IMG_URI                   0.001
 score LONG_INVISIBLE_TEXT            2.999
 score LOTS_OF_MONEY                  0.010
-score MALWARE_NORDNS                 0.307
+score MALWARE_NORDNS                 0.673
 score MILLION_HUNDRED                2.599
-score MILLION_USD                    1.031
+score MILLION_USD                    0.853
 score MIMEOLE_DIRECT_TO_MX           0.001
-score MIXED_HREF_CASE                0.047
-score MONEY_ATM_CARD                 2.479
+score MIXED_HREF_CASE                1.999
+score MONEY_ATM_CARD                 1.835
 score MONEY_FORM                     0.331
 score MONEY_FORM_SHORT               2.499
 score MONEY_FRAUD_3                  0.001
-score MONEY_FRAUD_5                  2.621
+score MONEY_FRAUD_5                  2.463
 score MONEY_FRAUD_8                  0.001
 score MONEY_FREEMAIL_REPTO           0.001
-score MSMAIL_PRI_ABNORMAL            1.499
+score MSMAIL_PRI_ABNORMAL            1.411
 score NA_DOLLARS                     1.499
 score NICE_REPLY_A                   -0.090
-score NO_FM_NAME_IP_HOSTN            0.001 # force non-zero
+score NO_FM_NAME_IP_HOSTN            0.001
 score NSL_RCVD_HELO_USER             0.001
-score NUMBERONLY_BITCOIN_EXP         1.230
-score OBFU_TEXT_ATTACH               1.368
-score ODD_FREEM_REPTO                2.707
+score NUMBERONLY_BITCOIN_EXP         0.465
+score OBFU_TEXT_ATTACH               0.847
+score ODD_FREEM_REPTO                2.655
 score PDS_BAD_THREAD_QP_64           0.001
-score PDS_BTC_ID                     0.212
+score PDS_BTC_ID                     0.499
 score PDS_BTC_MSGID                  0.001
 score PDS_FROM_2_EMAILS              0.001
 score PDS_HELO_SPF_FAIL              1.999
-score PDS_NAKED_TO_NUMERO            2.000
+score PDS_NAKED_TO_NUMERO            1.999
 score PDS_RDNS_DYNAMIC_FP            0.001 # force non-zero
-score PDS_SHORT_SPOOFED_URL          2.000
+score PDS_SHORT_SPOOFED_URL          1.999
 score PDS_TONAME_EQ_TOLOCAL_FREEM_FORGE 1.347
 score PHP_ORIG_SCRIPT                0.001
-score PHP_SCRIPT                     2.499
+score PHP_SCRIPT                     2.500
 score PP_MIME_FAKE_ASCII_TEXT        0.001
 score RAND_MKTG_HEADER               1.999
-score RATWARE_NO_RDNS                1.850
+score RATWARE_NO_RDNS                2.911
 score RCVD_IN_MSPIKE_H2              -0.001
-score RDNS_NUM_TLD_XM                1.286
+score RDNS_NUM_TLD_XM                2.091
 score REPTO_419_FRAUD                2.999
-score SCC_CANSPAM_1                  2.299
+score SCC_CANSPAM_1                  2.300
 score SCC_ISEMM_LID_1B               0.001
-score SENDGRID_REDIR                 1.063
-score SERGIO_SUBJECT_VIAGRA01        3.341
+score SENDGRID_REDIR                 1.068
+score SERGIO_SUBJECT_VIAGRA01        3.144
 score SHOPIFY_IMG_NOT_RCVD_SFY       2.499
-score SHORTENED_URL_SRC              0.621
+score SHORTENED_URL_SRC              0.591
 score SPOOFED_FREEMAIL               0.001
-score SPOOFED_FREEMAIL_NO_RDNS       0.001
+score SPOOFED_FREEMAIL_NO_RDNS       0.001 # force non-zero
 score SPOOF_GMAIL_MID                0.001
-score STATIC_XPRIO_OLE               0.001
-score SUSP_UTF8_WORD_COMBO           1.469
-score SUSP_UTF8_WORD_MANY            1.999
+score STATIC_XPRIO_OLE               0.001 # force non-zero
+score SUSP_UTF8_WORD_COMBO           1.368
+score SUSP_UTF8_WORD_MANY            2.099
 score SUSP_UTF8_WORD_SUBJ            1.999
-score THIS_AD                        0.999
+score THIS_AD                        1.000
 score TO_EQ_FM_DOM_SPF_FAIL          0.001
 score TO_EQ_FM_SPF_FAIL              0.001
-score TO_NAME_SUBJ_NO_RDNS           2.999
+score TO_NAME_SUBJ_NO_RDNS           3.000
 score TO_NO_BRKTS_HTML_IMG           1.999
 score TO_NO_BRKTS_HTML_ONLY          1.999
 score TO_NO_BRKTS_MSFT               0.001
 score TO_NO_BRKTS_NORDNS_HTML        1.999
 score TO_NO_BRKTS_PCNT               2.499
-score TVD_ENHANCE                    2.036
-score TVD_IP_HEX                     1.538
-score TVD_IP_OCT                     2.340
+score TVD_ENHANCE                    1.083
+score TVD_IP_HEX                     2.416
+score TVD_IP_OCT                     2.383
 score TVD_PH_BODY_META               0.001
+score TVD_SPACE_ENCODED              0.001
 score UNDISC_FREEM                   2.899
 score UNDISC_MONEY                   3.299
 score URI_DOTEDU                     1.999
 score URI_GOOGLE_PROXY               1.999
 score URI_ONLY_MSGID_MALF            0.001
-score URI_PHISH                      3.701
+score URI_PHISH                      3.628
 score URI_TRY_3LD                    1.167
-score URI_WP_DIRINDEX                3.276
-score URI_WP_HACKED                  3.500
+score URI_WP_DIRINDEX                3.031
+score URI_WP_HACKED                  3.499
 score URI_WP_HACKED_2                2.499
 score VFY_ACCT_NORDNS                2.999
 score WORD_INVIS                     0.001
-score WORD_INVIS_MANY                2.999
+score WORD_INVIS_MANY                3.000
 score XFER_LOTSA_MONEY               0.999
 score XM_RANDOM                      0.001
 score XM_RECPTID                     2.999
@@ -284,7 +285,6 @@ score LOTTO_AGENT                    1.0
 score LUCRATIVE                      1.000
 score MALF_HTML_B64                  1.000
 score MALWARE_PASSWORD               1.000
-score MANY_HDRS_LCASE                0.100
 score MIME_NO_TEXT                   1.000
 score MIXED_AREA_CASE                1.000
 score MIXED_CENTER_CASE              1.000

Modified: spamassassin/trunk/rulesrc/scores/stats-set0
URL: http://svn.apache.org/viewvc/spamassassin/trunk/rulesrc/scores/stats-set0?rev=1907229&r1=1907228&r2=1907229&view=diff
==============================================================================
--- spamassassin/trunk/rulesrc/scores/stats-set0 (original)
+++ spamassassin/trunk/rulesrc/scores/stats-set0 Fri Feb  3 02:40:09 2023
@@ -1,40 +1,40 @@
 ##### WITH NEW RULES AND SCORES #####
 
 # SUMMARY for threshold 5.0:
-# Correctly non-spam: 289201  76.158%  (99.436% of non-spam corpus)
-# Correctly spam:      56289  14.823%  (63.321% of spam corpus)
-# False positives:      1641  0.432%  (0.564% of nonspam,  16142 weighted)
-# False negatives:     32605  8.586%  (36.679% of spam,  41869 weighted)
-# Average score for spam:  9.7    nonspam: 0.7
-# Average for false-pos:   6.4  false-neg: 1.3
-# TOTAL:              379736  100.00%
+# Correctly non-spam: 292444  76.206%  (99.452% of non-spam corpus)
+# Correctly spam:      56385  14.693%  (62.860% of spam corpus)
+# False positives:      1611  0.420%  (0.548% of nonspam,  17538 weighted)
+# False negatives:     33315  8.681%  (37.140% of spam,  43451 weighted)
+# Average score for spam:  9.5    nonspam: 0.7
+# Average for false-pos:   7.1  false-neg: 1.3
+# TOTAL:              383755  100.00%
 
 Reading scores from "tmprules"...
 Reading per-message hit stat logs and scores...
 
 # SUMMARY for threshold 5.0:
-# Correctly non-spam:  36131  99.43%
-# Correctly spam:       7167  63.79%
-# False positives:       207  0.57%
-# False negatives:      4069  36.21%
-# TCR(l=50): 0.779250  SpamRecall: 63.786%  SpamPrec: 97.193%
+# Correctly non-spam:  36504  99.43%
+# Correctly spam:       7131  62.89%
+# False positives:       211  0.57%
+# False negatives:      4207  37.11%
+# TCR(l=50): 0.768313  SpamRecall: 62.895%  SpamPrec: 97.126%
 
 ##### WITHOUT NEW RULES AND SCORES #####
 Reading scores from "../rules-base"...
 Reading per-message hit stat logs and scores...
 
 # SUMMARY for threshold 5.0:
-# Correctly non-spam: 283247  97.39%
-# Correctly spam:      46813  52.66%
-# False positives:      7595  2.61%
-# False negatives:     42081  47.34%
-# TCR(l=50): 0.210734  SpamRecall: 52.662%  SpamPrec: 86.041%
+# Correctly non-spam: 286465  97.42%
+# Correctly spam:      45725  50.98%
+# False positives:      7590  2.58%
+# False negatives:     43975  49.02%
+# TCR(l=50): 0.211819  SpamRecall: 50.975%  SpamPrec: 85.764%
 Reading scores from "../rules-base"...
 Reading per-message hit stat logs and scores...
 
 # SUMMARY for threshold 5.0:
-# Correctly non-spam:  35421  97.48%
-# Correctly spam:       5883  52.36%
-# False positives:       917  2.52%
-# False negatives:      5353  47.64%
-# TCR(l=50): 0.219440  SpamRecall: 52.358%  SpamPrec: 86.515%
+# Correctly non-spam:  35757  97.39%
+# Correctly spam:       5773  50.92%
+# False positives:       958  2.61%
+# False negatives:      5565  49.08%
+# TCR(l=50): 0.212064  SpamRecall: 50.917%  SpamPrec: 85.767%

Modified: spamassassin/trunk/rulesrc/scores/stats-set1
URL: http://svn.apache.org/viewvc/spamassassin/trunk/rulesrc/scores/stats-set1?rev=1907229&r1=1907228&r2=1907229&view=diff
==============================================================================
--- spamassassin/trunk/rulesrc/scores/stats-set1 (original)
+++ spamassassin/trunk/rulesrc/scores/stats-set1 Fri Feb  3 02:40:09 2023
@@ -1,23 +1,23 @@
 ##### WITH NEW RULES AND SCORES #####
 
 # SUMMARY for threshold 5.0:
-# Correctly non-spam: 295937  77.707%  (99.213% of non-spam corpus)
-# Correctly spam:      55286  14.517%  (66.972% of spam corpus)
-# False positives:      2348  0.617%  (0.787% of nonspam,  65145 weighted)
-# False negatives:     27265  7.159%  (33.028% of spam,  41061 weighted)
-# Average score for spam:  15.2    nonspam: -0.2
+# Correctly non-spam: 295945  77.710%  (99.216% of non-spam corpus)
+# Correctly spam:      55300  14.521%  (66.991% of spam corpus)
+# False positives:      2340  0.614%  (0.784% of nonspam,  65025 weighted)
+# False negatives:     27249  7.155%  (33.009% of spam,  40989 weighted)
+# Average score for spam:  15.1    nonspam: -0.2
 # Average for false-pos:   10.0  false-neg: 1.5
-# TOTAL:              380836  100.00%
+# TOTAL:              380834  100.00%
 
 Reading scores from "tmprules"...
 Reading per-message hit stat logs and scores...
 
 # SUMMARY for threshold 5.0:
-# Correctly non-spam:  36894  99.11%
-# Correctly spam:       7024  67.44%
-# False positives:       330  0.89%
-# False negatives:      3391  32.56%
-# TCR(l=50): 0.523604  SpamRecall: 67.441%  SpamPrec: 95.513%
+# Correctly non-spam:  36896  99.12%
+# Correctly spam:       7026  67.47%
+# False positives:       328  0.88%
+# False negatives:      3388  32.53%
+# TCR(l=50): 0.526279  SpamRecall: 67.467%  SpamPrec: 95.540%
 
 ##### WITHOUT NEW RULES AND SCORES #####
 Reading scores from "../rules-base"...
@@ -25,16 +25,16 @@ Reading per-message hit stat logs and sc
 
 # SUMMARY for threshold 5.0:
 # Correctly non-spam: 296017  99.24%
-# Correctly spam:      47964  58.10%
+# Correctly spam:      47936  58.07%
 # False positives:      2268  0.76%
-# False negatives:     34587  41.90%
-# TCR(l=50): 0.557826  SpamRecall: 58.102%  SpamPrec: 95.485%
+# False negatives:     34613  41.93%
+# TCR(l=50): 0.557715  SpamRecall: 58.070%  SpamPrec: 95.482%
 Reading scores from "../rules-base"...
 Reading per-message hit stat logs and scores...
 
 # SUMMARY for threshold 5.0:
 # Correctly non-spam:  36913  99.16%
-# Correctly spam:       6054  58.13%
+# Correctly spam:       6079  58.37%
 # False positives:       311  0.84%
-# False negatives:      4361  41.87%
-# TCR(l=50): 0.523078  SpamRecall: 58.128%  SpamPrec: 95.114%
+# False negatives:      4335  41.63%
+# TCR(l=50): 0.523711  SpamRecall: 58.373%  SpamPrec: 95.133%