You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@spamassassin.apache.org by sp...@apache.org on 2023/02/02 02:39:36 UTC

svn commit: r1907212 [2/2] - in /spamassassin/trunk/rulesrc/scores: 72_scores.cf scores-set0 scores-set1 scores-set2 scores-set3 stats-set0 stats-set1

Modified: spamassassin/trunk/rulesrc/scores/scores-set3
URL: http://svn.apache.org/viewvc/spamassassin/trunk/rulesrc/scores/scores-set3?rev=1907212&r1=1907211&r2=1907212&view=diff
==============================================================================
--- spamassassin/trunk/rulesrc/scores/scores-set3 (original)
+++ spamassassin/trunk/rulesrc/scores/scores-set3 Thu Feb  2 02:39:36 2023
@@ -3,39 +3,40 @@
 
 score AC_BR_BONANZA                  0.001
 score AC_DIV_BONANZA                 0.001
-score AC_FROM_MANY_DOTS              1.740
+score AC_FROM_MANY_DOTS              2.707
 score AC_HTML_NONSENSE_TAGS          1.999
 score ADMITS_SPAM                    0.001
-score ADVANCE_FEE_2_NEW_FRM_MNY      1.455
+score ADVANCE_FEE_2_NEW_FRM_MNY      1.507
 score ADVANCE_FEE_2_NEW_MONEY        1.999
-score ADVANCE_FEE_3_NEW              3.500
-score ADVANCE_FEE_3_NEW_MONEY        2.499
+score ADVANCE_FEE_3_NEW              3.499
+score ADVANCE_FEE_3_NEW_MONEY        2.291
 score ADVANCE_FEE_4_NEW              2.599
-score ADVANCE_FEE_4_NEW_MONEY        1.581
-score ADVANCE_FEE_5_NEW_FRM_MNY      0.001 # force non-zero
-score ADVANCE_FEE_5_NEW_MONEY        0.935
-score AD_PREFS                       0.153
+score ADVANCE_FEE_4_NEW_FRM_MNY      0.552
+score ADVANCE_FEE_4_NEW_MONEY        1.582
+score ADVANCE_FEE_5_NEW_FRM_MNY      0.001
+score ADVANCE_FEE_5_NEW_MONEY        0.749
+score AD_PREFS                       0.415
 score AMAZON_IMG_NOT_RCVD_AMZN       0.001
-score AXB_XMAILER_MIMEOLE_OL_024C2   0.001
-score BIGNUM_EMAILS_FREEM            0.948
-score BIGNUM_EMAILS_MANY             2.999
-score BITCOIN_DEADLINE               2.519
-score BITCOIN_EXTORT_01              1.648
-score BITCOIN_MALF_HTML              0.207
-score BITCOIN_MALWARE                1.297
-score BITCOIN_OBFU_SUBJ              0.078
-score BITCOIN_SPAM_02                1.466
-score BITCOIN_SPAM_05                0.176
+score AXB_XMAILER_MIMEOLE_OL_024C2   0.001 # force non-zero
+score BIGNUM_EMAILS_FREEM            2.127
+score BIGNUM_EMAILS_MANY             3.000
+score BITCOIN_DEADLINE               2.517
+score BITCOIN_EXTORT_01              1.645
+score BITCOIN_MALF_HTML              1.491
+score BITCOIN_MALWARE                2.483
+score BITCOIN_OBFU_SUBJ              0.973
+score BITCOIN_SPAM_02                1.454
+score BITCOIN_SPAM_05                0.915
 score BITCOIN_SPAM_09                1.499
-score BITCOIN_XPRIO                  0.396
+score BITCOIN_XPRIO                  0.575
 score BITCOIN_YOUR_INFO              2.999
-score BODY_URI_ONLY                  2.379
+score BODY_URI_ONLY                  2.378
 score CK_HELO_GENERIC                0.249
 score CONTENT_AFTER_HTML_WEAK        1.499
 score CTE_8BIT_MISMATCH              0.001
-score DEAR_BENEFICIARY               1.326
-score DEAR_EMAIL_USER                1.293
-score DKIMWL_WL_HIGH                 -0.001 # force non-zero
+score DEAR_BENEFICIARY               1.200
+score DEAR_EMAIL_USER                1.997
+score DKIMWL_WL_HIGH                 -0.001
 score DKIMWL_WL_MED                  -0.001
 score DKIMWL_WL_MEDHI                -0.001
 score DX_TEXT_03                     1.799
@@ -44,39 +45,40 @@ score END_FUTURE_EMAILS              2.4
 score FILL_THIS_FORM                 0.001
 score FONT_INVIS_DIRECT              0.001
 score FONT_INVIS_LONG_LINE           2.999
-score FONT_INVIS_MSGID               2.174
-score FONT_INVIS_POSTEXTRAS          0.136
+score FONT_INVIS_MSGID               2.202
+score FONT_INVIS_POSTEXTRAS          0.001
 score FORGED_SPF_HELO                1.355
-score FORM_FRAUD                     0.999
-score FORM_FRAUD_3                   0.690
-score FORM_FRAUD_5                   1.450
+score FORM_FRAUD                     1.000
+score FORM_FRAUD_3                   1.347
+score FORM_FRAUD_5                   0.673
 score FREEMAIL_FORGED_FROMDOMAIN     0.250
-score FROM_2_EMAILS_SHORT            2.246
-score FROM_ADDR_WS                   2.999
+score FROM_2_EMAILS_SHORT            2.452
+score FROM_ADDR_WS                   3.000
 score FROM_FMBLA_NEWDOM              0.001
 score FROM_FMBLA_NEWDOM28            0.799
 score FROM_GOV_DKIM_AU               -0.999
 score FROM_MISSP_EH_MATCH            1.999
+score FROM_MISSP_REPLYTO             0.001 # force non-zero
 score FROM_MISSP_SPF_FAIL            1.999
-score FROM_MULTI_NORDNS              0.915
-score FROM_PAYPAL_SPOOF              0.919
+score FROM_MULTI_NORDNS              0.713
+score FROM_PAYPAL_SPOOF              0.937
 score FROM_SUSPICIOUS_NTLD           0.500
 score FROM_SUSPICIOUS_NTLD_FP        1.999
 score FSL_BULK_SIG                   0.001
 score FSL_NEW_HELO_USER              0.001
 score FUZZY_AMAZON                   0.001
-score FUZZY_CLICK_HERE               2.792
-score FUZZY_UNSUBSCRIBE              3.100
-score GB_CUSTOM_HTM_URI              0.040
+score FUZZY_CLICK_HERE               2.228
+score FUZZY_UNSUBSCRIBE              3.099
+score GB_CUSTOM_HTM_URI              0.392
 score GB_FAKE_RF_SHORT               0.826
-score GB_FREEMAIL_DISPTO             0.001
-score GB_HASHBL_BTC                  2.910
+score GB_FREEMAIL_DISPTO             0.001 # force non-zero
+score GB_HASHBL_BTC                  2.019
 score GOOG_REDIR_NORDNS              2.799
-score GOOG_STO_IMG_HTML              1.970
-score GOOG_STO_NOIMG_HTML            2.948
-score HAS_X_OUTGOING_SPAM_STAT       0.792
-score HDRS_LCASE_IMGONLY             0.100
-score HDRS_MISSP                     1.398
+score GOOG_STO_IMG_HTML              1.883
+score GOOG_STO_NOIMG_HTML            2.949
+score HAS_X_OUTGOING_SPAM_STAT       0.795
+score HDRS_LCASE_IMGONLY             0.099
+score HDRS_MISSP                     1.400
 score HDR_ORDER_FTSDMCXX_DIRECT      0.001
 score HDR_ORDER_FTSDMCXX_NORDNS      0.001
 score HEADER_FROM_DIFFERENT_DOMAINS  0.250
@@ -86,68 +88,68 @@ score HK_RANDOM_ENVFROM              0.0
 score HK_RANDOM_FROM                 1.000
 score HK_RANDOM_REPLYTO              0.999
 score HK_SCAM                        1.999
-score HOSTED_IMG_DIRECT_MX           0.001
-score HOSTED_IMG_FREEM               2.190
+score HOSTED_IMG_DIRECT_MX           0.001 # force non-zero
+score HOSTED_IMG_FREEM               2.188
 score HOSTED_IMG_MULTI_PUB_01        2.999
 score HTML_OFF_PAGE                  0.001
 score HTML_TAG_BALANCE_CENTER        3.599
-score HTML_TEXT_INVISIBLE_FONT       0.276
-score HTML_TEXT_INVISIBLE_STYLE      2.805
+score HTML_TEXT_INVISIBLE_FONT       0.250
+score HTML_TEXT_INVISIBLE_STYLE      2.801
 score JH_SPAMMY_HEADERS              3.499
-score KHOP_HELO_FCRDNS               0.001
-score LONG_HEX_URI                   2.669
+score KHOP_HELO_FCRDNS               0.001 # force non-zero
+score LONG_HEX_URI                   2.658
 score LONG_IMG_URI                   0.001
-score LONG_INVISIBLE_TEXT            3.000
+score LONG_INVISIBLE_TEXT            2.999
 score LOTS_OF_MONEY                  0.010
-score MALWARE_NORDNS                 1.096
-score MILLION_HUNDRED                2.600
-score MILLION_USD                    1.050
+score MALWARE_NORDNS                 0.307
+score MILLION_HUNDRED                2.599
+score MILLION_USD                    1.031
 score MIMEOLE_DIRECT_TO_MX           0.001
-score MIXED_HREF_CASE                1.995
-score MONEY_ATM_CARD                 2.050
-score MONEY_FORM                     0.332
+score MIXED_HREF_CASE                0.047
+score MONEY_ATM_CARD                 2.479
+score MONEY_FORM                     0.331
 score MONEY_FORM_SHORT               2.499
 score MONEY_FRAUD_3                  0.001
-score MONEY_FRAUD_5                  1.287
-score MONEY_FRAUD_8                  0.001 # force non-zero
+score MONEY_FRAUD_5                  2.621
+score MONEY_FRAUD_8                  0.001
 score MONEY_FREEMAIL_REPTO           0.001
-score MSMAIL_PRI_ABNORMAL            0.589
+score MSMAIL_PRI_ABNORMAL            1.499
 score NA_DOLLARS                     1.499
 score NICE_REPLY_A                   -0.090
-score NO_FM_NAME_IP_HOSTN            0.001
+score NO_FM_NAME_IP_HOSTN            0.001 # force non-zero
 score NSL_RCVD_HELO_USER             0.001
-score NUMBERONLY_BITCOIN_EXP         0.610
-score OBFU_TEXT_ATTACH               1.206
-score ODD_FREEM_REPTO                2.945
+score NUMBERONLY_BITCOIN_EXP         1.230
+score OBFU_TEXT_ATTACH               1.368
+score ODD_FREEM_REPTO                2.707
 score PDS_BAD_THREAD_QP_64           0.001
-score PDS_BTC_ID                     0.205
+score PDS_BTC_ID                     0.212
 score PDS_BTC_MSGID                  0.001
 score PDS_FROM_2_EMAILS              0.001
-score PDS_HELO_SPF_FAIL              2.000
-score PDS_NAKED_TO_NUMERO            0.376
+score PDS_HELO_SPF_FAIL              1.999
+score PDS_NAKED_TO_NUMERO            2.000
 score PDS_RDNS_DYNAMIC_FP            0.001 # force non-zero
-score PDS_SHORT_SPOOFED_URL          1.999
-score PDS_TONAME_EQ_TOLOCAL_FREEM_FORGE 1.348
-score PHP_ORIG_SCRIPT                0.001 # force non-zero
-score PHP_SCRIPT                     2.500
+score PDS_SHORT_SPOOFED_URL          2.000
+score PDS_TONAME_EQ_TOLOCAL_FREEM_FORGE 1.347
+score PHP_ORIG_SCRIPT                0.001
+score PHP_SCRIPT                     2.499
 score PP_MIME_FAKE_ASCII_TEXT        0.001
 score RAND_MKTG_HEADER               1.999
-score RATWARE_NO_RDNS                1.187
+score RATWARE_NO_RDNS                1.850
 score RCVD_IN_MSPIKE_H2              -0.001
-score RDNS_NUM_TLD_XM                2.833
+score RDNS_NUM_TLD_XM                1.286
 score REPTO_419_FRAUD                2.999
 score SCC_CANSPAM_1                  2.299
 score SCC_ISEMM_LID_1B               0.001
-score SENDGRID_REDIR                 1.068
-score SERGIO_SUBJECT_VIAGRA01        0.744
+score SENDGRID_REDIR                 1.063
+score SERGIO_SUBJECT_VIAGRA01        3.341
 score SHOPIFY_IMG_NOT_RCVD_SFY       2.499
-score SHORTENED_URL_SRC              2.799
+score SHORTENED_URL_SRC              0.621
 score SPOOFED_FREEMAIL               0.001
 score SPOOFED_FREEMAIL_NO_RDNS       0.001
 score SPOOF_GMAIL_MID                0.001
 score STATIC_XPRIO_OLE               0.001
-score SUSP_UTF8_WORD_COMBO           1.247
-score SUSP_UTF8_WORD_MANY            2.221
+score SUSP_UTF8_WORD_COMBO           1.469
+score SUSP_UTF8_WORD_MANY            1.999
 score SUSP_UTF8_WORD_SUBJ            1.999
 score THIS_AD                        0.999
 score TO_EQ_FM_DOM_SPF_FAIL          0.001
@@ -155,21 +157,21 @@ score TO_EQ_FM_SPF_FAIL              0.0
 score TO_NAME_SUBJ_NO_RDNS           2.999
 score TO_NO_BRKTS_HTML_IMG           1.999
 score TO_NO_BRKTS_HTML_ONLY          1.999
+score TO_NO_BRKTS_MSFT               0.001
 score TO_NO_BRKTS_NORDNS_HTML        1.999
 score TO_NO_BRKTS_PCNT               2.499
-score TVD_ENHANCE                    1.910
-score TVD_IP_HEX                     1.376
-score TVD_IP_OCT                     2.386
-score TVD_PH_BODY_META               0.001 # force non-zero
-score TVD_SPACE_ENCODED              0.001
-score UNDISC_FREEM                   2.799
-score UNDISC_MONEY                   3.199
+score TVD_ENHANCE                    2.036
+score TVD_IP_HEX                     1.538
+score TVD_IP_OCT                     2.340
+score TVD_PH_BODY_META               0.001
+score UNDISC_FREEM                   2.899
+score UNDISC_MONEY                   3.299
 score URI_DOTEDU                     1.999
 score URI_GOOGLE_PROXY               1.999
 score URI_ONLY_MSGID_MALF            0.001
-score URI_PHISH                      3.695
-score URI_TRY_3LD                    1.166
-score URI_WP_DIRINDEX                3.439
+score URI_PHISH                      3.701
+score URI_TRY_3LD                    1.167
+score URI_WP_DIRINDEX                3.276
 score URI_WP_HACKED                  3.500
 score URI_WP_HACKED_2                2.499
 score VFY_ACCT_NORDNS                2.999
@@ -178,7 +180,7 @@ score WORD_INVIS_MANY                2.9
 score XFER_LOTSA_MONEY               0.999
 score XM_RANDOM                      0.001
 score XM_RECPTID                     2.999
-score XPRIO                          0.001
+score XPRIO                          0.001 # force non-zero
 score YOU_INHERIT                    0.001
 score AC_POST_EXTRAS                 1.000
 score AC_SPAMMY_URI_PATTERNS1        1.000
@@ -282,6 +284,7 @@ score LOTTO_AGENT                    1.0
 score LUCRATIVE                      1.000
 score MALF_HTML_B64                  1.000
 score MALWARE_PASSWORD               1.000
+score MANY_HDRS_LCASE                0.100
 score MIME_NO_TEXT                   1.000
 score MIXED_AREA_CASE                1.000
 score MIXED_CENTER_CASE              1.000

Modified: spamassassin/trunk/rulesrc/scores/stats-set0
URL: http://svn.apache.org/viewvc/spamassassin/trunk/rulesrc/scores/stats-set0?rev=1907212&r1=1907211&r2=1907212&view=diff
==============================================================================
--- spamassassin/trunk/rulesrc/scores/stats-set0 (original)
+++ spamassassin/trunk/rulesrc/scores/stats-set0 Thu Feb  2 02:39:36 2023
@@ -1,40 +1,40 @@
 ##### WITH NEW RULES AND SCORES #####
 
 # SUMMARY for threshold 5.0:
-# Correctly non-spam: 297089  76.636%  (99.453% of non-spam corpus)
-# Correctly spam:      56876  14.672%  (63.949% of spam corpus)
-# False positives:      1633  0.421%  (0.547% of nonspam,  17049 weighted)
-# False negatives:     32064  8.271%  (36.051% of spam,  41074 weighted)
-# Average score for spam:  9.9    nonspam: 0.7
-# Average for false-pos:   7.0  false-neg: 1.3
-# TOTAL:              387662  100.00%
+# Correctly non-spam: 289201  76.158%  (99.436% of non-spam corpus)
+# Correctly spam:      56289  14.823%  (63.321% of spam corpus)
+# False positives:      1641  0.432%  (0.564% of nonspam,  16142 weighted)
+# False negatives:     32605  8.586%  (36.679% of spam,  41869 weighted)
+# Average score for spam:  9.7    nonspam: 0.7
+# Average for false-pos:   6.4  false-neg: 1.3
+# TOTAL:              379736  100.00%
 
 Reading scores from "tmprules"...
 Reading per-message hit stat logs and scores...
 
 # SUMMARY for threshold 5.0:
-# Correctly non-spam:  37078  99.45%
-# Correctly spam:       7297  64.93%
-# False positives:       205  0.55%
-# False negatives:      3942  35.07%
-# TCR(l=50): 0.791925  SpamRecall: 64.926%  SpamPrec: 97.267%
+# Correctly non-spam:  36131  99.43%
+# Correctly spam:       7167  63.79%
+# False positives:       207  0.57%
+# False negatives:      4069  36.21%
+# TCR(l=50): 0.779250  SpamRecall: 63.786%  SpamPrec: 97.193%
 
 ##### WITHOUT NEW RULES AND SCORES #####
 Reading scores from "../rules-base"...
 Reading per-message hit stat logs and scores...
 
 # SUMMARY for threshold 5.0:
-# Correctly non-spam: 291237  97.49%
-# Correctly spam:      47843  53.79%
-# False positives:      7485  2.51%
-# False negatives:     41097  46.21%
-# TCR(l=50): 0.214134  SpamRecall: 53.792%  SpamPrec: 86.472%
+# Correctly non-spam: 283247  97.39%
+# Correctly spam:      46813  52.66%
+# False positives:      7595  2.61%
+# False negatives:     42081  47.34%
+# TCR(l=50): 0.210734  SpamRecall: 52.662%  SpamPrec: 86.041%
 Reading scores from "../rules-base"...
 Reading per-message hit stat logs and scores...
 
 # SUMMARY for threshold 5.0:
-# Correctly non-spam:  36382  97.58%
-# Correctly spam:       6021  53.57%
-# False positives:       901  2.42%
-# False negatives:      5218  46.43%
-# TCR(l=50): 0.223582  SpamRecall: 53.572%  SpamPrec: 86.984%
+# Correctly non-spam:  35421  97.48%
+# Correctly spam:       5883  52.36%
+# False positives:       917  2.52%
+# False negatives:      5353  47.64%
+# TCR(l=50): 0.219440  SpamRecall: 52.358%  SpamPrec: 86.515%

Modified: spamassassin/trunk/rulesrc/scores/stats-set1
URL: http://svn.apache.org/viewvc/spamassassin/trunk/rulesrc/scores/stats-set1?rev=1907212&r1=1907211&r2=1907212&view=diff
==============================================================================
--- spamassassin/trunk/rulesrc/scores/stats-set1 (original)
+++ spamassassin/trunk/rulesrc/scores/stats-set1 Thu Feb  2 02:39:36 2023
@@ -2,22 +2,22 @@
 
 # SUMMARY for threshold 5.0:
 # Correctly non-spam: 295937  77.707%  (99.213% of non-spam corpus)
-# Correctly spam:      55307  14.522%  (66.997% of spam corpus)
-# False positives:      2348  0.617%  (0.787% of nonspam,  65142 weighted)
-# False negatives:     27245  7.154%  (33.003% of spam,  40970 weighted)
-# Average score for spam:  14.7    nonspam: -0.2
+# Correctly spam:      55286  14.517%  (66.972% of spam corpus)
+# False positives:      2348  0.617%  (0.787% of nonspam,  65145 weighted)
+# False negatives:     27265  7.159%  (33.028% of spam,  41061 weighted)
+# Average score for spam:  15.2    nonspam: -0.2
 # Average for false-pos:   10.0  false-neg: 1.5
-# TOTAL:              380837  100.00%
+# TOTAL:              380836  100.00%
 
 Reading scores from "tmprules"...
 Reading per-message hit stat logs and scores...
 
 # SUMMARY for threshold 5.0:
-# Correctly non-spam:  36895  99.12%
-# Correctly spam:       7023  67.43%
-# False positives:       329  0.88%
-# False negatives:      3392  32.57%
-# TCR(l=50): 0.524897  SpamRecall: 67.432%  SpamPrec: 95.525%
+# Correctly non-spam:  36894  99.11%
+# Correctly spam:       7024  67.44%
+# False positives:       330  0.89%
+# False negatives:      3391  32.56%
+# TCR(l=50): 0.523604  SpamRecall: 67.441%  SpamPrec: 95.513%
 
 ##### WITHOUT NEW RULES AND SCORES #####
 Reading scores from "../rules-base"...
@@ -25,16 +25,16 @@ Reading per-message hit stat logs and sc
 
 # SUMMARY for threshold 5.0:
 # Correctly non-spam: 296017  99.24%
-# Correctly spam:      47934  58.07%
+# Correctly spam:      47964  58.10%
 # False positives:      2268  0.76%
-# False negatives:     34618  41.93%
-# TCR(l=50): 0.557716  SpamRecall: 58.065%  SpamPrec: 95.482%
+# False negatives:     34587  41.90%
+# TCR(l=50): 0.557826  SpamRecall: 58.102%  SpamPrec: 95.485%
 Reading scores from "../rules-base"...
 Reading per-message hit stat logs and scores...
 
 # SUMMARY for threshold 5.0:
 # Correctly non-spam:  36913  99.16%
-# Correctly spam:       6070  58.28%
+# Correctly spam:       6054  58.13%
 # False positives:       311  0.84%
-# False negatives:      4345  41.72%
-# TCR(l=50): 0.523498  SpamRecall: 58.281%  SpamPrec: 95.126%
+# False negatives:      4361  41.87%
+# TCR(l=50): 0.523078  SpamRecall: 58.128%  SpamPrec: 95.114%