You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@spamassassin.apache.org by sp...@apache.org on 2023/06/10 02:51:15 UTC

svn commit: r1910335 [2/2] - in /spamassassin/trunk/rulesrc/scores: 72_scores.cf scores-set0 scores-set1 scores-set2 scores-set3 stats-set0 stats-set1

Modified: spamassassin/trunk/rulesrc/scores/scores-set3
URL: http://svn.apache.org/viewvc/spamassassin/trunk/rulesrc/scores/scores-set3?rev=1910335&r1=1910334&r2=1910335&view=diff
==============================================================================
--- spamassassin/trunk/rulesrc/scores/scores-set3 (original)
+++ spamassassin/trunk/rulesrc/scores/scores-set3 Sat Jun 10 02:51:15 2023
@@ -3,211 +3,210 @@
 
 score ACCT_PHISHING_MANY             2.999
 score AC_DIV_BONANZA                 0.001
-score AC_FROM_MANY_DOTS              3.000
-score AC_HTML_NONSENSE_TAGS          2.000
+score AC_FROM_MANY_DOTS              2.999
+score AC_HTML_NONSENSE_TAGS          1.999
 score ADMITS_SPAM                    0.001
 score ADVANCE_FEE_2_NEW_MONEY        1.999
 score ADVANCE_FEE_3_NEW              3.267
 score ADVANCE_FEE_3_NEW_MONEY        2.599
-score ADVANCE_FEE_4_NEW_MONEY        1.288
+score ADVANCE_FEE_4_NEW_MONEY        1.410
 score ADVANCE_FEE_5_NEW_FRM_MNY      0.001
 score ADVANCE_FEE_5_NEW_MONEY        0.001
-score AD_PREFS                       0.315
+score AD_PREFS                       0.001
 score ALIBABA_IMG_NOT_RCVD_ALI       0.001
 score AMAZON_IMG_NOT_RCVD_AMZN       0.001
 score AXB_XMAILER_MIMEOLE_OL_024C2   0.001
-score BIGNUM_EMAILS_FREEM            0.890
+score BIGNUM_EMAILS_FREEM            0.898
 score BIGNUM_EMAILS_MANY             2.999
-score BITCOIN_DEADLINE               1.914
-score BITCOIN_EXTORT_01              2.648
+score BITCOIN_DEADLINE               1.999
+score BITCOIN_EXTORT_01              2.651
 score BITCOIN_MALF_HTML              0.001
-score BITCOIN_OBFU_SUBJ              1.509
-score BITCOIN_SPAM_02                2.226
-score BITCOIN_SPAM_05                1.147
+score BITCOIN_OBFU_SUBJ              0.652
+score BITCOIN_SPAM_02                1.993
+score BITCOIN_SPAM_05                2.499
 score BITCOIN_SPAM_07                3.499
 score BITCOIN_XPRIO                  0.001
 score BITCOIN_YOUR_INFO              2.999
-score BODY_SINGLE_URI                0.001
+score BODY_SINGLE_URI                0.001 # force non-zero
 score BODY_SINGLE_WORD               0.001
 score BODY_URI_ONLY                  0.001
-score CK_HELO_GENERIC                0.250
+score CK_HELO_GENERIC                0.249
 score CTE_8BIT_MISMATCH              0.001
 score DATE_IN_FUTURE_Q_PLUS          2.499
 score DEAR_BENEFICIARY               0.001
 score DKIMWL_WL_HIGH                 -0.001
-score DKIMWL_WL_MED                  -0.001
+score DKIMWL_WL_MED                  -0.001 # force non-zero
 score DKIMWL_WL_MEDHI                -0.001
 score DOS_BODY_HIGH_NO_MID           0.001
 score END_FUTURE_EMAILS              2.499
 score FAKE_REPLY_A1                  0.001
-score FAKE_REPLY_B                   2.580
-score FILL_THIS_FORM                 0.001
+score FAKE_REPLY_B                   1.811
+score FILL_THIS_FORM                 0.001 # force non-zero
 score FONT_INVIS_DIRECT              0.001
-score FONT_INVIS_LONG_LINE           2.999
+score FONT_INVIS_LONG_LINE           3.000
 score FONT_INVIS_MSGID               0.001
-score FONT_INVIS_POSTEXTRAS          1.390
-score FORGED_SPF_HELO                0.465
-score FORM_FRAUD_5                   0.001 # force non-zero
-score FREEMAIL_FORGED_FROMDOMAIN     0.250
+score FONT_INVIS_POSTEXTRAS          1.389
+score FORGED_SPF_HELO                0.472
+score FORM_FRAUD_5                   0.001
+score FREEMAIL_FORGED_FROMDOMAIN     0.249
 score FROM_2_EMAILS_SHORT            0.001
 score FROM_ADDR_WS                   2.999
 score FROM_FMBLA_NEWDOM28            0.799
 score FROM_GOV_DKIM_AU               -0.001
 score FROM_IN_TO_AND_SUBJ            1.899
-score FROM_MISSPACED                 0.001 # force non-zero
+score FROM_MISSPACED                 0.001
 score FROM_MISSP_DYNIP               2.299
-score FROM_MISSP_EH_MATCH            1.547
+score FROM_MISSP_EH_MATCH            1.548
 score FROM_MISSP_FREEMAIL            2.999
 score FROM_MISSP_MSFT                0.001
-score FROM_MISSP_REPLYTO             0.226
+score FROM_MISSP_REPLYTO             0.240
 score FROM_MISSP_SPF_FAIL            0.001
-score FROM_MISSP_USER                0.001 # force non-zero
+score FROM_MISSP_USER                0.001
 score FROM_MULTI_NORDNS              0.001
-score FROM_PAYPAL_SPOOF              0.001
+score FROM_PAYPAL_SPOOF              1.058
 score FROM_SUSPICIOUS_NTLD           0.001
 score FROM_SUSPICIOUS_NTLD_FP        1.999
-score FROM_UNBAL1                    1.797
-score FROM_UNBAL2                    0.707
+score FROM_UNBAL1                    1.104
+score FROM_UNBAL2                    2.325
 score FROM_WSP_TRAIL                 3.299
 score FSL_BULK_SIG                   0.001
 score FSL_CTYPE_WIN1251              0.001
 score FSL_HELO_FAKE                  0.001
 score FSL_NEW_HELO_USER              0.001
-score FUZZY_AMAZON                   0.001
-score GB_BITCOIN_NH                  1.362
-score GB_CUSTOM_HTM_URI              1.033
+score FUZZY_AMAZON                   0.001 # force non-zero
+score GB_BITCOIN_NH                  1.351
+score GB_CUSTOM_HTM_URI              0.999
 score GB_FAKE_RF_SHORT               1.999
 score GB_FREEMAIL_DISPTO             0.001
-score GB_GOOGLE_TRANSL               0.749
-score GB_HASHBL_BTC                  0.001
-score GOOG_MALWARE_DNLD              3.587
-score GOOG_REDIR_HTML_ONLY           2.000
-score GOOG_REDIR_NORDNS              3.199
-score GOOG_STO_IMG_HTML              3.000
+score GB_HASHBL_BTC                  0.001 # force non-zero
+score GOOG_MALWARE_DNLD              4.265
+score GOOG_REDIR_HTML_ONLY           1.999
+score GOOG_REDIR_NORDNS              3.200
+score GOOG_STO_IMG_HTML              2.999
 score GOOG_STO_IMG_NOHTML            2.499
-score GOOG_STO_NOIMG_HTML            2.945
+score GOOG_STO_NOIMG_HTML            2.952
 score HAS_X_OUTGOING_SPAM_STAT       1.999
 score HDRS_MISSP                     0.001
 score HDR_ORDER_FTSDMCXX_DIRECT      0.001
 score HDR_ORDER_FTSDMCXX_NORDNS      0.001
-score HEADER_FROM_DIFFERENT_DOMAINS  0.250
-score HELO_NO_DOMAIN                 0.015
+score HEADER_FROM_DIFFERENT_DOMAINS  0.249
+score HELO_NO_DOMAIN                 0.001
 score HK_NAME_MR_MRS                 0.999
 score HK_RANDOM_ENVFROM              0.001
-score HK_RANDOM_FROM                 0.001 # force non-zero
+score HK_RANDOM_FROM                 0.001
 score HK_RANDOM_REPLYTO              0.999
 score HK_SCAM                        0.001
-score HOSTED_IMG_DIRECT_MX           0.001
+score HOSTED_IMG_DIRECT_MX           0.001 # force non-zero
 score HOSTED_IMG_MULTI_PUB_01        2.999
 score HTML_ENTITY_ASCII              2.999
-score HTML_ENTITY_ASCII_TINY         0.192
-score HTML_FONT_TINY_NORDNS          0.326
+score HTML_ENTITY_ASCII_TINY         1.092
+score HTML_FONT_TINY_NORDNS          0.331
 score HTML_SINGLET_MANY              2.499
-score HTML_TAG_BALANCE_CENTER        2.699
+score HTML_TAG_BALANCE_CENTER        2.700
 score HTML_TEXT_INVISIBLE_FONT       1.999
 score HTML_TEXT_INVISIBLE_STYLE      0.001
 score JH_SPAMMY_HEADERS              3.499
 score KHOP_HELO_FCRDNS               0.001 # force non-zero
-score LONG_HEX_URI                   2.768
-score LONG_IMG_URI                   0.001
+score LONG_HEX_URI                   2.770
+score LONG_IMG_URI                   0.001 # force non-zero
 score LONG_INVISIBLE_TEXT            2.999
 score LOTS_OF_MONEY                  0.010
 score MALFORMED_FREEMAIL             2.699
-score MALWARE_NORDNS                 1.569
-score MILLION_HUNDRED                0.890
+score MALWARE_NORDNS                 1.629
+score MILLION_HUNDRED                0.887
 score MILLION_USD                    0.001
 score MIMEOLE_DIRECT_TO_MX           0.001
 score MIXED_ES                       2.399
-score MIXED_HREF_CASE                0.071
+score MIXED_HREF_CASE                1.771
 score MONEY_FORM                     0.001
 score MONEY_FORM_SHORT               0.001
 score MONEY_FRAUD_3                  0.001
-score MONEY_FRAUD_5                  0.355
-score MONEY_FRAUD_8                  0.168
-score MONEY_FREEMAIL_REPTO           0.237
-score MONEY_FROM_MISSP               0.001
-score MSMAIL_PRI_ABNORMAL            1.499
+score MONEY_FRAUD_5                  0.155
+score MONEY_FRAUD_8                  0.226
+score MONEY_FREEMAIL_REPTO           0.180
+score MONEY_FROM_MISSP               0.001 # force non-zero
+score MSMAIL_PRI_ABNORMAL            0.711
 score NAME_EMAIL_DIFF                0.001
-score NA_DOLLARS                     0.451
+score NA_DOLLARS                     0.509
 score NICE_REPLY_A                   -0.090
 score NO_FM_NAME_IP_HOSTN            0.001
-score NSL_RCVD_FROM_USER             0.001
-score NSL_RCVD_HELO_USER             0.001 # force non-zero
-score OBFU_TEXT_ATTACH               1.070
-score ODD_FREEM_REPTO                2.458
-score PDS_BTC_ID                     0.001
+score NSL_RCVD_FROM_USER             0.001 # force non-zero
+score NSL_RCVD_HELO_USER             0.001
+score OBFU_TEXT_ATTACH               1.149
+score ODD_FREEM_REPTO                2.489
+score PDS_BTC_ID                     0.001 # force non-zero
 score PDS_BTC_MSGID                  0.001
 score PDS_FRNOM_TODOM_DBL_URL        1.499
 score PDS_FRNOM_TODOM_NAKED_TO       1.499
-score PDS_FROM_2_EMAILS              2.576
+score PDS_FROM_2_EMAILS              2.578
 score PDS_FROM_NAME_TO_DOMAIN        1.999
-score PDS_HP_HELO_NORDNS             0.001 # force non-zero
+score PDS_HP_HELO_NORDNS             0.001
 score PDS_OTHER_BAD_TLD              0.001
 score PDS_RDNS_DYNAMIC_FP            0.001 # force non-zero
 score PDS_TINYSUBJ_URISHRT           1.499
-score PDS_TONAME_EQ_TOLOCAL_FREEM_FORGE 0.001 # force non-zero
+score PDS_TONAME_EQ_TOLOCAL_FREEM_FORGE 0.001
 score PDS_TO_EQ_FROM_NAME            0.001
 score PHP_ORIG_SCRIPT                0.001
 score PHP_SCRIPT                     2.499
 score POSSIBLE_GMAIL_PHISHER         2.199
-score PP_MIME_FAKE_ASCII_TEXT        0.001
+score PP_MIME_FAKE_ASCII_TEXT        0.001 # force non-zero
 score RAND_HEADER_MANY               0.001
 score RAND_MKTG_HEADER               1.999
-score RATWARE_NO_RDNS                0.001
+score RATWARE_NO_RDNS                0.001 # force non-zero
 score RCVD_IN_MSPIKE_H2              -0.001
-score READY_TO_SHIP                  0.638
+score READY_TO_SHIP                  0.648
 score SCC_BODY_SINGLE_WORD           0.001 # force non-zero
 score SCC_BODY_URI_ONLY              1.439
-score SCC_CANSPAM_1                  2.479
+score SCC_CANSPAM_1                  0.444
 score SCC_CANSPAM_2                  3.299
-score SCC_ISEMM_LID_1B               0.997
+score SCC_ISEMM_LID_1B               1.003
 score SCC_SPAMMER_ADDR_2             2.799
-score SCC_SPECIAL_GUID               0.844
-score SENDGRID_REDIR                 1.001
-score SERGIO_SUBJECT_PORN014         2.825
+score SCC_SPECIAL_GUID               1.887
+score SENDGRID_REDIR                 0.998
+score SERGIO_SUBJECT_PORN014         2.826
 score SERGIO_SUBJECT_VIAGRA01        0.001
 score SHOPIFY_IMG_NOT_RCVD_SFY       2.499
-score SHORT_SHORTNER                 0.300
+score SHORT_SHORTNER                 0.299
 score SPOOFED_FREEMAIL               0.001
 score SPOOFED_FREEMAIL_NO_RDNS       0.001
 score SPOOFED_FREEM_REPTO            0.001
 score SPOOF_GMAIL_MID                0.001
 score STATIC_XPRIO_OLE               0.001
 score SUSP_UTF8_WORD_COMBO           2.999
-score SUSP_UTF8_WORD_SUBJ            0.362
-score THIS_AD                        0.999
-score TO_EQ_FM_DIRECT_MX             0.151
-score TO_EQ_FM_DOM_SPF_FAIL          0.087
-score TO_EQ_FM_HTML_ONLY             2.199
+score SUSP_UTF8_WORD_SUBJ            0.369
+score THIS_AD                        1.000
+score TO_EQ_FM_DIRECT_MX             0.253
+score TO_EQ_FM_DOM_SPF_FAIL          0.001 # force non-zero
+score TO_EQ_FM_HTML_ONLY             2.200
 score TO_EQ_FM_SPF_FAIL              0.001
 score TO_IN_SUBJ                     0.100
-score TO_NO_BRKTS_FROM_MSSP          0.461
+score TO_NO_BRKTS_FROM_MSSP          0.451
 score TO_NO_BRKTS_HTML_IMG           1.999
 score TO_NO_BRKTS_HTML_ONLY          1.999
-score TO_NO_BRKTS_MSFT               1.179
-score TO_NO_BRKTS_NORDNS_HTML        2.000
+score TO_NO_BRKTS_MSFT               1.177
+score TO_NO_BRKTS_NORDNS_HTML        1.999
 score TO_NO_BRKTS_PCNT               2.499
 score TVD_SPACE_ENCODED              0.001
 score TVD_SPACE_RATIO_MINFP          0.001
 score UNDISC_FREEM                   2.699
-score UNDISC_MONEY                   1.266
+score UNDISC_MONEY                   1.340
 score UNICODE_OBFU_ASC               2.499
 score URI_DOTEDU                     1.999
-score URI_GOOGLE_PROXY               2.699
+score URI_GOOGLE_PROXY               2.700
 score URI_ONLY_MSGID_MALF            1.999
-score URI_PHISH                      3.963
-score URI_TRY_3LD                    1.682
+score URI_PHISH                      3.999
+score URI_TRY_3LD                    1.681
 score URI_WPADMIN                    2.299
-score URI_WP_HACKED                  1.585
+score URI_WP_HACKED                  1.589
 score URI_WP_HACKED_2                2.499
-score VFY_ACCT_NORDNS                2.623
-score WORD_INVIS                     0.502
+score VFY_ACCT_NORDNS                2.625
+score WORD_INVIS                     0.504
 score WORD_INVIS_MANY                2.996
 score XFER_LOTSA_MONEY               0.001
-score XM_DIGITS_ONLY                 0.273
+score XM_DIGITS_ONLY                 1.797
 score XM_RANDOM                      0.001 # force non-zero
-score XM_RECPTID                     2.024
-score XPRIO                          0.001
+score XM_RECPTID                     2.025
+score XPRIO                          0.001 # force non-zero
 score AC_BR_BONANZA                  0.001
 score AC_POST_EXTRAS                 1.000
 score AC_SPAMMY_URI_PATTERNS1        1.000

Modified: spamassassin/trunk/rulesrc/scores/stats-set0
URL: http://svn.apache.org/viewvc/spamassassin/trunk/rulesrc/scores/stats-set0?rev=1910335&r1=1910334&r2=1910335&view=diff
==============================================================================
--- spamassassin/trunk/rulesrc/scores/stats-set0 (original)
+++ spamassassin/trunk/rulesrc/scores/stats-set0 Sat Jun 10 02:51:15 2023
@@ -1,40 +1,40 @@
 ##### WITH NEW RULES AND SCORES #####
 
 # SUMMARY for threshold 5.0:
-# Correctly non-spam: 393769  50.135%  (99.248% of non-spam corpus)
-# Correctly spam:     239174  30.452%  (61.538% of spam corpus)
-# False positives:      2984  0.380%  (0.752% of nonspam, 100602 weighted)
-# False negatives:    149484  19.033%  (38.462% of spam, 242229 weighted)
-# Average score for spam:  8.8    nonspam: 0.7
+# Correctly non-spam: 393946  49.736%  (99.244% of non-spam corpus)
+# Correctly spam:     241706  30.516%  (61.172% of spam corpus)
+# False positives:      3002  0.379%  (0.756% of nonspam, 103452 weighted)
+# False negatives:    153422  19.370%  (38.828% of spam, 250773 weighted)
+# Average score for spam:  8.7    nonspam: 0.7
 # Average for false-pos:   6.9  false-neg: 1.6
-# TOTAL:              785411  100.00%
+# TOTAL:              792076  100.00%
 
 Reading scores from "tmprules"...
 Reading per-message hit stat logs and scores...
 
 # SUMMARY for threshold 5.0:
-# Correctly non-spam:  49129  99.28%
-# Correctly spam:      29678  61.25%
-# False positives:       356  0.72%
-# False negatives:     18776  38.75%
-# TCR(l=50): 1.324748  SpamRecall: 61.250%  SpamPrec: 98.815%
+# Correctly non-spam:  49157  99.27%
+# Correctly spam:      30156  61.17%
+# False positives:       363  0.73%
+# False negatives:     19140  38.83%
+# TCR(l=50): 1.321963  SpamRecall: 61.173%  SpamPrec: 98.811%
 
 ##### WITHOUT NEW RULES AND SCORES #####
 Reading scores from "../rules-base"...
 Reading per-message hit stat logs and scores...
 
 # SUMMARY for threshold 5.0:
-# Correctly non-spam: 388191  97.84%
-# Correctly spam:     135037  34.74%
-# False positives:      8562  2.16%
-# False negatives:    253621  65.26%
-# TCR(l=50): 0.570113  SpamRecall: 34.744%  SpamPrec: 94.038%
+# Correctly non-spam: 388366  97.84%
+# Correctly spam:     136023  34.43%
+# False positives:      8582  2.16%
+# False negatives:    259105  65.57%
+# TCR(l=50): 0.574143  SpamRecall: 34.425%  SpamPrec: 94.065%
 Reading scores from "../rules-base"...
 Reading per-message hit stat logs and scores...
 
 # SUMMARY for threshold 5.0:
-# Correctly non-spam:  48382  97.77%
-# Correctly spam:      17037  35.16%
-# False positives:      1103  2.23%
-# False negatives:     31417  64.84%
-# TCR(l=50): 0.559728  SpamRecall: 35.161%  SpamPrec: 93.920%
+# Correctly non-spam:  48454  97.85%
+# Correctly spam:      17149  34.79%
+# False positives:      1066  2.15%
+# False negatives:     32147  65.21%
+# TCR(l=50): 0.576919  SpamRecall: 34.788%  SpamPrec: 94.148%

Modified: spamassassin/trunk/rulesrc/scores/stats-set1
URL: http://svn.apache.org/viewvc/spamassassin/trunk/rulesrc/scores/stats-set1?rev=1910335&r1=1910334&r2=1910335&view=diff
==============================================================================
--- spamassassin/trunk/rulesrc/scores/stats-set1 (original)
+++ spamassassin/trunk/rulesrc/scores/stats-set1 Sat Jun 10 02:51:15 2023
@@ -1,23 +1,23 @@
 ##### WITH NEW RULES AND SCORES #####
 
 # SUMMARY for threshold 5.0:
-# Correctly non-spam: 369811  73.372%  (98.881% of non-spam corpus)
-# Correctly spam:      90840  18.023%  (69.863% of spam corpus)
-# False positives:      4186  0.831%  (1.119% of nonspam, 163347 weighted)
-# False negatives:     39185  7.774%  (30.137% of spam,  50835 weighted)
-# Average score for spam:  15.2    nonspam: -0.2
-# Average for false-pos:   11.2  false-neg: 1.3
+# Correctly non-spam: 369740  73.358%  (98.862% of non-spam corpus)
+# Correctly spam:      90824  18.020%  (69.851% of spam corpus)
+# False positives:      4257  0.845%  (1.138% of nonspam, 164566 weighted)
+# False negatives:     39201  7.778%  (30.149% of spam,  50862 weighted)
+# Average score for spam:  14.9    nonspam: -0.2
+# Average for false-pos:   11.1  false-neg: 1.3
 # TOTAL:              504022  100.00%
 
 Reading scores from "tmprules"...
 Reading per-message hit stat logs and scores...
 
 # SUMMARY for threshold 5.0:
-# Correctly non-spam:  46047  98.84%
-# Correctly spam:      11421  70.00%
-# False positives:       539  1.16%
-# False negatives:      4895  30.00%
-# TCR(l=50): 0.512357  SpamRecall: 69.999%  SpamPrec: 95.493%
+# Correctly non-spam:  46049  98.85%
+# Correctly spam:      11422  70.00%
+# False positives:       537  1.15%
+# False negatives:      4894  30.00%
+# TCR(l=50): 0.513987  SpamRecall: 70.005%  SpamPrec: 95.510%
 
 ##### WITHOUT NEW RULES AND SCORES #####
 Reading scores from "../rules-base"...