You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@spamassassin.apache.org by sp...@apache.org on 2020/09/26 03:25:10 UTC

svn commit: r1882031 [2/2] - in /spamassassin/trunk/rulesrc/scores: 72_scores.cf scores-set0 scores-set1 scores-set2 scores-set3 stats-set0 stats-set1

Modified: spamassassin/trunk/rulesrc/scores/scores-set3
URL: http://svn.apache.org/viewvc/spamassassin/trunk/rulesrc/scores/scores-set3?rev=1882031&r1=1882030&r2=1882031&view=diff
==============================================================================
--- spamassassin/trunk/rulesrc/scores/scores-set3 (original)
+++ spamassassin/trunk/rulesrc/scores/scores-set3 Sat Sep 26 03:25:10 2020
@@ -3,190 +3,190 @@
 
 score AC_BR_BONANZA                  0.001
 score AC_DIV_BONANZA                 0.001
-score AC_FROM_MANY_DOTS              2.027
+score AC_FROM_MANY_DOTS              1.906
 score AC_HTML_NONSENSE_TAGS          1.997
 score AC_POST_EXTRAS                 0.001
-score ADMITS_SPAM                    0.001
+score ADMITS_SPAM                    0.156
 score ADVANCE_FEE_2_NEW_MONEY        1.997
-score ADVANCE_FEE_3_NEW_MONEY        2.696
-score ADVANCE_FEE_4_NEW_MONEY        2.198
+score ADVANCE_FEE_3_NEW_MONEY        1.477
+score ADVANCE_FEE_4_NEW_MONEY        2.197
 score ADVANCE_FEE_5_NEW              2.896
-score AMAZON_IMG_NOT_RCVD_AMZN       0.301
+score AMAZON_IMG_NOT_RCVD_AMZN       0.993
 score AXB_XMAILER_MIMEOLE_OL_024C2   0.001
-score BITCOIN_DEADLINE               2.996
-score BITCOIN_EXTORT_01              4.712
+score BITCOIN_DEADLINE               2.843
+score BITCOIN_EXTORT_01              4.766
 score BITCOIN_MALF_HTML              3.496
-score BITCOIN_SPAM_02                2.038
+score BITCOIN_SPAM_02                1.532
 score BITCOIN_SPAM_04                1.498
-score BITCOIN_SPAM_05                1.749
+score BITCOIN_SPAM_05                2.076
 score BITCOIN_XPRIO                  2.497
-score BITCOIN_YOUR_INFO              0.615
+score BITCOIN_YOUR_INFO              0.577
 score BODY_URI_ONLY                  0.001
 score BOGUS_MIME_VERSION             3.496
-score CK_HELO_DYNAMIC_SPLIT_IP       0.593
+score CK_HELO_DYNAMIC_SPLIT_IP       0.314
 score CK_HELO_GENERIC                0.248
-score CTE_8BIT_MISMATCH              0.998
-score CTYPE_NULL                     2.394
+score CTE_8BIT_MISMATCH              0.999
+score CTYPE_NULL                     2.621
 score DKIMWL_BL                      2.996
-score DKIMWL_WL_HIGH                 -1.199
-score DKIMWL_WL_MED                  -0.001
+score DKIMWL_WL_HIGH                 -1.200
+score DKIMWL_WL_MED                  -0.001 # force non-zero
 score DOTGOV_IMAGE                   2.996
 score DSN_NO_MIMEVERSION             1.997
 score DX_TEXT_03                     0.898
-score END_FUTURE_EMAILS              1.048
-score FILL_THIS_FORM                 0.455
+score END_FUTURE_EMAILS              1.044
+score FILL_THIS_FORM                 1.394
 score FONT_INVIS_DIRECT              0.001
 score FONT_INVIS_DOTGOV              0.001
-score FONT_INVIS_LONG_LINE           0.009
+score FONT_INVIS_LONG_LINE           0.010
 score FONT_INVIS_MSGID               0.001
-score FONT_INVIS_POSTEXTRAS          2.019
+score FONT_INVIS_POSTEXTRAS          3.415
 score FORGED_RELAY_MUA_TO_MX         3.995
-score FORGED_SPF_HELO                1.997
-score FORM_FRAUD                     0.999
-score FORM_FRAUD_5                   2.896
+score FORGED_SPF_HELO                2.097
+score FORM_FRAUD                     0.998
+score FORM_FRAUD_5                   2.996
 score FOUND_YOU                      3.246
-score FREEMAIL_FORGED_FROMDOMAIN     0.001
-score FROM_2_EMAILS_SHORT            0.729
-score FROM_ADDR_WS                   2.996
+score FREEMAIL_FORGED_FROMDOMAIN     0.001 # force non-zero
+score FROM_2_EMAILS_SHORT            0.631
+score FROM_ADDR_WS                   2.816
 score FROM_FMBLA_NEWDOM              1.498
-score FROM_FMBLA_NEWDOM14            0.998
+score FROM_FMBLA_NEWDOM14            0.999
 score FROM_FMBLA_NEWDOM28            0.798
-score FROM_GOV_DKIM_AU               -0.001
+score FROM_GOV_DKIM_AU               -0.998
 score FROM_GOV_SPOOF                 0.998
 score FROM_MISSPACED                 0.001
 score FROM_MISSP_DYNIP               1.660
 score FROM_MISSP_EH_MATCH            0.001
-score FROM_MISSP_FREEMAIL            2.305
+score FROM_MISSP_FREEMAIL            0.651
 score FROM_MISSP_MSFT                0.001
-score FROM_MISSP_REPLYTO             0.001
-score FROM_MISSP_SPF_FAIL            1.999
-score FROM_MISSP_TO_UNDISC           0.322
+score FROM_MISSP_REPLYTO             0.001 # force non-zero
+score FROM_MISSP_SPF_FAIL            1.997
+score FROM_MISSP_TO_UNDISC           1.596
 score FROM_MISSP_USER                0.001
 score FROM_MISSP_XPRIO               0.001
 score FROM_NAME_EQ_TO_G_DRIVE        0.001
 score FROM_NTLD_REPLY_FREEMAIL       0.001
 score FROM_SUSPICIOUS_NTLD           0.498
-score FROM_SUSPICIOUS_NTLD_FP        1.156
-score FROM_UNBAL1                    2.186
-score FROM_WORDY                     1.970
+score FROM_SUSPICIOUS_NTLD_FP        1.075
+score FROM_UNBAL1                    2.381
+score FROM_WORDY                     2.092
 score FSL_BULK_SIG                   0.001
 score FSL_CTYPE_WIN1251              0.001
 score FSL_NEW_HELO_USER              0.001
-score FSL_THIS_IS_ADV                0.647
+score FSL_THIS_IS_ADV                0.487
 score GB_FREEMAIL_DISPTO             0.001
 score GB_GOOGLE_OBFUS                0.748
-score HDRS_LCASE                     0.098
+score HDRS_LCASE                     0.099
 score HDRS_LCASE_IMGONLY             0.099
-score HDR_ORDER_FTSDMCXX_DIRECT      0.810
-score HDR_ORDER_FTSDMCXX_NORDNS      0.723
-score HEADER_FROM_DIFFERENT_DOMAINS  0.248
-score HELO_MISC_IP                   0.027
+score HDR_ORDER_FTSDMCXX_DIRECT      0.821
+score HDR_ORDER_FTSDMCXX_NORDNS      0.581
+score HEADER_FROM_DIFFERENT_DOMAINS  0.249
+score HELO_MISC_IP                   0.149
 score HELO_NO_DOMAIN                 0.001
 score HK_RANDOM_FROM                 0.001
 score HK_RANDOM_REPLYTO              0.998
-score HK_SCAM                        1.100
-score HOSTED_IMG_DIRECT_MX           1.584
+score HK_SCAM                        0.897
+score HOSTED_IMG_DIRECT_MX           2.116
 score HTML_OFF_PAGE                  0.001
-score HTML_SINGLET_MANY              0.973
+score HTML_SINGLET_MANY              0.001
 score HTML_TEXT_INVISIBLE_FONT       2.996
-score HTML_TEXT_INVISIBLE_STYLE      2.982
+score HTML_TEXT_INVISIBLE_STYLE      2.744
 score IMG_ONLY_FM_DOM_INFO           2.497
-score KB_FORGED_MOZ4                 2.963
-score KHOP_FAKE_EBAY                 0.473
-score KHOP_HELO_FCRDNS               0.275
-score LH_URI_DOM_IN_PATH             2.175
-score LIST_PRTL_SAME_USER            0.456
-score LONG_HEX_URI                   1.686
-score LONG_IMG_URI                   0.919
-score LONG_INVISIBLE_TEXT            1.849
+score KB_FORGED_MOZ4                 2.470
+score KHOP_FAKE_EBAY                 0.228
+score KHOP_HELO_FCRDNS               0.274
+score LH_URI_DOM_IN_PATH             2.331
+score LIST_PRTL_SAME_USER            0.978
+score LONG_HEX_URI                   1.580
+score LONG_IMG_URI                   1.738
+score LONG_INVISIBLE_TEXT            1.850
 score LOTS_OF_MONEY                  0.010
-score MANY_SPAN_IN_TEXT              1.435
-score MILLION_HUNDRED                0.536
-score MIMEOLE_DIRECT_TO_MX           0.001
+score MANY_SPAN_IN_TEXT              1.436
+score MILLION_HUNDRED                0.535
+score MIMEOLE_DIRECT_TO_MX           0.001 # force non-zero
 score MIME_NO_TEXT                   0.001
 score MIXED_ES                       2.696
-score MONEY_FORM_SHORT               1.513
-score MONEY_FRAUD_3                  0.870
-score MONEY_FRAUD_5                  0.488
-score MONEY_FRAUD_8                  0.771
+score MONEY_FORM_SHORT               0.001
+score MONEY_FRAUD_3                  0.873
+score MONEY_FRAUD_5                  1.036
+score MONEY_FRAUD_8                  1.983
 score MONEY_FROM_MISSP               1.997
-score MSM_PRIO_REPTO                 2.272
-score NICE_REPLY_A                   -0.238
-score NORDNS_LOW_CONTRAST            1.056
+score MSM_PRIO_REPTO                 2.168
+score NICE_REPLY_A                   -0.213
+score NORDNS_LOW_CONTRAST            1.132
 score NO_FM_NAME_IP_HOSTN            0.001
 score NSL_RCVD_FROM_USER             0.001
-score NSL_RCVD_HELO_USER             1.710
-score PDS_BTC_ID                     0.499
-score PDS_BTC_MSGID                  0.001 # force non-zero
-score PDS_EMPTYSUBJ_URISHRT          0.001
+score NSL_RCVD_HELO_USER             1.415
+score PDS_BTC_ID                     0.498
+score PDS_BTC_MSGID                  0.001
+score PDS_EMPTYSUBJ_URISHRT          0.161
 score PDS_FREEMAIL_REPLYTO_URISHRT   1.498
 score PDS_FRNOM_TODOM_NAKED_TO       1.498
-score PDS_FROM_2_EMAILS              1.997
+score PDS_FROM_2_EMAILS              2.097
 score PDS_FROM_NAME_TO_DOMAIN        0.998
 score PDS_NAKED_TO_NUMERO            1.997
-score PDS_SHORTFWD_URISHRT           1.223
-score PDS_TINYSUBJ_URISHRT           1.272
-score PDS_TONAME_EQ_TOLOCAL_FREEM_FORGE 1.496
+score PDS_SHORTFWD_URISHRT           1.498
+score PDS_TINYSUBJ_URISHRT           1.270
+score PDS_TONAME_EQ_TOLOCAL_FREEM_FORGE 0.971
 score PDS_TONAME_EQ_TOLOCAL_HDRS_LCASE 1.997
 score PDS_TONAME_EQ_TOLOCAL_VSHORT   0.998
 score PDS_TO_EQ_FROM_NAME            0.001
 score PHP_ORIG_SCRIPT                2.497
 score PP_MIME_FAKE_ASCII_TEXT        0.998
-score RATWARE_NO_RDNS                1.354
+score RATWARE_NO_RDNS                1.668
 score RCVD_IN_MSPIKE_H2              -0.001
 score RISK_FREE                      2.896
-score SENDGRID_REDIR                 1.499
-score SENDGRID_REDIR_PHISH           3.454
-score SERGIO_SUBJECT_VIAGRA01        2.622
+score SENDGRID_REDIR                 1.498
+score SENDGRID_REDIR_PHISH           3.499
+score SERGIO_SUBJECT_VIAGRA01        2.628
 score SHORTENED_URL_SRC              2.996
-score SHORTENER_SHORT_IMG            0.287
-score SHORT_BODY_G_DRIVE_DYN         0.519
+score SHORTENER_SHORT_IMG            0.009
+score SHORT_BODY_G_DRIVE_DYN         0.545
 score SHORT_SHORTNER                 1.997
 score SINGLETS_LOW_CONTRAST          0.001
 score SPOOFED_FREEMAIL               1.997
-score SPOOFED_FREEMAIL_NO_RDNS       0.274
-score SPOOFED_FREEM_REPTO            1.975
-score SPOOFED_FREEM_REPTO_CHN        0.630
+score SPOOFED_FREEMAIL_NO_RDNS       0.527
+score SPOOFED_FREEM_REPTO            1.995
+score SPOOFED_FREEM_REPTO_CHN        2.477
 score STATIC_XPRIO_OLE               1.997
-score STOCK_LOW_CONTRAST             0.212
+score STOCK_LOW_CONTRAST             0.190
 score SUBJ_OBFU_PUNCT_FEW            0.748
 score SUBJ_OBFU_PUNCT_MANY           1.747
-score SUSP_UTF8_WORD_COMBO           0.462
+score SUSP_UTF8_WORD_COMBO           0.389
 score SUSP_UTF8_WORD_FROM            1.997
 score SUSP_UTF8_WORD_SUBJ            1.997
 score THIS_AD                        1.398
-score TONOM_EQ_TOLOC_SHRT_SHRTNER    1.315
-score TO_EQ_FM_DOM_HTML_IMG          0.632
-score TO_EQ_FM_DOM_HTML_ONLY         1.701
+score TONOM_EQ_TOLOC_SHRT_SHRTNER    1.266
+score TO_EQ_FM_DOM_HTML_IMG          0.267
+score TO_EQ_FM_DOM_HTML_ONLY         1.603
 score TO_EQ_FM_DOM_SPF_FAIL          0.001
-score TO_EQ_FM_HTML_ONLY             0.829
-score TO_EQ_FM_SPF_FAIL              1.824
-score TO_IN_SUBJ                     0.098
+score TO_EQ_FM_HTML_ONLY             0.772
+score TO_EQ_FM_SPF_FAIL              1.732
+score TO_IN_SUBJ                     0.099
 score TO_NO_BRKTS_FROM_MSSP          2.497
-score TO_NO_BRKTS_HTML_IMG           1.787
-score TO_NO_BRKTS_HTML_ONLY          1.998
-score TO_NO_BRKTS_MSFT               2.335
+score TO_NO_BRKTS_HTML_IMG           1.785
+score TO_NO_BRKTS_HTML_ONLY          1.997
+score TO_NO_BRKTS_MSFT               2.326
 score TO_NO_BRKTS_NORDNS_HTML        1.997
-score TVD_RCVD_SPACE_BRACKET         4.299
+score TVD_RCVD_SPACE_BRACKET         4.138
 score TVD_SPACE_ENCODED              0.001
 score TVD_SPACE_RATIO_MINFP          0.001
-score UPGRADE_MAILBOX                1.797
+score UPGRADE_MAILBOX                1.897
 score URI_DOTEDU                     0.001
 score URI_DOTEDU_ENTITY              2.996
-score URI_DOTEDU_LONG                0.001 # force non-zero
-score URI_GOOGLE_PROXY               0.375
+score URI_DOTEDU_LONG                0.001
+score URI_GOOGLE_PROXY               0.212
 score URI_IMG_WP_REDIR               2.996
-score URI_IN_URI_10                  1.290
-score URI_IN_URI_5                   2.557
-score URI_ONLY_MSGID_MALF            0.860
-score URI_PHISH                      3.151
+score URI_IN_URI_10                  2.342
+score URI_IN_URI_5                   2.211
+score URI_ONLY_MSGID_MALF            0.932
+score URI_PHISH                      3.095
 score URI_PHP_REDIR                  3.496
-score URI_TRY_3LD                    1.995
+score URI_TRY_3LD                    1.707
 score URI_WPADMIN                    2.696
-score URI_WP_DIRINDEX                2.820
+score URI_WP_DIRINDEX                2.666
 score URI_WP_HACKED                  3.496
-score URI_WP_HACKED_2                2.497
-score XPRIO_SHORT_SUBJ               1.445
+score URI_WP_HACKED_2                2.498
+score XPRIO_SHORT_SUBJ               1.444
 score AC_SPAMMY_URI_PATTERNS1        1.000
 score AC_SPAMMY_URI_PATTERNS10       1.000
 score AC_SPAMMY_URI_PATTERNS11       1.000

Modified: spamassassin/trunk/rulesrc/scores/stats-set0
URL: http://svn.apache.org/viewvc/spamassassin/trunk/rulesrc/scores/stats-set0?rev=1882031&r1=1882030&r2=1882031&view=diff
==============================================================================
--- spamassassin/trunk/rulesrc/scores/stats-set0 (original)
+++ spamassassin/trunk/rulesrc/scores/stats-set0 Sat Sep 26 03:25:10 2020
@@ -1,40 +1,40 @@
 ##### WITH NEW RULES AND SCORES #####
 
 # SUMMARY for threshold 5.0:
-# Correctly non-spam: 849841  50.787%  (99.480% of non-spam corpus)
-# Correctly spam:     667031  39.862%  (81.439% of spam corpus)
-# False positives:      4441  0.265%  (0.520% of nonspam, 140468 weighted)
-# False negatives:    152020  9.085%  (18.561% of spam, 387374 weighted)
-# Average score for spam:  8.5    nonspam: 0.5
-# Average for false-pos:   6.6  false-neg: 2.5
-# TOTAL:              1673333  100.00%
+# Correctly non-spam: 851368  52.911%  (99.595% of non-spam corpus)
+# Correctly spam:     607320  37.744%  (80.521% of spam corpus)
+# False positives:      3463  0.215%  (0.405% of nonspam, 107634 weighted)
+# False negatives:    146920  9.131%  (19.479% of spam, 371661 weighted)
+# Average score for spam:  8.7    nonspam: 0.5
+# Average for false-pos:   7.0  false-neg: 2.5
+# TOTAL:              1609071  100.00%
 
 Reading scores from "tmprules"...
 Reading per-message hit stat logs and scores...
 
 # SUMMARY for threshold 5.0:
-# Correctly non-spam: 106022  99.50%
-# Correctly spam:      83349  81.61%
-# False positives:       531  0.50%
-# False negatives:     18778  18.39%
-# TCR(l=50): 2.253067  SpamRecall: 81.613%  SpamPrec: 99.367%
+# Correctly non-spam: 106025  99.43%
+# Correctly spam:      75843  80.65%
+# False positives:       605  0.57%
+# False negatives:     18192  19.35%
+# TCR(l=50): 1.941187  SpamRecall: 80.654%  SpamPrec: 99.209%
 
 ##### WITHOUT NEW RULES AND SCORES #####
 Reading scores from "../rules-base"...
 Reading per-message hit stat logs and scores...
 
 # SUMMARY for threshold 5.0:
-# Correctly non-spam: 845709  99.00%
-# Correctly spam:     267015  32.60%
-# False positives:      8573  1.00%
-# False negatives:    552036  67.40%
-# TCR(l=50): 0.835182  SpamRecall: 32.601%  SpamPrec: 96.889%
+# Correctly non-spam: 846280  99.00%
+# Correctly spam:     246418  32.67%
+# False positives:      8551  1.00%
+# False negatives:    507822  67.33%
+# TCR(l=50): 0.806353  SpamRecall: 32.671%  SpamPrec: 96.646%
 Reading scores from "../rules-base"...
 Reading per-message hit stat logs and scores...
 
 # SUMMARY for threshold 5.0:
-# Correctly non-spam: 105489  99.00%
-# Correctly spam:      33230  32.54%
-# False positives:      1064  1.00%
-# False negatives:     68897  67.46%
-# TCR(l=50): 0.836442  SpamRecall: 32.538%  SpamPrec: 96.897%
+# Correctly non-spam: 105554  98.99%
+# Correctly spam:      30506  32.44%
+# False positives:      1076  1.01%
+# False negatives:     63529  67.56%
+# TCR(l=50): 0.801464  SpamRecall: 32.441%  SpamPrec: 96.593%

Modified: spamassassin/trunk/rulesrc/scores/stats-set1
URL: http://svn.apache.org/viewvc/spamassassin/trunk/rulesrc/scores/stats-set1?rev=1882031&r1=1882030&r2=1882031&view=diff
==============================================================================
--- spamassassin/trunk/rulesrc/scores/stats-set1 (original)
+++ spamassassin/trunk/rulesrc/scores/stats-set1 Sat Sep 26 03:25:10 2020
@@ -1,40 +1,40 @@
 ##### WITH NEW RULES AND SCORES #####
 
 # SUMMARY for threshold 5.0:
-# Correctly non-spam: 852983  45.003%  (99.667% of non-spam corpus)
-# Correctly spam:     974384  51.408%  (93.729% of spam corpus)
-# False positives:      2849  0.150%  (0.333% of nonspam, 269580 weighted)
-# False negatives:     65191  3.439%  (6.271% of spam, 134585 weighted)
+# Correctly non-spam: 853130  45.012%  (99.685% of non-spam corpus)
+# Correctly spam:     975154  51.450%  (93.810% of spam corpus)
+# False positives:      2699  0.142%  (0.315% of nonspam, 261186 weighted)
+# False negatives:     64342  3.395%  (6.190% of spam, 130938 weighted)
 # Average score for spam:  14.3    nonspam: -1.4
-# Average for false-pos:   7.8  false-neg: 2.1
-# TOTAL:              1895407  100.00%
+# Average for false-pos:   8.0  false-neg: 2.0
+# TOTAL:              1895325  100.00%
 
 Reading scores from "tmprules"...
 Reading per-message hit stat logs and scores...
 
 # SUMMARY for threshold 5.0:
-# Correctly non-spam: 106375  99.64%
-# Correctly spam:     121871  93.91%
-# False positives:       387  0.36%
-# False negatives:      7904  6.09%
-# TCR(l=50): 4.761686  SpamRecall: 93.909%  SpamPrec: 99.683%
+# Correctly non-spam: 106370  99.63%
+# Correctly spam:     121814  93.87%
+# False positives:       392  0.37%
+# False negatives:      7948  6.13%
+# TCR(l=50): 4.710396  SpamRecall: 93.875%  SpamPrec: 99.679%
 
 ##### WITHOUT NEW RULES AND SCORES #####
 Reading scores from "../rules-base"...
 Reading per-message hit stat logs and scores...
 
 # SUMMARY for threshold 5.0:
-# Correctly non-spam: 852518  99.61%
-# Correctly spam:     605835  58.28%
-# False positives:      3314  0.39%
-# False negatives:    433740  41.72%
-# TCR(l=50): 1.734244  SpamRecall: 58.277%  SpamPrec: 99.456%
+# Correctly non-spam: 852494  99.61%
+# Correctly spam:     605998  58.30%
+# False positives:      3335  0.39%
+# False negatives:    433498  41.70%
+# TCR(l=50): 1.731778  SpamRecall: 58.297%  SpamPrec: 99.453%
 Reading scores from "../rules-base"...
 Reading per-message hit stat logs and scores...
 
 # SUMMARY for threshold 5.0:
-# Correctly non-spam: 106336  99.60%
-# Correctly spam:      75626  58.27%
-# False positives:       426  0.40%
-# False negatives:     54149  41.73%
-# TCR(l=50): 1.720036  SpamRecall: 58.275%  SpamPrec: 99.440%
+# Correctly non-spam: 106365  99.63%
+# Correctly spam:      75532  58.21%
+# False positives:       397  0.37%
+# False negatives:     54230  41.79%
+# TCR(l=50): 1.751647  SpamRecall: 58.208%  SpamPrec: 99.477%