You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@spamassassin.apache.org by jh...@apache.org on 2020/05/08 00:10:45 UTC

svn commit: r1877489 - /spamassassin/trunk/rulesrc/sandbox/jhardin/20_misc_testing.cf

Author: jhardin
Date: Fri May  8 00:10:45 2020
New Revision: 1877489

URL: http://svn.apache.org/viewvc?rev=1877489&view=rev
Log:
four-byte-UTF8 tuning

Modified:
    spamassassin/trunk/rulesrc/sandbox/jhardin/20_misc_testing.cf

Modified: spamassassin/trunk/rulesrc/sandbox/jhardin/20_misc_testing.cf
URL: http://svn.apache.org/viewvc/spamassassin/trunk/rulesrc/sandbox/jhardin/20_misc_testing.cf?rev=1877489&r1=1877488&r2=1877489&view=diff
==============================================================================
--- spamassassin/trunk/rulesrc/sandbox/jhardin/20_misc_testing.cf (original)
+++ spamassassin/trunk/rulesrc/sandbox/jhardin/20_misc_testing.cf Fri May  8 00:10:45 2020
@@ -2977,3 +2977,11 @@ body       WE_PAID                     /
 body       MAKE_XTRA_DOLLAR            /\bmake an extra dollar\b/i
 body       BONUS_LAST_DAY              /\b(?:last|final) day of the (?:\$\d+ |\d+ dollars? )?bonus offer(?:ing)?\b/i
 
+body       __4BYTE_UTF8_WORD           /(?:\xf0\x9d[\x90-\x9f][\x80-\xbf]){3,10}/
+tflags     __4BYTE_UTF8_WORD           multiple, maxhits=10
+meta       SUSP_UTF8_WORD_MANY         __4BYTE_UTF8_WORD > 9
+describe   SUSP_UTF8_WORD_MANY         Many words using only suspicious UTF-8 characters
+score      SUSP_UTF8_WORD_MANY         3.000	# limit
+
+
+