You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@spamassassin.apache.org by he...@apache.org on 2021/04/13 10:42:01 UTC
svn commit: r1888720 - /spamassassin/trunk/lib/Mail/SpamAssassin/Plugin/Bayes.pm
Author: hege
Date: Tue Apr 13 10:42:01 2021
New Revision: 1888720
URL: http://svn.apache.org/viewvc?rev=1888720&view=rev
Log:
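Fix previous fix: label the per-token foreach loop in _tokenize_line as TOKEN and use "next TOKEN" in the stopword branch, so that a stopword match skips the whole token instead of only advancing whichever loop is innermost at that point.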
Modified:
spamassassin/trunk/lib/Mail/SpamAssassin/Plugin/Bayes.pm
Modified: spamassassin/trunk/lib/Mail/SpamAssassin/Plugin/Bayes.pm
URL: http://svn.apache.org/viewvc/spamassassin/trunk/lib/Mail/SpamAssassin/Plugin/Bayes.pm?rev=1888720&r1=1888719&r2=1888720&view=diff
==============================================================================
--- spamassassin/trunk/lib/Mail/SpamAssassin/Plugin/Bayes.pm (original)
+++ spamassassin/trunk/lib/Mail/SpamAssassin/Plugin/Bayes.pm Tue Apr 13 10:42:01 2021
@@ -1253,7 +1253,7 @@ sub _tokenize_line {
# cleared, even if the source string has perl characters semantics !!!
# Is this really still desirable?
- foreach my $token (split) {
+TOKEN: foreach my $token (split) {
$token =~ s/^[-'"\.,]+//; # trim non-alphanum chars at start or end
$token =~ s/[-'"\.,]+$//; # so we don't get loads of '"foo' tokens
@@ -1279,7 +1279,7 @@ sub _tokenize_line {
if ($token =~ /^$self->{bayes_stopword}{$lang}$/i) {
dbg("bayes: skipped token '$token' because it's in stopword list for language '$lang'");
$self->{stopword_cache}{$token} = 1;
- next;
+ next TOKEN;
}
}
$self->{stopword_cache}{$token} = 0;