You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@spamassassin.apache.org by mm...@apache.org on 2015/03/11 01:37:46 UTC
svn commit: r1665746 - /spamassassin/trunk/lib/Mail/SpamAssassin/Util.pm
Author: mmartinec
Date: Wed Mar 11 00:37:45 2015
New Revision: 1665746
URL: http://svn.apache.org/r1665746
Log:
Bug 6751: Certain Character Sets can use alternate characters - add ONE DOT LEADER (U+2024) for good measure
Modified:
spamassassin/trunk/lib/Mail/SpamAssassin/Util.pm
Modified: spamassassin/trunk/lib/Mail/SpamAssassin/Util.pm
URL: http://svn.apache.org/viewvc/spamassassin/trunk/lib/Mail/SpamAssassin/Util.pm?rev=1665746&r1=1665745&r2=1665746&view=diff
==============================================================================
--- spamassassin/trunk/lib/Mail/SpamAssassin/Util.pm (original)
+++ spamassassin/trunk/lib/Mail/SpamAssassin/Util.pm Wed Mar 11 00:37:45 2015
@@ -1321,8 +1321,9 @@ sub uri_list_canonicalize {
# [...] Only the IDEOGRAPHIC FULL STOP character (U+3002) is added in
# this mapping because the authors have not fully investigated [...]
# Adding also 'SMALL FULL STOP' (U+FE52) as seen in the wild.
+ # Perhaps also the 'ONE DOT LEADER' (U+2024).
if ($host =~ s{(?: \xE3\x80\x82 | \xEF\xBC\x8E | \xEF\xBD\xA1 |
- \xEF\xB9\x92 )}{.}xgs) {
+ \xEF\xB9\x92 | \xE2\x80\xA4 )}{.}xgs) {
push(@nuris, join ('', $proto, $host, $rest));
}