You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@spamassassin.apache.org by mm...@apache.org on 2015/03/11 01:37:46 UTC

svn commit: r1665746 - /spamassassin/trunk/lib/Mail/SpamAssassin/Util.pm

Author: mmartinec
Date: Wed Mar 11 00:37:45 2015
New Revision: 1665746

URL: http://svn.apache.org/r1665746
Log:
Bug 6751: Certain Character Sets can use alternate characters - add ONE DOT LEADER (U+2024) for good measure

Modified:
    spamassassin/trunk/lib/Mail/SpamAssassin/Util.pm

Modified: spamassassin/trunk/lib/Mail/SpamAssassin/Util.pm
URL: http://svn.apache.org/viewvc/spamassassin/trunk/lib/Mail/SpamAssassin/Util.pm?rev=1665746&r1=1665745&r2=1665746&view=diff
==============================================================================
--- spamassassin/trunk/lib/Mail/SpamAssassin/Util.pm (original)
+++ spamassassin/trunk/lib/Mail/SpamAssassin/Util.pm Wed Mar 11 00:37:45 2015
@@ -1321,8 +1321,9 @@ sub uri_list_canonicalize {
       #   [...] Only the IDEOGRAPHIC FULL STOP character (U+3002) is added in
       #   this mapping because the authors have not fully investigated [...]
       # Adding also 'SMALL FULL STOP' (U+FE52) as seen in the wild.
+      # Perhaps also the 'ONE DOT LEADER' (U+2024).
       if ($host =~ s{(?: \xE3\x80\x82 | \xEF\xBC\x8E | \xEF\xBD\xA1 |
-                         \xEF\xB9\x92 )}{.}xgs) {
+                         \xEF\xB9\x92 | \xE2\x80\xA4 )}{.}xgs) {
         push(@nuris, join ('', $proto, $host, $rest));
       }