You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@community.apache.org by se...@apache.org on 2016/04/11 00:11:53 UTC

svn commit: r1738472 - /comdev/reporter.apache.org/trunk/scripts/mailglomper2.py

Author: sebb
Date: Sun Apr 10 22:11:53 2016
New Revision: 1738472

URL: http://svn.apache.org/viewvc?rev=1738472&view=rev
Log:
Start reducing the lists we look at

Modified:
    comdev/reporter.apache.org/trunk/scripts/mailglomper2.py

Modified: comdev/reporter.apache.org/trunk/scripts/mailglomper2.py
URL: http://svn.apache.org/viewvc/comdev/reporter.apache.org/trunk/scripts/mailglomper2.py?rev=1738472&r1=1738471&r2=1738472&view=diff
==============================================================================
--- comdev/reporter.apache.org/trunk/scripts/mailglomper2.py (original)
+++ comdev/reporter.apache.org/trunk/scripts/mailglomper2.py Sun Apr 10 22:11:53 2016
@@ -191,6 +191,10 @@ signal.signal(signal.SIGTERM, handle)
 lastCheckpoint = time.time() # when output files were last saved
 for mlist in re.finditer(r"<a href='([-a-z0-9]+)/'", data):
     ml = mlist.group(1)
+    # TODO: reject all but current projects; meanwhile, skip the lists we know we don't want:
+    if ml.startswith('www-'):
+        continue # don't want the ASF-level 'www-' mailing lists
+    
     tsprint("Processing: " + ml)
     start = time.time()
     mls[ml] = {}