You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@community.apache.org by se...@apache.org on 2016/04/11 00:11:53 UTC
svn commit: r1738472 - /comdev/reporter.apache.org/trunk/scripts/mailglomper2.py
Author: sebb
Date: Sun Apr 10 22:11:53 2016
New Revision: 1738472
URL: http://svn.apache.org/viewvc?rev=1738472&view=rev
Log:
Start reducing the lists we look at
Modified:
comdev/reporter.apache.org/trunk/scripts/mailglomper2.py
Modified: comdev/reporter.apache.org/trunk/scripts/mailglomper2.py
URL: http://svn.apache.org/viewvc/comdev/reporter.apache.org/trunk/scripts/mailglomper2.py?rev=1738472&r1=1738471&r2=1738472&view=diff
==============================================================================
--- comdev/reporter.apache.org/trunk/scripts/mailglomper2.py (original)
+++ comdev/reporter.apache.org/trunk/scripts/mailglomper2.py Sun Apr 10 22:11:53 2016
@@ -191,6 +191,10 @@ signal.signal(signal.SIGTERM, handle)
lastCheckpoint = time.time() # when output files were last saved
for mlist in re.finditer(r"<a href='([-a-z0-9]+)/'", data):
ml = mlist.group(1)
+ # TODO reject all but current projects, meanwhile we don't want these:
+ if ml.startswith('www-'):
+ continue # don't want ASF mailing lists
+
tsprint("Processing: " + ml)
start = time.time()
mls[ml] = {}