[Blends-commit] r3105 - /blends/trunk/team_analysis_tools/get-archive-pages

tille at users.alioth.debian.org tille at users.alioth.debian.org
Thu Jan 5 22:13:32 UTC 2012


Author: tille
Date: Thu Jan  5 22:13:31 2012
New Revision: 3105

URL: http://svn.debian.org/wsvn/blends/?sc=1&rev=3105
Log:
Handle spammy subjects

Modified:
    blends/trunk/team_analysis_tools/get-archive-pages

Modified: blends/trunk/team_analysis_tools/get-archive-pages
URL: http://svn.debian.org/wsvn/blends/blends/trunk/team_analysis_tools/get-archive-pages?rev=3105&op=diff
==============================================================================
--- blends/trunk/team_analysis_tools/get-archive-pages (original)
+++ blends/trunk/team_analysis_tools/get-archive-pages Thu Jan  5 22:13:31 2012
@@ -333,11 +333,20 @@
 					last;
 				    }
 				}
+			        # a subject matching any pattern in @SPAMSUBJECTS also marks the mail as spam
+			        my $spamsubject;
+			        my $numspamsubjects = 0;
+				foreach $spamsubject (@SPAMSUBJECTS) {
+				    if ( $subject =~ /$spamsubject/ ) {
+					$numspamsubjects = 1;
+					last;
+				    }
+				}
 				# authors with strange names also provide spam
 			        my $countstrangechars = 0;
 			        while ($author =~ /;\s*&#x[\dA-F][\dA-F][\dA-F]/g) { $countstrangechars++ }
 			        
-				if ( $author =~ /^[-&#x\d;\sA-F\?:,]+$/ || $countstrangechars > 7 || $numspamauthors > 0 ) {
+				if ( $author =~ /^[-&#x\d;\sA-F\?:,]+$/ || $countstrangechars > 7 || $numspamauthors > 0 || $numspamsubjects > 0 ) {
                                     # $author =~ /info/i ) { # never had a non-spam message from an author whos name contains info
                                     # This is not reliable: We have for instance
                                     #   http://lists.debian.org/debian-security/2003/07/msg00054.html




More information about the Blends-commit mailing list