My favorites | Sign in
Project Home Wiki Issues Source
Checkout   Browse   Changes    
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
#!/bin/env python
# -*- coding: utf8 -*-

import os
import sys
import mailbox
import re
import urllib

def _iter_bodies(message):
    """Yield the payload of every non-multipart part of *message*.

    Multipart containers are walked recursively; each leaf part
    contributes the value of ``get_payload(decode=True)``.
    """
    if message.is_multipart():
        for part in message.get_payload():
            for body in _iter_bodies(part):
                yield body
    else:
        yield message.get_payload(decode=True)


def run():
    """Print the ``http://`` URIs found in the ``Junk.Both`` mail folder.

    Opens the Maildir at ``~/Maildir``, walks every message of its
    ``Junk.Both`` folder and prints, one per line, the URIs found in each
    body part.  URIs are de-duplicated per body part only, so the same URI
    can still be printed several times over a whole run.
    """
    # Raw string so ``\s`` reaches the regex engine untouched.  A URI stops
    # at whitespace, either kind of quote, ``=``, ``<`` or ``>``; ``+``
    # requires at least one character after the scheme so that a bare
    # "http://" is not reported as a URI.
    get_href = re.compile(r"http://[^\s\"'=<>]+")
    mbox = mailbox.Maildir(os.path.expanduser("~/Maildir"),
                           factory=mailbox.MaildirMessage)  # use newer email.message.Message
    junk = mbox.get_folder("Junk.Both")
    for message in junk:
        for body in _iter_bodies(message):
            if not body:
                # Nothing to scan (empty or missing payload).
                continue
            for uri in set(get_href.findall(body)):
                print(uri)

if __name__ == "__main__":
    # Any extra command-line argument is treated as a request for the usage
    # text; with no arguments the script does its real work.
    if len(sys.argv) <= 1:
        run()
    else:
        usage_lines = (
            "SpamFight, generate traffic against spammed urls!",
            "Usage:",
            " python %s | xargs -n1 -P5 curl > /dev/null" % sys.argv[0],
        )
        for usage_line in usage_lines:
            print(usage_line)

Change log

r263 by matteo.bertini on Sep 22, 2008   Diff
Add parallel xargs run
Go to: 
Project members, sign in to write a code review

Older revisions

r262 by matteo.bertini on Sep 22, 2008   Diff
Maildir parser for spammed uri
All revisions of this file

File info

Size: 1002 bytes, 34 lines

File properties

svn:eol-style
native
Powered by Google Project Hosting