Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
# -*- coding: utf-8 -*-
"""Collect free-mail addresses from zakupki.gov.ru notification print forms.

Walks notification ids downward from ``START_ID`` (``ID_SPAN`` + 1 ids in
total), downloads each print form, extracts addresses at mail.ru, inbox.ru,
bk.ru and list.ru, and writes the de-duplicated, sorted result to
``OUTPUT_PATH``, one address per line.

Runs on both Python 2 and Python 3.

NOTE(review): the harvested addresses are personal contact data; confirm
that collecting them is permitted by the site's terms and applicable law
before running this script.
"""
import contextlib
import re
import sys

try:  # Python 2
    import urllib2 as urlrequest
    from httplib import HTTPException
except ImportError:  # Python 3
    import urllib.request as urlrequest
    from http.client import HTTPException

START_ID = 7364866
ID_SPAN = 15000
BASE_URL = 'http://zakupki.gov.ru/pgz/printForm?type=NOTIFICATION&id='
OUTPUT_PATH = 'emails.txt'
REQUEST_TIMEOUT = 30  # seconds; keeps one stalled connection from hanging the run

# Bytes pattern: ``\w`` stays ASCII-only on every Python version, which is
# what the pattern matched on Python 2 byte strings.
EMAIL_RE = re.compile(br'([-._\w]+@(?:mail|inbox|bk|list)\.ru)', re.I)


def extract_emails(data):
    """Return every matching address found in *data*, in order of appearance.

    *data* may be a byte string (as returned by the HTTP response) or text;
    text is encoded as UTF-8 before matching. Duplicates are kept. Results
    are native ``str`` objects.
    """
    if not isinstance(data, bytes):
        data = data.encode('utf-8')
    # Matches contain only ASCII characters, so decoding cannot fail.
    return [
        hit if isinstance(hit, str) else hit.decode('ascii')
        for hit in EMAIL_RE.findall(data)
    ]


def main():
    """Scan the id range, print progress, and write the unique addresses."""
    opener = urlrequest.build_opener()
    # Plain browser-like User-Agent. The previous value embedded an SQL
    # injection payload, which is hostile to the server and served no
    # purpose for the download.
    opener.addheaders = [('User-agent', 'Mozilla/5.0')]

    emails = []
    limit = START_ID - ID_SPAN
    for notice_id in range(START_ID, limit - 1, -1):
        url = BASE_URL + str(notice_id)
        try:
            with contextlib.closing(
                    opener.open(url, timeout=REQUEST_TIMEOUT)) as response:
                data = response.read()
        except (IOError, HTTPException) as exc:
            # Best effort: a missing or failing notice is reported and
            # skipped. Other exceptions (including Ctrl-C) propagate.
            sys.stderr.write('id %d skipped: %s\n' % (notice_id, exc))
        else:
            emails += extract_emails(data)
        # Progress: addresses collected so far (with duplicates), then the
        # number of ids still to visit.
        print(len(emails))
        print(notice_id - limit)

    # Sorted so that repeated runs produce a stable file.
    with open(OUTPUT_PATH, 'w') as out:
        out.write('\n'.join(sorted(set(emails))))


if __name__ == '__main__':
    main()
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement