Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
- #!/usr/bin/python
- # -*- coding: utf-8 -*-
- from bs4 import BeautifulSoup
- import re
- import urllib2
# Address of a profile page on the EKS portal; the numeric profile id is appended.
BASE_URL = 'https://portal.eks.sk/SpravaDodavatelov/VerejnyProfilDodavatela/Detail/'
FIRST_ID = 1
LAST_ID = 9999  # inclusive; the original loop ran while number < 10000
OUTPUT_PATH = 'EKS.txt'
REQUEST_TIMEOUT = 30  # seconds; without a timeout one stalled request blocks the whole run

# Deliberately loose "something@something" pattern, compiled once for the whole run.
EMAIL_PATTERN = re.compile(r"([\w.-]+)@([\w.-]+)")


def extract_email(text):
    """Return the first e-mail-like token found in *text*, or None if there is none."""
    match = EMAIL_PATTERN.search(text)
    return match.group() if match else None


def fetch_email(number):
    """Download profile page *number* and return the first address in its <p> tags.

    Returns None when the page contains no address. Network and parsing
    errors are left to propagate so the caller decides how to report them.
    """
    page = urllib2.urlopen(BASE_URL + str(number), timeout=REQUEST_TIMEOUT)
    try:
        html = page.read()
    finally:
        # Always release the connection, even if reading the body fails.
        page.close()
    # Name the parser explicitly so results do not depend on which optional
    # parser libraries happen to be installed on the machine.
    paragraphs = BeautifulSoup(html, "html.parser").select("p")
    # Search the serialized tags (not just their text) so addresses that only
    # appear in attributes such as mailto: links are still found.
    return extract_email(str(paragraphs))


def main():
    """Scan every profile id, print each address found and append the results to a file.

    Each address is printed next to its profile id as it is found. The
    collected addresses (first occurrence only, in discovery order) are
    printed and appended to OUTPUT_PATH at the end, including when the run
    is interrupted part-way through.
    """
    emails = []
    seen = set()
    try:
        for number in range(FIRST_ID, LAST_ID + 1):
            try:
                email = fetch_email(number)
            except Exception:
                # Best-effort scrape: a broken page must not stop the run.
                # Unlike a bare ``except``, this lets Ctrl-C and SystemExit
                # through so the script can actually be stopped.
                print("Error on site")
                continue
            if email is None:
                # No address on the page; reported the same way as before.
                print("Error on site")
                continue
            print("%s   %s" % (number, email))
            if email not in seen:
                seen.add(email)
                emails.append(email)
    finally:
        # Runs on normal completion and on interruption, so partial results
        # are never lost.
        print(emails)
        with open(OUTPUT_PATH, 'a') as out:
            out.write(str(emails))


if __name__ == "__main__":
    main()
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement