Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
"""Print the text of every third link found on http://directory.io/.

The page is downloaded once, parsed with BeautifulSoup, and the stripped
text of the anchors at positions 0, 3, 6, ... is printed one per line.
An anchor whose text is exactly "previous" is skipped.
"""
import getpass
import string
import urllib
import urllib.request
from urllib.request import Request, urlopen

from bs4 import BeautifulSoup

# urlopen() itself takes no ``headers`` argument, so the User-Agent has to be
# attached to a Request object.
# NOTE(review): presumably the site rejects urllib's default User-Agent --
# confirm before removing the header.
req = Request('http://directory.io/', headers={'User-Agent': 'Mozilla/5.0'})

# The context manager closes the HTTP response as soon as the body is read.
with urlopen(req) as response:
    webpage = response.read()

soup = BeautifulSoup(webpage, 'html.parser')

# Query the document for anchors once and reuse the result.
tab = soup.find_all('a')

# Only every third anchor is kept, starting with the first one.
# NOTE(review): presumably each entry on the page is rendered as three links
# and the first of them is the value of interest -- confirm against the
# page markup.
stripped_texts = (link.get_text().strip() for link in tab[::3])

# "previous" is excluded only when it lands on one of the sampled positions.
liste = [text for text in stripped_texts if text != "previous"]

for j in liste:
    print(j)
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement