Advertisement
Guest User

Untitled

a guest
May 22nd, 2017
51
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
Python 0.91 KB | None | 0 0
  1. import getpass
  2. import urllib
  3. import urllib.request
  4. from urllib.request import Request, urlopen
  5. import string
  6. from bs4 import BeautifulSoup
  7.  
  8. #html = urllib.request.urlopen("http://directory.io/10", headers={'User-Agent': 'Mozilla/5.0'})
  9. #print(html.read())
  10.  
  11. req = Request('http://directory.io/', headers={'User-Agent': 'Mozilla/5.0'})
  12. webpage = urlopen(req).read()
  13. webpage.decode().split('https://blockchain.info/address/', 34)
  14. #print(webpage)
  15.  
  16. soup = BeautifulSoup(webpage, 'html.parser')
  17. #print(soup.prettify())
  18.  
  19. tab = soup.find_all('a')
  20. liste = []
  21. count = 0
  22.  
  23. for i in tab:
  24.     if ((count % 3 == 0) and (soup.find_all('a')[count].get_text()).strip() != "previous"):
  25.         liste.append((soup.find_all('a')[count].get_text()).strip())
  26.         #print(soup.find_all('a')[count].get_text())
  27.     count = count+1
  28.  
  29. for j in liste:
  30.     print(j)
  31. #print(soup.find_all('a')[3].get_text())
  32. #print(soup.find_all('a')[6].get_text())
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement