Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
import csv

import cssselect
import lxml.html
import requests

# Scrape Wikipedia's list of AZA member zoos and aquaria.
#
# Produces two index-aligned module-level lists:
#   c    -- stripped text content of each selected table row
#   urls -- href of one anchor per row, or None when the row has too few links

PAGE_URL = 'http://en.wikipedia.org/wiki/List_of_AZA_member_zoos_and_aquaria'

# Zero-based position, among all <a> elements in a row, of the link to keep.
LINK_INDEX = 3

# A timeout keeps the script from hanging forever on a stalled connection;
# raise_for_status() stops us from parsing an HTTP error page as the article.
req = requests.get(PAGE_URL, timeout=30)
req.raise_for_status()
root = lxml.html.fromstring(req.text)

# Every <tr> inside a <table> that is the first <table> among its siblings.
b = root.cssselect('table:first-of-type tr')

c = []
urls = []
# b[1:] skips the first matched row (presumably the header row -- confirm
# against the live page markup).
for row in b[1:]:
    # Text of the whole row, all cells concatenated.
    # NOTE(review): if only the first cell (e.g. the zoo name) is wanted,
    # select it with row.cssselect('td') and read that cell instead.
    c.append(row.text_content().strip())

    links = row.cssselect('a')
    if len(links) > LINK_INDEX:
        urls.append(links[LINK_INDEX].get('href'))
    else:
        # Rows with fewer links would otherwise raise IndexError and abort
        # the scrape; record None so c and urls stay the same length.
        urls.append(None)
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement