Advertisement
Guest User

Untitled

a guest
Jul 24th, 2017
48
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 0.74 KB | None | 0 0
  1. from urllib.request import urlopen as uReq
  2. from bs4 import BeautifulSoup as soup
  3. import csv
  4. my_url = 'http://www.igobychad.com/test_table.html'
  5. uClient = uReq(my_url)
  6. page_html = uClient.read()
  7. uClient.close()
  8. page_soup = soup(page_html, "html.parser")
  9. page_soup.find("table", { "id" : "Emp_sum" })
  10. table = page_soup.find("table", { "id" : "Emp_sum" })
  11. for row in table.findAll("tr"):
  12.    cells = row.findAll("td")
  13. headers = [header.text for header in table.find_all('th')]
  14. rows = []
  15. for row in table.find_all('tr'):
  16.     rows.append([val.text.encode('utf8') for val in row.find_all('td')])
  17. with open('test1.csv', 'w') as f:
  18.        writer = csv.writer(f)
  19.        writer.writerow(headers)
  20.        writer.writerows(row for row in rows if row)
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement