Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
"""Scrape the ``Emp_sum`` HTML table from a web page and save it as a CSV file.

The script downloads the page at ``my_url``, locates the table whose ``id``
attribute is ``Emp_sum``, and writes its header cells (``<th>``) followed by
every data row (``<tr>`` containing ``<td>`` cells) to ``test1.csv``.
"""
import csv
from urllib.request import urlopen as uReq

from bs4 import BeautifulSoup as soup

my_url = 'http://www.igobychad.com/test_table.html'

# Fetch the raw HTML. The context manager closes the connection even when
# read() raises, which the previous explicit close() call did not guarantee.
with uReq(my_url) as uClient:
    page_html = uClient.read()

page_soup = soup(page_html, "html.parser")

table = page_soup.find("table", {"id": "Emp_sum"})
if table is None:
    # Fail with a readable message instead of an AttributeError on None below.
    raise ValueError('No <table id="Emp_sum"> found at ' + my_url)

headers = [header.text for header in table.find_all('th')]

# Collect the text of each data row. Rows without <td> cells (for example the
# header row, which only holds <th> cells) are skipped so that no blank lines
# end up in the CSV.
# Cell text is kept as str: encoding it to bytes here would make csv.writer
# emit the bytes repr (b'...') under Python 3.
rows = []
for row in table.find_all('tr'):
    cells = [val.text for val in row.find_all('td')]
    if cells:
        rows.append(cells)

# newline='' lets the csv module control line endings (otherwise extra blank
# lines appear on Windows); the encoding is applied once, at the file boundary.
with open('test1.csv', 'w', newline='', encoding='utf-8') as f:
    writer = csv.writer(f)
    writer.writerow(headers)
    writer.writerows(rows)
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement