Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
- from lxml import html
- from lxml.cssselect import CSSSelector
- from lxml import etree
- import requests
- import string
- import os
- from selenium import webdriver
- from selenium.webdriver.chrome.options import Options
- import time
- from selenium.webdriver.common.keys import Keys
- from selenium.webdriver.common.action_chains import ActionChains
- import selenium.webdriver.support.ui as ui
- import random
- import statistics as stat
- import math
- import pprint
- import xlsxwriter
- from io import StringIO, BytesIO
- from bs4 import BeautifulSoup
- import re
# --- Browser setup -----------------------------------------------------------
# Start a Chrome session through a local chromedriver binary and open the
# KenPom home page, which is where the login form is located.
chrome_options = Options()
# Raw string: the original non-raw literal contained "\P", "\S" and "\c",
# which are invalid escape sequences (a SyntaxWarning on recent Python
# versions). The resulting path value is unchanged.
executable_path = r"C:\Python27\Scripts\chromedriver.exe"
os.environ["webdriver.chrome.driver"] = executable_path
driver = webdriver.Chrome(executable_path=executable_path, chrome_options=chrome_options)
driver.get('http://kenpom.com/')
# --- Login -------------------------------------------------------------------
# Fill in the three inputs of the element with id "login" (e-mail, password,
# submit button) and submit the form.
#
# SECURITY: the credentials below are hard-coded in source. Supply them via the
# KENPOM_USERNAME / KENPOM_PASSWORD environment variables instead; the literals
# are kept only as backward-compatible fallbacks and should be removed (and the
# password rotated) once the environment variables are in use.
kenpom_username = os.environ.get("KENPOM_USERNAME", "petergrimson@gmail.com")
kenpom_password = os.environ.get("KENPOM_PASSWORD", "Nalgene1")

username = driver.find_element_by_xpath('//*[@id="login"]/input[1]')
username.send_keys(kenpom_username)
password = driver.find_element_by_xpath('//*[@id="login"]/input[2]')
password.send_keys(kenpom_password)
login = driver.find_element_by_xpath('//*[@id="login"]/input[3]')
login.click()
# --- Scrape the FanMatch page --------------------------------------------------
# Load the FanMatch page for a fixed date, parse the rendered HTML and print the
# <td> cells of every <tr> found in the first <tbody> of the page.
try:
    driver.get('http://kenpom.com/fanmatch.php?d=2017-02-25')
    # Deliberately not named `html`: that name is already bound by
    # `from lxml import html` at the top of the file and must not be shadowed.
    page_source = driver.page_source
    soup = BeautifulSoup(page_source, 'lxml')
    table = soup.find('tbody')
    if table is None:
        # find() returns None when nothing matches; fail with a clear message
        # instead of an AttributeError on the next line.
        raise SystemExit(
            "No <tbody> found on the FanMatch page; the page layout may have "
            "changed or the login may not have succeeded."
        )
    rows = table.find_all('tr')
    for row in rows:
        columns = row.find_all('td')
        print(columns)
finally:
    # Always end the browser session so Chrome/chromedriver are not left running.
    driver.quit()

# Disabled experiment, kept for reference (was a bare triple-quoted string):
# collect the text of every row and keep only the rows containing 'OT)'.
#
# rowslist = []
# for rows in table.find_all('tr'):
#     rowslist.append(rows.text)
# for item in rowslist[:]:
#     if not 'OT)' in item:
#         rowslist.remove(item)
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement