Guest User

FF Scraper

a guest
Aug 31st, 2017
38
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
Python 1.02 KB | None | 0 0
  1. import requests
  2. from bs4 import BeautifulSoup
  3. import pandas as pd
  4. import os
  5.  
  6. offpos = ['WR', 'QB', 'RB', 'TE']
  7. columns = ['PLAYER', 'TEAM', 'PLAYS', 'POINTS', 'GAMES_PLAYED', 'POINTS_PER_GAME', 'RUN', 'RUSH_YARDS', 'RUSING_TD', 'PASS', 'COMPLETIONS', 'PASS_YDS', 'PASS_TD', 'FUM', 'INT']
  8. sfmat = {'standard' : '5', 'ppr' : '2'}
  9.  
  10. def offassemble(year):
  11.     if not os.path.exists(year):
  12.         os.makedirs(year)
  13.        
  14.        
  15.     for fmat in sfmat.items():
  16.         for pos in offpos:
  17.             url = 'http://www.thehuddle.com/stats/' + year + '/plays_std.php?ccs=' + fmat[1] + '&pos=' + pos
  18.             df=pd.read_html(url, flavor=['bs4'])
  19.             df=df[0]
  20.             del df['CMP']
  21.             del df['PYDS']
  22.             del df['PTD']
  23.             del df['FUM']
  24.             del df['INT']
  25.             df.columns = columns
  26.             df.to_pickle(year + '/' + fmat[0] + '_' + pos + '.pkl')
  27.  
  28. def main():
  29.     year = input('Year?')
  30.     offassemble(year)
  31.    
  32.        
  33.  
  34.  
  35. if __name__ == '__main__':
  36.     main()
Add Comment
Please, Sign In to add comment