Advertisement
Guest User

Untitled

a guest
Aug 24th, 2019
80
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
Python 1.07 KB | None | 0 0
  """Scrape the Kattis problem list into ``bob.txt`` as CSV.

  Pages are requested from ``https://open.kattis.com/problems?page=N``
  starting at N = 0 until a page yields no table rows.  For every ``<tr>``
  in the first table's ``<tbody>``, the text of the first nine ``<td>``
  cells is appended to the output file, followed by a status column taken
  from the row's second CSS class (``'unsolved'`` when the row has fewer
  than two classes).
  """
  import csv
  import os

  from bs4 import BeautifulSoup
  import requests

  OUTPUT_PATH = 'bob.txt'
  BASE_URL = "https://open.kattis.com/problems?page="
  COLUMN_COUNT = 9        # number of leading <td> cells copied from each row
  REQUEST_TIMEOUT = 30    # seconds; without a timeout requests can block forever

  # NOTE(security): this is a logged-in session cookie committed to source.
  # Anyone who can read this file can reuse the session.  Prefer supplying the
  # cookie through the KATTIS_COOKIE environment variable and rotating this
  # value; the literal is kept only so existing runs behave as before.
  DEFAULT_COOKIE = "intercom-id-ynnn5d6q=19c62e81-30f6-4610-8919-1401a97b54f9; __cfduid=dc642a4610cc9527d0c9d234d04cb34751545244738; _ga=GA1.2.1288742159.1553910371; site24x7rumID=3269752668489886.1566647311221; __zlcmid=sTiGOr2yM1lpij; site24x7RUMSnapshotId=1558962251056.false; EduSiteCookie=bf6c659f-af11-4ec4-8fc0-ac377d8e4abb"
  HEADERS = {"Cookie": os.environ.get("KATTIS_COOKIE", DEFAULT_COOKIE)}


  def _fetch_rows(page):
      """Return the ``<tr>`` elements of the problem table on *page*.

      Returns an empty list when the page has no ``<table>``/``<tbody>``.

      Raises:
          requests.HTTPError: the server answered with a 4xx/5xx status.
          requests.RequestException: connection failure or timeout.
      """
      response = requests.get(
          BASE_URL + str(page), headers=HEADERS, timeout=REQUEST_TIMEOUT
      )
      # Fail loudly on an error page instead of mistaking it for "no more rows".
      response.raise_for_status()
      soup = BeautifulSoup(response.text, 'html.parser')
      table = soup.find('table')
      body = table.find('tbody') if table is not None else None
      return body.find_all('tr') if body is not None else []


  def _row_fields(row):
      """Return the CSV fields for one table row.

      The result holds the raw text of up to ``COLUMN_COUNT`` leading cells
      (fewer if the row is short) plus the status column.
      """
      cells = row.find_all('td')
      # Tag.get('class') is None when the row has no class attribute at all.
      classes = row.get('class') or []
      status = str(classes[1]) if len(classes) > 1 else 'unsolved'
      return [cell.text for cell in cells[:COLUMN_COUNT]] + [status]


  def main():
      """Walk the problem pages in order and append every row to the output file."""
      # newline='' lets the csv module control line endings; the context
      # manager closes the file even if a request or parse step raises.
      with open(OUTPUT_PATH, 'a', encoding='utf-8', newline='') as output:
          # csv.writer quotes cells containing commas, quotes or newlines, which
          # a plain ','.join would silently turn into extra columns or rows.
          writer = csv.writer(output, lineterminator='\n')
          print("Reading page: ", flush=True, end='')
          page = 0
          while True:
              rows = _fetch_rows(page)
              print(f"{page}..", flush=True, end='')
              if not rows:
                  # An empty page marks the end of the problem list.
                  break
              writer.writerows(_row_fields(row) for row in rows)
              page += 1
      print('done')


  if __name__ == "__main__":
      main()
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement