Advertisement
Guest User

Untitled

a guest
Oct 13th, 2016
144
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 1.50 KB | None | 0 0
import http.cookiejar
import itertools
import urllib

import requests
from bs4 import BeautifulSoup
  3.  
  4. url = "https://www.cgpbooks.co.uk/bookspace/BRAR72DF/assets/mobile/pages/page{}{}_i2.png"
  5. filename = "C:\\twmp\\CGP 1 pg{}.png"
  6.  
  7. username = 'redacted' #you'll have to find your own login
  8. password = 'redacted'
  9. token = ""
  10.  
  11. with requests.Session() as s:
  12. r = s.get('https://account.cgpbooks.co.uk/Account/SignIn')
  13. soup = BeautifulSoup(r.text, "html.parser")
  14.  
  15. for i in soup.findAll(attrs={"name":"__RequestVerificationToken"}):
  16. if i['name'] == '__RequestVerificationToken':
  17. print(i)
  18. token = i.get('value')
  19. print(i.get('value'))
  20. signinurl = "https://account.cgpbooks.co.uk/Account/SignIn?stsctxret=%2FIssue%3Fwa%3Dwsignin1.0%26wtrealm%3Durn%253Acgpbooks%253Aportal%26wctx%3Drm%253D0%2526id%253Dpassive%2526ru%253D%25252f%26wct%3D2016-10-08T17%253A08%253A47Z&stsctxrealm=urn%3Acgpbooks%3Aportal&stsctxid=passive"
  21.  
  22. payload = {
  23. '__RequestVerificationToken': token,
  24. 'UserName': username,
  25. 'Password': password,
  26. 'Remember': 'false'
  27. }
  28.  
  29.  
  30. p = s.post(signinurl, data=payload)
  31.  
  32. #uthorised request.
  33. r = s.get('https://www.cgpbooks.co.uk/pages/bookspace.asp')
  34. print(r.text)
  35.  
  36.  
  37. #print('cookies', requests.utils.dict_from_cookiejar(s.cookies))
  38.  
  39. i = 1
  40. while True:
  41. urllib.request.urlretrieve(url.format("0"*(-len(str(i))+4),i), filename.format(i))
  42. print("Saved page {}".format(i))
  43. i += 1
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement