Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
- import urllib, http.cookiejar, requests
- from bs4 import BeautifulSoup
# Download every page image of one CGP online book to local PNG files.
#
# Flow: sign in to the CGP account site with a requests session, then fetch
# sequentially numbered page images through that same session until the
# server reports a missing page.

# Page-image URL template: the first placeholder takes the zero padding,
# the second takes the page number.
url = "https://www.cgpbooks.co.uk/bookspace/BRAR72DF/assets/mobile/pages/page{}{}_i2.png"
# Output path template: the placeholder takes the page number.
filename = "C:\\twmp\\CGP 1 pg{}.png"
username = 'redacted'  # you'll have to find your own login
password = 'redacted'

# Page that serves the sign-in form (and its anti-forgery token).
sign_in_page = 'https://account.cgpbooks.co.uk/Account/SignIn'
# Endpoint the sign-in form is posted to.
signinurl = "https://account.cgpbooks.co.uk/Account/SignIn?stsctxret=%2FIssue%3Fwa%3Dwsignin1.0%26wtrealm%3Durn%253Acgpbooks%253Aportal%26wctx%3Drm%253D0%2526id%253Dpassive%2526ru%253D%25252f%26wct%3D2016-10-08T17%253A08%253A47Z&stsctxrealm=urn%3Acgpbooks%3Aportal&stsctxid=passive"
# Page requested after signing in so the result of the login can be inspected.
bookspace_page = 'https://www.cgpbooks.co.uk/pages/bookspace.asp'


def page_url(page):
    """Return the image URL for page number ``page``.

    The number is left-padded with zeros to four digits (1 -> "0001");
    numbers that already have four or more digits are used unchanged.
    """
    digits = str(page)
    # A negative repeat count yields "", so long numbers get no padding.
    return url.format("0" * (4 - len(digits)), digits)


def fetch_verification_token(session):
    """Return the ``__RequestVerificationToken`` value from the sign-in page.

    Each matching form field and its value are printed as they are found.

    Raises:
        RuntimeError: if the page has no such field or its value is empty.
    """
    response = session.get(sign_in_page)
    soup = BeautifulSoup(response.text, "html.parser")
    token = ""
    # If several matching fields exist, the last one wins.
    for field in soup.find_all(attrs={"name": "__RequestVerificationToken"}):
        print(field)
        token = field.get('value')
        print(token)
    if not token:
        # Posting an empty token cannot produce a valid sign-in; fail loudly.
        raise RuntimeError(
            "__RequestVerificationToken not found on the sign-in page"
        )
    return token


def sign_in(session):
    """Post the credentials and verification token using ``session``.

    Afterwards the bookspace page is fetched and printed; this function does
    not itself verify that the login was accepted.
    """
    payload = {
        '__RequestVerificationToken': fetch_verification_token(session),
        'UserName': username,
        'Password': password,
        'Remember': 'false',
    }
    session.post(signinurl, data=payload)
    # Authorised request.
    response = session.get(bookspace_page)
    print(response.text)
    # print('cookies', requests.utils.dict_from_cookiejar(session.cookies))


def download_page(session, page):
    """Save the image for ``page`` to disk via ``session``.

    Returns:
        True if the image was written, False if the server answered 404.

    Raises:
        requests.HTTPError: for any error status other than 404.
    """
    # Use the session (not a bare urllib call) so any cookies obtained while
    # signing in accompany the image request.
    response = session.get(page_url(page), stream=True)
    try:
        if response.status_code == 404:
            return False
        response.raise_for_status()
        with open(filename.format(page), "wb") as out:
            for chunk in response.iter_content(chunk_size=65536):
                out.write(chunk)
    finally:
        response.close()
    return True


def main():
    """Sign in, then download pages 1, 2, 3, ... until one is missing."""
    with requests.Session() as session:
        sign_in(session)
        page = 1
        # Presumably the first 404 marks the end of the book - stop there
        # instead of crashing with an unhandled HTTP error.
        while download_page(session, page):
            print("Saved page {}".format(page))
            page += 1


if __name__ == "__main__":
    main()
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement