Advertisement
Not a member of Pastebin yet? Sign up — it unlocks many cool features!
- import requests
- from lxml import html
- from bs4 import BeautifulSoup
# Account and endpoints used by the scraper.
# NOTE(review): PASSWORD looks like a redacted placeholder; supply the real
# value out-of-band rather than committing it to source control.
USERNAME = "lmcrory"
PASSWORD = "xxxxx"
LOGIN_URL = "http://share.baner.com/share/page?pt=login"
# The dashboard path embeds the account name, so derive it from USERNAME
# instead of repeating the literal.
URL = "http://share.baner.com/share/page/user/" + USERNAME + "/dashboard"
def listLinks():
    """Log in to the share site and print what is found on the dashboard.

    Fetches ``LOGIN_URL``, posts ``USERNAME``/``PASSWORD`` to it, then fetches
    ``URL`` with the same session. Printed to standard output, in order:

    1. the parsed login-page root element,
    2. the raw bytes of the dashboard response,
    3. the ``href`` of every ``<a>`` element on the dashboard,
    4. the text of the anchors directly inside ``div.repo-list--repo``.

    Returns:
        None.
    """
    # The context manager closes the session's connections when we are done.
    with requests.Session() as session:
        # Get the login page so a CSRF token can be read from its form.
        login_page = session.get(LOGIN_URL)
        login_tree = html.fromstring(login_page.text)
        print(login_tree)

        payload = {
            "username": USERNAME,
            "password": PASSWORD,
        }
        # Send the CSRF token only when the form actually carries one;
        # indexing an empty XPath result would raise IndexError.
        csrf_tokens = login_tree.xpath(
            "//input[@name='csrfmiddlewaretoken']/@value"
        )
        if csrf_tokens:
            payload["csrfmiddlewaretoken"] = csrf_tokens[0]

        # Perform login.
        session.post(LOGIN_URL, data=payload, headers={"referer": LOGIN_URL})

        # Scrape the dashboard using the same session.
        dashboard = session.get(URL, headers={"referer": URL})

    print(dashboard.content)

    # ``Response.text`` is a property, not a method; calling it raises
    # TypeError. Name the parser explicitly so bs4 neither warns nor varies
    # its output with whichever parsers happen to be installed.
    soup = BeautifulSoup(dashboard.text, "lxml")
    for anchor in soup.find_all("a"):
        print(anchor.get("href"))

    dashboard_tree = html.fromstring(dashboard.content)
    bucket_names = dashboard_tree.xpath(
        "//div[@class='repo-list--repo']/a/text()"
    )
    print(bucket_names)
# Run the scraper. This must be a plain call: a leading "-" would negate the
# function's None return value and raise TypeError.
listLinks()
Advertisement
Add Comment
Please sign in to add a comment.
Advertisement