Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
# Scrape image URLs from a Pixabay search results page.
#
# The script opens one HTTP session, requests the site home page and then the
# search page, and collects the URL of every <img> found inside the
# ".search_results" container. Each URL is printed as it is found, followed
# by the total count.
import requests
from bs4 import BeautifulSoup

url = 'https://pixabay.com/'
target_url = 'https://pixabay.com/images/search/office/'

headers = {
    'User-Agent': 'Mozilla/5.0 (Windows NT 6.1) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/85.0.4183.83 Safari/537.36',
    "Accept-Language": "en-US;q=0.7,en;q=0.3",
    "Cache-Control": "no-cache",
}

# Seconds to wait for the server before giving up. requests has no default
# timeout, so without this a stalled connection would block forever.
REQUEST_TIMEOUT = 10

results = []

with requests.Session() as s:
    s.headers.update(headers)

    # The home page is requested first through the same session
    # (presumably to pick up cookies before the search request -- confirm).
    r = s.get(url, timeout=REQUEST_TIMEOUT)
    print(r.status_code)

    r = s.get(target_url, timeout=REQUEST_TIMEOUT)
    print(r.status_code)
    # Fail loudly on a 4xx/5xx answer instead of parsing an error page and
    # reporting a misleading "len: 0".
    r.raise_for_status()

    soup = BeautifulSoup(r.text, "lxml")
    for item in soup.select(".search_results a > img[src]"):
        src = item.get("src")
        if src is not None and 'blank.gif' not in src:
            print('src:', src)
            results.append(src)
            continue

        # "src" points at the blank.gif placeholder; fall back to the
        # "data-lazy" attribute, which is where the original script looked
        # for the URL in that case.
        src = item.get("data-lazy")
        if src is None:
            # No usable URL on this tag; skip it rather than store None.
            continue
        print('data-lazy:', src)
        results.append(src)

print('len:', len(results))
Add Comment
Please, Sign In to add comment