Advertisement
Not a member of Pastebin yet?
Sign up;
it unlocks many cool features!
import json
import sys

import requests
from bs4 import BeautifulSoup
# Search-results page to scrape. The query string carries soegfra=2400 and
# radius=10 (presumably a postal code and a search radius -- TODO confirm).
url = "https://www.dba.dk/computer-og-spillekonsoller/hardware-og-software/?soegfra=2400&radius=10"

# Request headers copied from a desktop Firefox session so the request looks
# like an ordinary browser page load.
headers = {
    "Host": "www.dba.dk",
    "User-Agent": "Mozilla/5.0 (X11; Ubuntu; Linux x86_64; rv:67.0) Gecko/20100101 Firefox/67.0",
    "Accept": "text/html,application/xhtml+xml,application/xml;q=0.9,*/*;q=0.8",
    "Accept-Language": "en-US,en;q=0.5",
    # "br" is deliberately not advertised: requests/urllib3 only decode Brotli
    # when an optional Brotli package is installed. Without it the response
    # body would reach the HTML parser still compressed.
    "Accept-Encoding": "gzip, deflate",
    "Connection": "keep-alive",
    # NOTE(review): hard-coded session cookie and request-verification token
    # captured from a browser. They will expire and should not live in source
    # control; consider a requests.Session or loading them from the environment.
    "Cookie": "dbatracker=id=931a28f6-7d9f-4efe-a7ce-232d8cb4592d; marketing-guide-persisted-values=%7B%7D; GdprNoticeCount=2; cto_lwid=04bc7fa3-add4-475c-9662-8e63c8b70927; _ga=GA1.2.1391023613.1560708499; _gid=GA1.2.1058433959.1560708499; __gads=ID=f31622ba6fe7d080:T=1560708501:S=ALNI_MbCU6FlDgYiRQKsWjHFAp4wrOa4-Q; ki_t=1560708504443%3B1560708504443%3B1560709090533%3B1%3B2; ki_r=; dbasession=id=fc1ca56d-a8e0-44ab-94c1-edb272ce82ae; __RequestVerificationToken=GqoEuoDmUCZZGjvbkH-jmzZHy6pQw-xkHtYgHzEtaL-gevCFJC0V0BeYjc378kmjGyFNSSTFUNsFX09vLeZxTKPNNWVCEbh_zFEYWFZXK09uEawUtGEq5XMuU_ViqRNaXD78ig2; _gat=1",
    "Cache-Control": "max-age=0",
}
# Fetch the search-results page. An explicit timeout is required because
# requests waits indefinitely by default when the server stalls.
result = requests.get(url, headers=headers, timeout=30)
print(result.status_code)
# Fail loudly on 4xx/5xx instead of parsing an error page and silently
# reporting zero listings.
result.raise_for_status()

soup = BeautifulSoup(result.content, "lxml")

# Each result row is a <tr class="dbaListing"> that is expected to embed a
# JSON-LD <script> describing the listing; print the "url" field of each.
for listing in soup.find_all("tr", "dbaListing"):
    script = listing.find("script", {"type": "application/ld+json"})
    if script is None:
        # Row without embedded JSON-LD metadata: nothing to extract.
        continue
    try:
        content = json.loads(script.text)
        listingurl = content["url"]
    except (ValueError, KeyError, TypeError) as exc:
        # ValueError: malformed JSON; KeyError: no "url" field;
        # TypeError: the JSON payload is not an object. Skip this row but
        # report it on stderr so stdout carries only the URLs.
        print("skipping listing:", repr(exc), file=sys.stderr)
        continue
    print(listingurl)
    # TODO: fetch each listing page (listingurl) and print its price and
    # currency once the product-page parsing is implemented.
Advertisement
Add Comment
Please sign in to add a comment
Advertisement