Advertisement
Guest User

Untitled

a guest
Jun 16th, 2019
66
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 1.72 KB | None | 0 0
  1. import requests
  2. import json
  3. from bs4 import BeautifulSoup
  # Search-results page to scrape: dba.dk hardware/software listings.
  url = "https://www.dba.dk/computer-og-spillekonsoller/hardware-og-software/?soegfra=2400&radius=10"

  # Browser-like request headers sent with the search request.
  # NOTE(review): the Cookie value embeds session identifiers and a request
  # verification token that look copied from a live browser session; consider
  # loading them from configuration instead of committing them to source.
  # NOTE(review): "br" is advertised in Accept-Encoding; confirm the installed
  # HTTP stack can decode Brotli, otherwise the body may arrive undecoded.
  headers = {
      "Host": "www.dba.dk",
      "User-Agent": "Mozilla/5.0 (X11; Ubuntu; Linux x86_64; rv:67.0) Gecko/20100101 Firefox/67.0",
      "Accept": "text/html,application/xhtml+xml,application/xml;q=0.9,*/*;q=0.8",
      "Accept-Language": "en-US,en;q=0.5",
      "Accept-Encoding": "gzip, deflate, br",
      "Connection": "keep-alive",
      "Cookie": "dbatracker=id=931a28f6-7d9f-4efe-a7ce-232d8cb4592d; marketing-guide-persisted-values=%7B%7D; GdprNoticeCount=2; cto_lwid=04bc7fa3-add4-475c-9662-8e63c8b70927; _ga=GA1.2.1391023613.1560708499; _gid=GA1.2.1058433959.1560708499; __gads=ID=f31622ba6fe7d080:T=1560708501:S=ALNI_MbCU6FlDgYiRQKsWjHFAp4wrOa4-Q; ki_t=1560708504443%3B1560708504443%3B1560709090533%3B1%3B2; ki_r=; dbasession=id=fc1ca56d-a8e0-44ab-94c1-edb272ce82ae; __RequestVerificationToken=GqoEuoDmUCZZGjvbkH-jmzZHy6pQw-xkHtYgHzEtaL-gevCFJC0V0BeYjc378kmjGyFNSSTFUNsFX09vLeZxTKPNNWVCEbh_zFEYWFZXK09uEawUtGEq5XMuU_ViqRNaXD78ig2; _gat=1",
      "Cache-Control": "max-age=0",
  }

  # Seconds to wait for the server; without an explicit timeout the request
  # could block forever on an unresponsive host.
  REQUEST_TIMEOUT = 30


  def extract_listing_url(raw_json):
      """Return the ``url`` field of a JSON-LD payload, or ``None``.

      Args:
          raw_json: Text content of an ``application/ld+json`` script tag.

      Returns:
          The value stored under the top-level ``"url"`` key, or ``None`` when
          the text is not valid JSON, is not a JSON object, or has no ``"url"``.
      """
      try:
          payload = json.loads(raw_json)
      except (TypeError, ValueError):
          # json.JSONDecodeError is a ValueError; TypeError covers non-text input.
          return None
      if not isinstance(payload, dict):
          return None
      return payload.get("url")


  def iter_listing_urls(soup):
      """Yield the listing URL of every ``tr.dbaListing`` row in *soup*.

      Rows without a JSON-LD script tag, or whose payload carries no usable
      URL, are skipped instead of aborting the whole run.
      """
      for row in soup.find_all("tr", "dbaListing"):
          script_tag = row.find("script", {"type": "application/ld+json"})
          if script_tag is None:
              # find() returns None when the row has no embedded JSON-LD.
              continue
          listing_url = extract_listing_url(script_tag.text)
          if listing_url is not None:
              yield listing_url


  def main():
      """Fetch the search page, print its HTTP status and each listing URL."""
      response = requests.get(url, headers=headers, timeout=REQUEST_TIMEOUT)
      print(response.status_code)

      soup = BeautifulSoup(response.content, "lxml")
      for listing_url in iter_listing_urls(soup):
          print(listing_url)
          # TODO: fetch the product page for each listing; note that
          # ``response.content`` is an attribute, not a method.
          # TODO: print price and currency once the payload keys are confirmed.


  if __name__ == "__main__":
      main()
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement