Advertisement
Guest User

Untitled

a guest
Mar 18th, 2019
75
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
Python 2.15 KB | None | 0 0
  1. from urllib.request import urlopen as uReq
  2. from bs4 import BeautifulSoup as soup
  3. # import csv
  4.  
  5. # csv_file = open('travelplanet_scrape.csv', 'w', newline = '')
  6. # csv_writer = csv.writer(csv_file, dialect='excel')
  7. # csv_writer.writerow(['nazwa', 'procenty', 'cena', 'ocena', 'gwiazdek', 'kraj', 'region', 'url_oferta'])
  8.  
  9.  
  10. for i in range(1, 3):
  11.     print("strona: " + str(i))
  12.    
  13.     my_url = 'https://www.travelplanet.pl/wczasy/oferty/' + str(i) + '/?wylot=17.03.2019&przylot=07.04.2019&osoby=2&czas=0:100&wyzywienie=1&ocena=3&dojazd=F&sortowanie=1&kolejnosc=up&limit=25'
  14.    
  15.  
  16.  
  17.     uClient = uReq(my_url)
  18.  
  19.     page_html = uClient.read()
  20.     uClient.close()
  21.  
  22.     page_soup = soup(page_html, "html.parser")
  23.  
  24.     oferty = page_soup.findAll("section", {"class": "offer-item offer-item-with-slider"})
  25.     oferta = oferty[0]
  26.  
  27.     for oferta in oferty:
  28.  
  29.         nazwa = oferta.find("a", {"class": "oi-h-link"})['title']
  30.         cena = oferta.find("span", {"class":"pb-hp-onepreson"}).text
  31.         oferta_procenty = oferta.find("span", {"class": "oi-ff-pd-discount-precentage-label"})
  32.  
  33.         if oferta_procenty != None:
  34.             procenty = oferta.find("span", {"class": "oi-ff-pd-discount-precentage-label"}).text
  35.  
  36.                 # if procenty != None:
  37.                 #    pass
  38.                 #     cena = oferta.find("span", {"class":"pb-hp-onepreson"}).text
  39.                    
  40.                 #     url_oferta1 = oferta.find("a", {"class": "imgCont wt"})['href']
  41.                 #     url_oferta = f'https://www.wakacje.pl{url_oferta1}'
  42.  
  43.                 #     kraj1 = oferta.find("span", {"class": "country"}).text
  44.                 #     kraj = kraj1.split('/')[0]
  45.                 #     region = kraj1.split('/')[1]
  46.  
  47.                 #     ocena = oferta.find("b", {"class": "rating"}).text
  48.                 #     gwiazdek = oferta.find("span", {"class": "sprite hotelCategory-s"})['data-stars']
  49.  
  50.                 #     csv_writer.writerow([nazwa, procenty, cena, ocena, gwiazdek, kraj, region, url_oferta])
  51.  
  52.  
  53.             print("nazwa: " + nazwa)
  54.             print("procenty: " + procenty)
  55.             print("cena: " + cena)
  56.  
  57. # csv_file.close()
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement