Advertisement
Guest User

main.py

a guest
Jan 7th, 2022
251
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
Python 1.45 KB | None | 0 0
  1. import requests
  2. from bs4 import BeautifulSoup
  3. from datetime import datetime, timedelta
  4.  
  5. xtime = datetime.now()
  6. ytime = xtime - timedelta(hours=0, minutes=43)
  7. today = 'Сегодня'
  8. URL = 'https://www.olx.ua/nedvizhimost/kvartiry/prodazha-kvartir/1-komnata/kiev/?search%5Bfilter_enum_commission%5D' \
  9.       '%5B0%5D=1&search%5Bfilter_float_total_area%3Ato%5D=60&search%5Bprivate_business%5D=private '
  10. HEADERS = {'user-agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:71.0) Gecko/20100101 Firefox/71.0',
  11.            'accept': '*/*'}
  12.  
  13. HOST = 'http://www.olx.ua'
  14.  
  15.  
  16. def get_html(url, params=None):
  17.     req = requests.get(url, headers=HEADERS, params=params)
  18.     return req
  19.  
  20.  
  21. def get_content(html):
  22.     soup = BeautifulSoup(html, 'html.parser')
  23.     table = soup.find('table', {'id': 'offers_table'})
  24.     items = table.find_all('tr', class_='wrap')
  25.     houses = []
  26.     for item in items:
  27.             houses.append({'Название': item.find('strong').text,
  28.                            'Ссылка': item.find('a').get('href'),
  29.                            'Цена': item.find('p', {'class': 'price'}).text,
  30.                            'Время Публикации': item.find('i', {'data-icon': 'clock'}).parent.text
  31.                            })
  32.     return houses
  33.  
  34.  
  35. def parse():
  36.     html = get_html(URL)
  37.     if html.status_code == 200:
  38.         test = get_content(html.text)
  39.         return test
  40.     else:
  41.         print('Error')
  42.  
  43.  
  44. parse()
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement