Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
- import requests
- from bs4 import BeautifulSoup
- from datetime import datetime, timedelta
# Reference timestamps: the moment the module is loaded and a point 43 minutes
# earlier. Neither is read by the functions visible in this file.
# NOTE(review): presumably intended for filtering listings by publication
# time -- confirm against the rest of the project.
xtime = datetime.now()
ytime = xtime - timedelta(minutes=43)

# Russian word for "Today". Not read by the functions visible in this file.
today = 'Сегодня'

# Search-results page to scrape. The query string carries three URL-encoded
# filters: search[filter_enum_commission][0]=1,
# search[filter_float_total_area:to]=60 and search[private_business]=private.
# The literal must not end in whitespace: a trailing space would be sent as
# part of the last filter value.
URL = (
    'https://www.olx.ua/nedvizhimost/kvartiry/prodazha-kvartir/1-komnata/kiev/'
    '?search%5Bfilter_enum_commission%5D%5B0%5D=1'
    '&search%5Bfilter_float_total_area%3Ato%5D=60'
    '&search%5Bprivate_business%5D=private'
)

# Request headers sent with every page fetch (browser-like user agent).
HEADERS = {
    'user-agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:71.0) Gecko/20100101 Firefox/71.0',
    'accept': '*/*',
}

# Site root. Not read by the functions visible in this file.
# NOTE(review): uses http while URL uses https -- confirm which is intended.
HOST = 'http://www.olx.ua'
def get_html(url, params=None, timeout=10):
    """Send a GET request to *url* and return the response object.

    Args:
        url: Address to fetch.
        params: Optional query parameters forwarded to ``requests.get``.
        timeout: Seconds to wait for the server before giving up. Pass
            ``None`` to wait indefinitely (the previous behaviour).

    Returns:
        The ``requests`` response object (not the page text); callers read
        ``status_code`` and ``text`` from it.

    Raises:
        requests.exceptions.Timeout: If the server does not answer within
            *timeout* seconds.
    """
    # requests applies no timeout by default, so without one a stalled
    # connection would block the script forever.
    return requests.get(url, headers=HEADERS, params=params, timeout=timeout)
def get_content(html):
    """Extract listing rows from the HTML of a search-results page.

    Looks for ``<table id="offers_table">`` and reads every ``<tr>`` with
    class ``wrap`` inside it.

    Args:
        html: Page markup as a string.

    Returns:
        A list with one dict per row, keyed by 'Название' (text of the first
        ``<strong>``), 'Ссылка' (``href`` of the first ``<a>``), 'Цена' (text
        of ``<p class="price">``) and 'Время Публикации' (text of the parent
        of ``<i data-icon="clock">``). A field whose element is missing from
        the row is ``None``. Returns an empty list when the page has no
        offers table.
    """
    soup = BeautifulSoup(html, 'html.parser')
    table = soup.find('table', {'id': 'offers_table'})
    if table is None:
        # find() returns None when nothing matches; without this guard the
        # find_all() call below would raise AttributeError.
        return []

    houses = []
    for item in table.find_all('tr', class_='wrap'):
        title = item.find('strong')
        link = item.find('a')
        price = item.find('p', {'class': 'price'})
        clock = item.find('i', {'data-icon': 'clock'})
        # Each lookup may come back as None for a row that lacks the element,
        # so fall back to None instead of crashing on the whole page.
        houses.append({
            'Название': title.text if title is not None else None,
            'Ссылка': link.get('href') if link is not None else None,
            'Цена': price.text if price is not None else None,
            'Время Публикации': clock.parent.text if clock is not None else None,
        })
    return houses
def parse():
    """Fetch the page at ``URL`` and return the listings parsed from it.

    Returns:
        Whatever ``get_content`` returns for the response text when the
        response status code is 200. For any other status, prints ``Error``
        and returns ``None``.
    """
    response = get_html(URL)
    if response.status_code != 200:
        print('Error')
        return None
    return get_content(response.text)
# Run the scraper once when this module is executed or imported. The value
# returned by parse() is not used here.
parse()
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement