Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
- ----------------------
def get_ad_data(ad, ads_len, signal, status_bar_signal):
    """Collect one ad's seller name and description and write them via write_csv.

    Each field is fetched independently; when fetching a field raises, a
    placeholder is stored instead ('' for the description, 'namenone' for
    the seller name), so one failure does not prevent the row being written.

    Args:
        ad: The ad being processed. Not read directly in this function.
        ads_len: Forwarded to the helpers, which divide 100 by it to
            compute the progress step.
        signal: Forwarded to the helpers (they pass it to get_html_proxy).
        status_bar_signal: Forwarded to the helpers, which call ``.emit()``
            on it with the integer progress value.
    """
    # NOTE(review): `url` is not bound inside this function (the parameter is
    # `ad`); presumably it is a module-level global or was derived from `ad`
    # in code elided from this snippet -- confirm. If it is undefined, both
    # lookups raise NameError and the placeholders below are always used.
    # NOTE(review): each helper adds 100 / ads_len to the global progress
    # counter, so a single ad advances it twice -- confirm ads_len accounts
    # for that.
    try:
        full_descr = get_full_descr(url, ads_len, signal, status_bar_signal)
    except Exception:
        # Best-effort: keep going with an empty description. Catching
        # Exception (not a bare except) lets KeyboardInterrupt/SystemExit
        # still stop the run.
        full_descr = ''
    try:
        name_adv = get_name_adv(url, ads_len, signal, status_bar_signal)
    except Exception:
        name_adv = 'namenone'
    write_csv({
        'advname': name_adv,
        'description': full_descr,
    })
- -----------------------
def get_name_adv(url, ads_len, signal, status_bar_signal):
    """Return the concatenated link text found in the page's seller-name div.

    The page is first fetched with get_html and probed for the
    'item-view-header' div; if the fetch, the parse or the probe raises,
    the page is fetched again through get_html_proxy and that copy is used.

    Args:
        url: Address of the ad page.
        ads_len: Divisor for the progress step (100 / ads_len).
        signal: Passed through to get_html_proxy.
        status_bar_signal: Object whose ``.emit()`` receives the new integer
            progress value.

    Returns:
        The text of every ``<a>`` inside ``div.seller-info-name``, joined
        with no separator.

    Raises:
        Exception: Whatever the proxy fetch, the parse or the seller-name
            lookup raises (e.g. AttributeError when the div is missing) is
            propagated unchanged to the caller.
    """
    global percents
    try:
        try:
            soup = BeautifulSoup(get_html(url), 'lxml')
            # Probe only: raises AttributeError when the header div is absent.
            # Presumably this detects a blocked/placeholder page -- confirm.
            soup.find('div', class_='item-view-header').find_all('h1')
        except Exception:
            soup = BeautifulSoup(get_html_proxy(url, signal), 'lxml')
        links = soup.find('div', class_='seller-info-name').find_all('a')
        return ''.join(link.text for link in links)
    finally:
        # Advance the shared progress counter whether or not extraction
        # succeeded, so a failed ad still counts as processed and the real
        # error (not an unbound-variable error) reaches the caller.
        percents = percents + (100 / ads_len)
        status_bar_signal.emit(int(percents))
- -------------------------------
def get_full_descr(url, ads_len, signal, status_bar_signal):
    """Return the concatenated paragraph text of the page's description div.

    The page is first fetched with get_html and probed for the
    'item-view-header' div; if the fetch, the parse or the probe raises,
    the page is fetched again through get_html_proxy and that copy is used.

    Args:
        url: Address of the ad page.
        ads_len: Divisor for the progress step (100 / ads_len).
        signal: Passed through to get_html_proxy.
        status_bar_signal: Object whose ``.emit()`` receives the new integer
            progress value.

    Returns:
        The text of every ``<p>`` inside ``div.item-description-text``,
        joined with no separator.

    Raises:
        Exception: Whatever the proxy fetch, the parse or the description
            lookup raises (e.g. AttributeError when the div is missing) is
            propagated unchanged to the caller.
    """
    global percents
    try:
        try:
            soup = BeautifulSoup(get_html(url), 'lxml')
            # Probe only: raises AttributeError when the header div is absent.
            # Presumably this detects a blocked/placeholder page -- confirm.
            soup.find('div', class_='item-view-header').find_all('h1')
        except Exception:
            soup = BeautifulSoup(get_html_proxy(url, signal), 'lxml')
        paragraphs = soup.find('div', class_='item-description-text').find_all('p')
        return ''.join(paragraph.text for paragraph in paragraphs)
    finally:
        # Advance the shared progress counter whether or not extraction
        # succeeded, so a failed ad still counts as processed and the real
        # error (not an unbound-variable error) reaches the caller.
        percents = percents + (100 / ads_len)
        status_bar_signal.emit(int(percents))
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement