Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
"""Print the dates found in Bank of Russia coin press releases.

The script downloads the press RSS feed from cbr.ru, picks out every link
that ends in ``coin.htm`` / ``coins.htm``, downloads each linked page and
extracts the "<day> <month> <year>" triple that follows the words
"Банк России" and precedes the phrase "выпускает в обращение".

The result printed to stdout is a list with one entry per link; each entry
is a list of ``{"date": ..., 'month': ..., "year": ...}`` dicts (all values
are strings exactly as they appear in the page).
"""
import html
import re

rss_url = 'http://www.cbr.ru/rss/RssPress'

# Seconds to wait for the server before giving up; without a timeout a
# stalled connection would block the script forever.
REQUEST_TIMEOUT = 30

# The URL body is matched lazily and may not contain markup delimiters, so
# two links that sit next to each other without whitespace
# (``<link>..</link><guid>..</guid>``) are returned separately. The dot
# before ``htm`` is escaped so that it only matches a literal dot.
re_coin_link = re.compile(r'(https?://[^\s<>"\']+?coins?\.htm)')

# ``+`` quantifiers keep the groups from matching empty strings, and the lazy
# ``.*?`` stops at the nearest closing phrase, so a page that announces
# several issues yields one match per announcement.
re_date = re.compile(
    r'Банк России\s+(\d+)\s+([а-яА-Я]+)\s+(\d+).*?выпускает в обращение',
    re.DOTALL,
)

# Characters blanked out before matching: no-break space and the « » quotes.
_TO_SPACE = str.maketrans({'\u00a0': ' ', '\u00ab': ' ', '\u00bb': ' '})


def find_coin_links(rss_text):
    """Return every coin press-release URL found in *rss_text*, in order.

    Duplicates are kept: a URL that occurs twice in the feed is returned
    twice.
    """
    return re_coin_link.findall(rss_text)


def extract_issue_dates(page_html):
    """Return the issue dates announced in *page_html*.

    Each date is a dict with the string values captured from the page under
    the keys ``"date"``, ``'month'`` and ``"year"``. An empty list is
    returned when the page contains no matching announcement.
    """
    # NOTE(review): the pasted original replaced ' ', '«' and '»' with a
    # space; that pattern looks like an HTML-decoded '&nbsp;|&laquo;|&raquo;'.
    # Decoding entities first and then blanking the literal characters covers
    # both readings - confirm against the live page markup.
    text = html.unescape(page_html).translate(_TO_SPACE)
    return [
        {"date": day, 'month': month, "year": year}
        for day, month, year in re_date.findall(text)
    ]


def fetch_text(url):
    """Download *url* and return the response body as text."""
    # Imported here so the parsing helpers above stay usable without the
    # third-party HTTP dependency installed.
    import requests as req

    return req.get(url, timeout=REQUEST_TIMEOUT).text


def main():
    """Fetch the feed, parse every coin press release and print the dates."""
    press_release_urls = find_coin_links(fetch_text(rss_url))
    dates = [extract_issue_dates(fetch_text(url)) for url in press_release_urls]
    print(dates)


if __name__ == "__main__":
    main()
Add Comment
Please, Sign In to add comment