Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
def parse_article(self, response):
    """Build a ``ScrapyArticlesItem`` from an article page response.

    The ``name`` field is taken from the text node of the title ``span``
    inside ``h1.post__title``; the ``article`` field is taken from the
    post-text ``div`` with any markup stripped out.

    Args:
        response: Object exposing ``css(query)`` whose result supports
            ``extract_first()`` (presumably a Scrapy response -- confirm
            against the spider that registers this callback).

    Yields:
        A single ``ScrapyArticlesItem`` with ``name`` and ``article`` set.
        A field is ``None`` when its selector matches nothing on the page.
    """

    def extract_with_css(query):
        """Return the first match for *query* with tags removed, or None."""
        raw = response.css(query).extract_first()
        if raw is None:
            # No element matched: report the field as missing instead of
            # crashing on ``None.strip()``.
            return None
        # DOTALL lets the non-greedy pattern also remove tags whose
        # attributes wrap across several lines.
        text = re.sub(r'<.*?>', '', raw, flags=re.DOTALL)
        # Strip after tag removal so whitespace that sat just inside the
        # outer wrapper element is trimmed as well.
        return text.strip()

    item = ScrapyArticlesItem()
    item['name'] = extract_with_css('h1.post__title.post__title_full span::text')
    item['article'] = extract_with_css('div.post__text.post__text-html.js-mediator-article')
    yield item
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement