Advertisement
Guest User

Untitled

a guest
Jun 22nd, 2017
64
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 0.46 KB | None | 0 0
  1. import scrapy
  2. from articles_crawler.items import SubjectItem, AuthorItem, ArticleItem
  3.  
  4. class ArticlesSpider(scrapy.spiders.XMLFeedSpider):
  5. name = "articles"
  6. start_urls = ['http://gizmodo.uol.com.br/feed/']
  7. iterator = 'xml'
  8. itertag = 'item'
  9.  
  10. def parse_node(self, response, node):
  11. node.remove_namespaces()
  12. authorItem = AuthorItem()
  13. authorItem['name'] = node.xpath('//creator/text()').extract()
  14. return authorItem
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement