Advertisement
Guest User

Untitled

a guest
Jul 26th, 2017
96
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 0.86 KB | None | 0 0
  1. import scrapy
  2. from shopclues.items import ShopcluesItem
  3. from scrapy.contrib.spiders import CrawlSpider, Rule
  4. from scrapy.contrib.linkextractors.sgml import SgmlLinkExtractor
  5.  
  6. class ShopcluesSpider(scrapy.Spider):
  7. name = 'shopclues'
  8. allowed_domains = ['http://www.shopclues.com/search?
  9. q=samsung&sc_z=4444&z=0']
  10. start_urls = ['http://www.shopclues.com/search?
  11. q=samsung&sc_z=4444&z=0/']
  12. rules = (
  13. Rule(SgmlLinkExtractor(allow=()), callback="parse_items", follow=
  14. True))
  15. def parse(self, response):
  16. prices =
  17. response.xpath('//span[@class="p_price"]/text()').extract()
  18. discounts =
  19. response.xpath('//span[@class="prd_discount"]/text()').extract()
  20. for item in zip(prices,discounts):
  21. scraped_info = {
  22. 'prices' : item[0],
  23.  
  24. 'discounts' : item[1]
  25. }
  26. yield scraped_info
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement