Advertisement
Guest User

Untitled

a guest
May 25th, 2018
66
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
Python 0.48 KB | None | 0 0
  def soething(self):
      """Yield one request per URL in ``pages_urls``.

      Resets ``self.agency_url_list`` to an empty list, then yields a
      ``scrapy.Request`` for every page URL with ``parse_agency_urls`` as
      the callback. ``dont_filter=True`` is passed on every request.

      NOTE(review): ``pages_urls`` is not defined in this method; it is
      presumably a module-level name -- confirm it is not meant to be an
      attribute of ``self``.

      Yields:
          scrapy.Request: one request per entry of ``pages_urls``.
      """
      self.agency_url_list = []
      for page_url in pages_urls:
          yield scrapy.Request(
              page_url, callback=self.parse_agency_urls, dont_filter=True
          )
      # NOTE(review): this line runs as soon as the generator is exhausted.
      # The callbacks for the requests yielded above are invoked later by
      # the framework, so the list may still be empty or partial here.
      # Call form of print is valid on both Python 2 and Python 3.
      print(self.agency_url_list)
  8.  
  def parse_agency_urls(self, response):
      """Collect agency links from a page into ``self.agency_url_list``.

      Selects the ``href`` of every ``<a>`` element whose ``class``
      attribute contains ``catalog__cell-content`` and appends each
      non-empty value to ``self.agency_url_list``.

      Args:
          response: object exposing ``xpath(query)`` whose result supports
              ``extract()`` (presumably a Scrapy response -- confirm).
      """
      hrefs = response.xpath(
          "//a[contains(@class, 'catalog__cell-content')]/@href"
      ).extract()
      # Take the attribute values directly instead of round-tripping them
      # through the '.*' regex, which also produced empty matches that then
      # had to be filtered out. Empty hrefs are still skipped.
      self.agency_url_list.extend(href for href in hrefs if href != '')
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement