Advertisement
Guest User

spider settings

a guest
May 8th, 2016
258
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
Python 0.75 KB | None | 0 0
  1. # -*- coding: utf-8 -*-
  2.  
  3. # Scrapy settings for ia_check project
  4.  
  5. BOT_NAME = 'ia_check'
  6.  
  7. SPIDER_MODULES = ['ia_check.spiders']
  8. NEWSPIDER_MODULE = 'ia_check.spiders'
  9. DOWNLOAD_HANDLERS = {'s3':None}
  10.  
  11. DOWNLOADER_MIDDLEWARES = {
  12. 'scrapy_splash.SplashCookiesMiddleware': 723,
  13. 'scrapy_crawlera.CrawleraMiddleware': 600,
  14. 'scrapyjs.SplashMiddleware': 725
  15. }
  16.  
  17. SPLASH_URL = 'http://192.168.59.103:8050' # http://localhost:8050/
  18.  
  19. DUPEFILTER_CLASS = 'scrapyjs.SplashAwareDupeFilter'
  20. HTTPCACHE_STORAGE = 'scrapyjs.SplashAwareFSCacheStorage'
  21.  
  22. CRAWLERA_ENABLED = True
  23. CRAWLERA_APIKEY = '7ea1c5bc865849d4bbacba460e7122ac'
  24.  
  25. # DOWNLOAD_DELAY=3
  26. # The download delay setting will honor only one of:
  27. CONCURRENT_REQUESTS_PER_DOMAIN=16
  28. CONCURRENT_REQUESTS_PER_IP=16
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement