Advertisement
Mysakure

bzoj data spider

Oct 12th, 2019
137
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
Python 1.21 KB | None | 0 0
  1. # -*- coding: utf-8 -*-
  2. import requests
  3. import sys
  4. import re
  5. import os
  6. import time
  7. def mkdir(path):
  8.   folder=os.path.exists(path)
  9.   if not folder:
  10.     if not folder:
  11.       os.makedirs(path)
  12.  
  13. r_url="http://darkbzoj.tk/data/"
  14. root="C:\\Users\MySakure\OneDrive - smail.hunnu.edu.cn\\task\\bzoj\\"
  15. headers = {'Cookie': '__cfduid=d6faa192ae5f2d57da950ac0bd056eaf41569333917; PHPSESSID=5fcsgf440g962ur3bpk13nej97; uoj_username=Mysakure; uoj_username_checksum=45fd50199b1b6c5949aeee8b15b6b16d; uoj_remember_token=pfAW5yNe7AMZ06fGoCZpIHcBnhxxmceuBzupe1V4lAzuUtD3BC48lNCWRc2e; uoj_remember_token_checksum=b8a77a027da07c1d22fff455d95b959e; uoj_preferred_language=C%2B%2B; cf_clearance=cb17d6598a9dc1a328a1c07764b842545a44b5ca-1570937841-0-150',
  16.   'Host': 'darkbzoj.tk',
  17. 'Pragma': 'no-cache',
  18. 'Referer': 'http://darkbzoj.tk/data/',
  19.   'Sec-Fetch-Mode': 'no-cors',
  20. 'User-Agent': 'Mozilla/5.0 (Linux; Android 6.0; Nexus 5 Build/MRA58N) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/77.0.3865.90 Mobile Safari/537.36'}
  21. for i in range(1000,4999):
  22.   url=r_url+str(i)+".zip"
  23.   print(url)
  24.   zip=requests.get(url,headers=headers)
  25.   with open(root + str(i) + ".zip", 'wb') as file:
  26.     file.write(zip.content)
  27.     #time.sleep(1)
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement