Advertisement
Guest User

2chhkimgdl.py

a guest
Aug 22nd, 2016
162
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
Python 0.54 KB | None | 0 0
  1. import requests
  2. import bs4
  3. import re
  4. import sys
  5.  
  6. rr = re.findall('https:\/\/2ch.hk\/([A-z0-9]+)\/res\/([0-9]+).html', str(sys.argv[1]))
  7. if len(rr)>0:
  8.     r = requests.get(str(sys.argv[1]))
  9.     s = bs4.BeautifulSoup(r.text, 'lxml')
  10.     z = s.find_all('a', {'class':'desktop', 'target':'_blank'})
  11.     for i in xrange(len(z)):
  12.         fn = re.findall('../src/[0-9]+/(.+)', z[i]['href'])
  13.         print rr[0][0], rr[0][1], fn
  14.         print
  15.         f = open(fn[0], 'wb')
  16.         rc = requests.get('https://2ch.hk/'+rr[0][0]+'/src/'+rr[0][1]+'/'+fn[0])
  17.         f.write(rc.content)
  18.         f.close()
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement