Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
import os
import re
import sys

import bs4
import requests
# Thread pages look like https://2ch.hk/<board>/res/<thread>.html.
# Raw string with escaped dots; the original's [A-z] range also matched
# the punctuation between 'Z' and 'a' ([ \ ] ^ _ `), so spell the class out.
THREAD_URL_RE = re.compile(
    r'https://2ch\.hk/([A-Za-z0-9_]+)/res/([0-9]+)\.html')

# Attachment links contain .../src/<digits>/<filename>.  The original
# pattern's unescaped dots accepted any two characters before "/src/",
# so keep that tolerance explicit instead of requiring a literal "../".
ATTACHMENT_HREF_RE = re.compile(r'/src/[0-9]+/(.+)')

# Seconds to wait on each HTTP request; requests has no default timeout.
REQUEST_TIMEOUT = 30


def parse_thread_url(url):
    """Return ``(board, thread_id)`` for the first thread URL found in *url*.

    Returns ``None`` when *url* contains no 2ch.hk thread URL.
    """
    match = THREAD_URL_RE.search(url)
    if match is None:
        return None
    return match.groups()


def attachment_name(href):
    """Return the bare attachment filename referenced by *href*.

    Returns ``None`` when *href* is not an attachment link or when the
    name would not be a plain file name.  Only the final path component
    is kept, because the value comes from a downloaded page and is later
    used as a local path: it must not be able to escape the current
    directory.
    """
    match = ATTACHMENT_HREF_RE.search(href or '')
    if match is None:
        return None
    name = os.path.basename(match.group(1))
    if name in ('', '.', '..'):
        return None
    return name


def download_attachments(thread_url, board, thread_id):
    """Download every attachment linked from the thread page.

    Fetches *thread_url*, collects the ``<a class="desktop"
    target="_blank">`` links, and saves each referenced file into the
    current working directory under its own name.

    Raises ``requests.HTTPError`` if the thread page itself cannot be
    fetched; a failure on a single attachment is reported on stderr and
    the remaining attachments are still processed.
    """
    page = requests.get(thread_url, timeout=REQUEST_TIMEOUT)
    page.raise_for_status()
    soup = bs4.BeautifulSoup(page.text, 'lxml')
    links = soup.find_all('a', {'class': 'desktop', 'target': '_blank'})

    seen = set()
    for link in links:
        name = attachment_name(link.get('href'))
        # The URL below is derived only from the name, so a repeated name
        # is the same file; skip it instead of downloading it again.
        if name is None or name in seen:
            continue
        seen.add(name)

        print('%s %s %s' % (board, thread_id, name))
        print('')

        file_url = ('https://2ch.hk/' + board + '/src/' + thread_id
                    + '/' + name)
        response = requests.get(file_url, timeout=REQUEST_TIMEOUT)
        if not response.ok:
            # Do not save an HTTP error page under the attachment's name.
            sys.stderr.write('skipping %s: HTTP %d\n'
                             % (file_url, response.status_code))
            continue

        # Open the file only after a successful download so that a failed
        # request never leaves an empty file behind.
        with open(name, 'wb') as handle:
            handle.write(response.content)


def main(argv=None):
    """Script entry point; returns the process exit status.

    *argv* is the argument list without the program name and defaults
    to ``sys.argv[1:]``.  The first argument must be a thread URL.
    """
    args = sys.argv[1:] if argv is None else argv
    if not args:
        sys.stderr.write('usage: %s https://2ch.hk/<board>/res/<thread>.html\n'
                         % sys.argv[0])
        return 2

    parsed = parse_thread_url(str(args[0]))
    if parsed is None:
        sys.stderr.write('not a 2ch.hk thread URL: %s\n' % args[0])
        return 1

    board, thread_id = parsed
    download_attachments(str(args[0]), board, thread_id)
    return 0


if __name__ == '__main__':
    sys.exit(main())
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement