Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
- #!/usr/bin/env python
- from urllib2 import urlopen
- from sys import argv, exit
- from re import findall
def main(URL):
    """Fetch URL and save the target of every simple anchor to ``URLs.txt``.

    Only anchors written exactly as ``<a href="...">`` (double quotes, no
    other attributes) are matched. Each captured target is written on its
    own line. ``URLs.txt`` is created (or truncated) in the current working
    directory.

    Args:
        URL: Address handed unchanged to ``urlopen``.
    """
    response = urlopen(URL)
    try:
        html = response.read()
    finally:
        # Release the connection even when the read fails.
        response.close()

    # If read() handed back something other than ``str`` (e.g. a bytes
    # object), decode it so the text pattern below can be applied.
    if not isinstance(html, str):
        html = html.decode('utf-8', 'replace')

    # ``[^"\s]+`` stops at the closing quote. The previous ``\S+`` was greedy
    # and merged adjacent anchors such as ``<a href="a">x</a><a href="b">``
    # into a single bogus match.
    links = findall(r'<a href="([^"\s]+)">', html)

    # ``with`` guarantees the file is flushed and closed on every path.
    with open('URLs.txt', 'w') as f:
        for link in links:
            f.write(link + '\n')
# Script entry point: expects exactly one command-line argument, the URL.
if __name__ == '__main__':
    if len(argv) != 2:
        # Wrong argument count: print the usage text and stop with an error.
        exit('Usage: ./scrape.py URL')
    main(argv[1])
Add Comment
Please, Sign In to add comment