Advertisement
Guest User

Untitled

a guest
Jul 23rd, 2018
211
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
Python 1.22 KB | None | 0 0
  1. import sys
  2. import requests
  3. import re
  4.  
  5.  
  6.  
  7. def check_for_redirects(url):
  8.     try:
  9.         r = requests.get(url if url.startswith('http') else "http://%s" % url, allow_redirects=True, timeout=7)
  10.         if strip_url(r.url) == strip_url(url):
  11.             return url
  12.         else:
  13.             return strip_url(r.url)
  14.     except requests.exceptions.Timeout:
  15.         return 'expired'
  16.     except requests.exceptions.ConnectionError:
  17.         return 'expired'
  18.  
  19. def strip_url(url):
  20.     url = url.replace("https://", "")
  21.     url = url.replace("http://", "")
  22.     try:
  23.         url = re.split("www\d*.", url)[1]
  24.     except:
  25.         pass
  26.     first_slash = url.find('/')
  27.     if first_slash != -1:
  28.         url = url[:first_slash]
  29.     return url.strip()
  30.  
  31.  
  32. def check_domains(urls, f):
  33.     for url in urls:
  34.         redirect_url = check_for_redirects(url)
  35.         print("%s - %s" % (url, redirect_url))
  36.         f.write("%s - %s" % (url, redirect_url) + '\n')
  37.  
  38.  
  39. if __name__ == '__main__':
  40.     fname = 'domain_list.txt'
  41.     out1 = open("out1", "w")
  42.     try:
  43.         fname = sys.argv[1]
  44.     except IndexError:
  45.         pass
  46.     urls = (l.strip() for l in open(fname).readlines())
  47.     check_domains(urls, out1)
  48.     out1.close()
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement