Advertisement
Guest User

Untitled

a guest
Oct 19th, 2017
288
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 1.14 KB | None | 0 0
  # User-Agent header value sent with every IMDb request built in this file.
  user_agent = (
      "Mozilla/5.0 (Windows NT 6.1) AppleWebKit/537.36 "
      "(KHTML, like Gecko) Chrome/28.0.1468.0 Safari/537.36"
  )
  # Prefix of an IMDb title page URL; the title id and a trailing "/" are
  # appended by get_IMDB_page().
  base_url = "http://www.imdb.com/title/"
  def get_IMDB_page(imdb_id):
      """Download the IMDb title page for *imdb_id* and return its raw body.

      The URL is ``base_url + imdb_id + "/"`` and the request carries the
      module-level ``user_agent`` as its User-Agent header.

      Args:
          imdb_id: Title identifier string appended to ``base_url``
              (presumably of the form ``tt1234567`` -- confirm with callers).

      Returns:
          The response body as returned by ``response.read()``, or the empty
          string ``""`` when the request fails with ``urllib2.URLError`` or
          ``socket.error``. Failures are reported through ``defaultLog``.
      """
      url = base_url + imdb_id + "/"
      req = urllib2.Request(url)
      req.add_header('User-Agent', user_agent)
      # NOTE: this sets the process-wide default socket timeout, not just the
      # timeout of this request; kept because other code may rely on it.
      socket.setdefaulttimeout(30)
      try:
          response = urllib2.urlopen(req)
          try:
              return response.read()
          finally:
              # Close only a response that was actually opened. The handlers
              # below must not touch `response`: it is unbound when urlopen()
              # itself raised.
              response.close()
      except (urllib2.URLError, socket.error) as err:
          defaultLog(addonLanguage(32505) % (err,))
          return ""
  23.  
  def parse_IMDb_page(imdb_id):
      """Fetch the IMDb page for *imdb_id*, retrying until it loads, and parse it.

      ``get_IMDB_page`` is called repeatedly, sleeping one second after every
      empty result, until it returns a non-empty page. There is no retry
      limit, so this call blocks for as long as the download keeps failing.

      Args:
          imdb_id: Title identifier passed through to ``get_IMDB_page``.
      """
      while True:
          html = get_IMDB_page(imdb_id)
          if html != "":
              break
          # An empty string means the download failed; wait before retrying.
          time.sleep(1)
      # NOTE(review): indentation was lost in the pasted source; parsing is
      # assumed to happen once, after a page has been fetched successfully.
      # NOTE(review): the visible snippet ends here, so `soup` is never used
      # or returned -- the remainder of the function appears to be missing.
      soup = beautifulsoup(html)
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement