Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
import urllib.request
from html.parser import HTMLParser
class _LinkCollector(HTMLParser):
    """Collect the ``href`` value of every ``<a>`` tag fed to the parser."""

    def __init__(self):
        super().__init__()
        self.links = []

    def handle_starttag(self, tag, attrs):
        # HTMLParser lower-cases tag and attribute names before calling this,
        # so `<A HREF=...>` is matched as well.
        if tag != "a":
            return
        for name, value in attrs:
            if name == "href" and value:
                self.links.append(value)
                break  # one link per anchor, even if href is repeated


def getLinks(links):
    """Print every hyperlink target found at a URL, then the link count.

    The page is downloaded in full and parsed as HTML; the ``href`` of each
    ``<a>`` tag is printed on its own line in document order, followed by a
    ``number of links = N`` summary line.

    Args:
        links: URL of the page to scan (any scheme ``urllib.request.urlopen``
            accepts).

    Returns:
        None. The results are written to standard output.

    Raises:
        urllib.error.URLError: If the URL cannot be opened.
    """
    # The context manager closes the response even if reading fails.
    with urllib.request.urlopen(links) as page:
        # Honour the charset the server declares; fall back to UTF-8 and
        # never abort on a stray undecodable byte.
        charset = page.headers.get_content_charset() or "utf-8"
        html = page.read().decode(charset, errors="replace")

    # Parse the markup properly instead of scanning lines for a literal
    # marker: real anchors vary in spacing, case and attribute order, and a
    # marker that never appears would otherwise loop forever at end of input.
    collector = _LinkCollector()
    collector.feed(html)
    collector.close()

    for href in collector.links:
        print(href)
    print("number of links =", len(collector.links))
if __name__ == "__main__":
    # getLinks writes its report to stdout itself and has no return value,
    # so call it directly; wrapping it in print() would only emit "None".
    # The guard keeps the network request from firing on import.
    getLinks('https://www.yahoo.com/')
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement