Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
"""Print details for the posts listed on one archive page.

For each ``div`` with class ``post-alt blog`` on the page, the first
anchor's ``href`` is printed as the link, and the anchor texts are printed
in order under the labels Album, Artist, Country and Label; any remaining
anchor texts are joined with commas and printed as Genre.
"""
import os
import urllib  # unused by this script; retained from the original import line

import requests
from bs4 import BeautifulSoup

# NOTE(security): credentials were hard-coded in the original script.  They
# remain as defaults so existing runs behave the same, but can be overridden
# through the environment.  Prefer rotating them and supplying them via the
# environment only.
USER = os.environ.get("WHITENOISE_USER", "whitenoi")
PASSWORD = os.environ.get("WHITENOISE_PASSWORD", "t1ibkMhNzg")

ARCHIVE_URL = "http://www.whitenoiserecords.org/archives/date/2018/01/page/4"
MAX_POSTS = 10  # the original stopped printing after ten posts
REQUEST_TIMEOUT = 30  # seconds; without a timeout requests may block forever


def _anchor_text(anchor):
    """Return the stripped string form of an anchor's first child, or ''."""
    # An empty <a></a> has no contents; indexing it would raise IndexError.
    if not anchor.contents:
        return ""
    return str(anchor.contents[0]).strip()


def _print_post(number, post):
    """Print one post's details; return False if the post has no usable link."""
    first_anchor = post.find("a")
    if first_anchor is None or not first_anchor.has_attr("href"):
        return False

    link = str(first_anchor["href"])
    texts = [_anchor_text(anchor) for anchor in post.find_all("a")]
    # Pad so posts with fewer than four anchors print empty fields
    # instead of raising IndexError.
    album, artist, country, label = (texts + [""] * 4)[:4]
    genre = ",".join(texts[4:])

    print(number)
    print("Link is ", link)
    print("Album ", album)
    print("Artist ", artist)
    print("Country ", country)
    print("Label ", label)
    print("Genre ", genre)
    return True


def main():
    """Fetch the archive page and print up to MAX_POSTS posts.

    Raises:
        requests.RequestException: if the request fails, times out, or the
            server answers with an HTTP error status.
    """
    # verify=False is kept from the original call; it only matters if the
    # request ends up on HTTPS, where it turns off certificate verification.
    response = requests.get(
        ARCHIVE_URL,
        verify=False,
        auth=(USER, PASSWORD),
        timeout=REQUEST_TIMEOUT,
    )
    # Fail loudly on 4xx/5xx rather than parsing an error page and
    # printing nothing.
    response.raise_for_status()

    soup = BeautifulSoup(response.content, "html.parser")
    posts = soup.find_all("div", class_="post-alt blog")

    count = 1
    for post in posts:
        if count > MAX_POSTS:
            break
        if _print_post(count, post):
            count += 1


if __name__ == "__main__":
    main()
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement