Advertisement
Guest User

Untitled

a guest
Apr 18th, 2018
88
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
Python 0.88 KB | None | 0 0
  1. from bs4 import BeautifulSoup
  2. import urllib, requests
  3.  
  4. user = "whitenoi"
  5. password = "t1ibkMhNzg"
  6. url = "http://www.whitenoiserecords.org/archives/date/2018/01/page/4"
  7. response = requests.get(url,verify=False, auth=(user, password))
  8. soup = BeautifulSoup(response.content, "html.parser")
  9. stuff = soup.find_all("div", class_="post-alt blog")
  10.  
  11. count = 1
  12.  
  13. for experiment in stuff:
  14.     if count < 11:
  15.         data = []
  16.         data.append(str(experiment.find('a')['href']))
  17.  
  18.         for div in experiment.findAll('a'):
  19.             string = str(div.contents[0])
  20.             data.append(string.strip())
  21.  
  22.         print(count)
  23.         print("Link is ", data[0])
  24.         print("Album ", data[1])
  25.         print("Artist ", data[2])
  26.         print("Country ", data[3])
  27.         print("Label ", data[4])
  28.         genre = ",".join(data[5:])
  29.         print("Genre ", genre)
  30.     count += 1
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement