Advertisement
Guest User

Untitled

a guest
Jan 19th, 2017
80
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
Python 1.23 KB | None | 0 0
  1. import requests
  2. from bs4 import BeautifulSoup
  3.  
  4. movielinkArray = []
  5. titleArray = []
  6. combineArray = []
  7. reviewsArray=[]
  8. movielink2Array = []
  9. idArray=[]
  10. id=''
  11. link=''
  12. def start():
  13.     for id in range(11):
  14.         link='https://tw.movies.yahoo.com/movie_intheaters.html?p='+str(id+1)
  15.         res = requests.get(link)
  16.         soup = BeautifulSoup(res.text, 'html.parser')
  17.         print("第"+str(id+1)+"頁========================================")
  18.         for link in soup.find_all('div',class_="row-container"):
  19.             titleArray.append(link.find('h4').text)
  20.             movielinkArray.append(link.find('h4').find('a').get('href'))
  21.             #print(link.find('h4').find('a').get('href'))
  22.             firstlevel(movielinkArray)    
  23.            
  24.          
  25.            
  26.            
  27. def firstlevel(movielinkArray):
  28.      link=''.join(movielinkArray)
  29.      res = requests.get(link)
  30.      soup = BeautifulSoup(res.text, 'html.parser')
  31.      for link in soup.find_all('li',class_="last"):
  32.          print("https://tw.movies.yahoo.com"+link.find('span').find('a').get('href'))
  33.          movielink2Array.append("https://tw.movies.yahoo.com"+link.find('span').find('a').get('href'))
  34.  
  35.          
  36. if __name__=='__main__':
  37.     start()
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement