Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
import sys
from urllib.parse import urljoin

import requests
from bs4 import BeautifulSoup
# Page that is scraped; also the base against which relative hrefs resolve.
PAGE_URL = 'https://tw.video.yahoo.com/'

# Seconds to wait for the server before giving up (requests has no default
# timeout, so without this a stalled connection would hang forever).
REQUEST_TIMEOUT = 10


def absolute_links(base_url, hrefs):
    """Return absolute URLs for *hrefs*, resolved against *base_url*.

    Args:
        base_url: URL of the page the hrefs were found on.
        hrefs: Iterable of raw ``href`` values; entries may be ``None`` or
            empty when an anchor has no usable target.

    Returns:
        A list of absolute URL strings, in input order. Missing/empty hrefs
        are skipped instead of raising ``TypeError``.
    """
    # urljoin handles root-relative ("/x"), relative ("x") and already
    # absolute hrefs; plain string concatenation produced "host//x" or
    # "hosthttps://..." for the first and last of those.
    return [urljoin(base_url, href) for href in hrefs if href]


def combine_entries(titles, links):
    """Pair each title with its link as ``"<title> <link>"``.

    Args:
        titles: Iterable of title strings.
        links: Iterable of link strings.

    Returns:
        A list of combined strings. Pairing stops at the shorter input, so
        a page with fewer titles than links no longer raises ``IndexError``.
    """
    return [title + ' ' + link for title, link in zip(titles, links)]


def main():
    """Fetch the page, print its HTML, then print links, titles and pairs.

    Raises:
        requests.RequestException: if the request fails, times out, or the
            server answers with an HTTP error status.
    """
    print('===== start =====')
    res = requests.get(PAGE_URL, timeout=REQUEST_TIMEOUT)
    res.raise_for_status()
    print(res.text)
    print('===== end =====')

    # Parse the fetched HTML into 'soup'.
    soup = BeautifulSoup(res.text, 'html.parser')

    # NOTE(review): the class names below are taken as-is from the original
    # script; they presumably match the video cards on the page -- confirm
    # against the current markup.
    hrefs = [anchor.get('href')
             for anchor in soup.find_all('a', class_="W(290px)")]
    link_array = absolute_links(PAGE_URL, hrefs)
    for link in link_array:
        print(link)

    title_array = [heading.text
                   for heading in soup.find_all('h2', class_="Fz(16px)")]
    for title in title_array:
        print(title)

    # Titles and links are collected by two independent queries, so they are
    # matched purely by position.
    combine_array = combine_entries(title_array, link_array)
    for entry in combine_array:
        print(entry)


if __name__ == '__main__':
    main()
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement