Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
# Load one eBay search-results page in Chrome and print, for every
# <li class="s-item"> element, the list of <a> tags that carry an href.
import re  # only referenced by the alternative snippets kept below

from bs4 import BeautifulSoup
from selenium import webdriver

browser = webdriver.Chrome('/Users/kenny/Dropbox/Python/chromedriver')
try:
    browser.get('https://www.ebay.com/sch/i.html?_from=R40&_nkw=watches&_sacat=0&_pgn=1')

    # Parse a snapshot of the page source; later browser actions do not
    # change what `bs` contains.
    bs = BeautifulSoup(browser.page_source, 'lxml')
    browser.maximize_window()

    # find_all is the current name of the deprecated findAll alias.
    for item in bs.find_all('li', class_='s-item'):
        links = item.find_all('a', href=True)
        print(links)

    # Alternative link-extraction approaches that were tried:
    # links = [a['href'] for a in bs.select('a[href]')]
    # links = bs.find('a', href=re.compile(r'[/]([a-z]|[A-Z])\w+')).attrs['href']
    # links = bs.findAll('a', attrs={'href': re.compile("^http://")})
finally:
    # quit() ends the whole WebDriver session (and the driver process);
    # close() would only close the current window. Running it in `finally`
    # ensures the browser is released even if loading or parsing fails.
    browser.quit()
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement