Advertisement
Not a member of Pastebin yet?
Sign Up, it unlocks many cool features!
- In [1]: from bs4 import BeautifulSoup as bsoup
- In [2]: import requests as rq
- In [3]: url = "http://www.livescore.com/soccer/champions-league/"
- In [4]: r = rq.get(url)
- In [5]: bs = bsoup(r.text)
- In [6]: links = bs.find_all("a", class_="scorelink")
- In [7]: links
- Out[7]:
- [<a class="scorelink" href="/soccer/champions-league/group-a/atletico-madrid-vs-malmo-ff/1-1821150/" onclick="return false;">? - ?</a>,
- <a class="scorelink" href="/soccer/champions-league/group-a/olympiakos-vs-juventus/1-1821151/" onclick="return false;">? - ?</a>,
- ...
- In [8]: links_clean = [link for link in links if link.get_text() != "? - ?"]
- In [9]: links_clean
- Out[9]:
- [<a class="scorelink" href="/soccer/champions-league/group-e/cska-moscow-vs-manchester-city/1-1821202/" onclick="return false;">0 - 1</a>,
- <a class="scorelink" href="/soccer/champions-league/qualifying-round/zenit-st-petersburg-vs-standard-liege/1-1801440/" onclick="return false;">3 - 0</a>,
- ...
- In [10]: links_final = [link["href"] for link in links_clean]
- In [11]: links_final
- Out[11]:
- ['/soccer/champions-league/group-e/cska-moscow-vs-manchester-city/1-1821202/',
- '/soccer/champions-league/qualifying-round/zenit-st-petersburg-vs-standard-liege/1-1801440/',
- ...
Advertisement
Add Comment
Please sign in to add a comment.
Advertisement