Advertisement
Guest User

Untitled

a guest
Oct 21st, 2014
178
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 1.20 KB | None | 0 0
  1. In [1]: from bs4 import BeautifulSoup as bsoup
  2.  
  3. In [2]: import requests as rq
  4.  
  5. In [3]: url = "http://www.livescore.com/soccer/champions-league/"
  6.  
  7. In [4]: r = rq.get(url)
  8.  
  9. In [5]: bs = bsoup(r.text)
  10.  
  11. In [6]: links = bs.find_all("a", class_="scorelink")
  12.  
  13. In [7]: links
  14. Out[7]:
  15. [<a class="scorelink" href="/soccer/champions-league/group-a/atletico-madrid-vs-malmo-ff/1-1821150/" onclick="return false;">? - ?</a>,
  16. <a class="scorelink" href="/soccer/champions-league/group-a/olympiakos-vs-juventus/1-1821151/" onclick="return false;">? - ?</a>,
  17. ...
  18.  
  19. In [8]: links_clean = [link for link in links if link.get_text() != "? - ?"]
  20.  
  21. In [9]: links_clean
  22. Out[9]:
  23. [<a class="scorelink" href="/soccer/champions-league/group-e/cska-moscow-vs-manchester-city/1-1821202/" onclick="return false;">0 - 1</a>,
  24. <a class="scorelink" href="/soccer/champions-league/qualifying-round/zenit-st-petersburg-vs-standard-liege/1-1801440/" onclick="return false;">3 - 0</a>,
  25. ...
  26.  
  27. In [10]: links_final = [link["href"] for link in links_clean]
  28.  
  29. In [11]: links_final
  30. Out[11]:
  31. ['/soccer/champions-league/group-e/cska-moscow-vs-manchester-city/1-1821202/',
  32. '/soccer/champions-league/qualifying-round/zenit-st-petersburg-vs-standard-liege/1-1801440/',
  33. ...
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement