Advertisement
Guest User

crawler

a guest
Apr 5th, 2020
1,314
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
Python 0.89 KB | None | 0 0
  1. import sys
  2. from bs4 import BeautifulSoup
  3. import requests
  4. import urllib.request
  5.  
  6. base_url = 'https://news.naver.com/main/main.nhn?mode=LSD&mid=shm&sid1='
  7. category = [100, 101, 102, 103, 104, 105] #정치, 경제, 사회, 생활문화, 세계, 생활과학
  8. category = [100]
  9.  
  10. for i in category:
  11.     URL = base_url + str(i)
  12.     response = urllib.request.urlopen(URL)
  13.     soup = BeautifulSoup(response, "html.parser")
  14.     #results = soup.select("#section_body .photo a")
  15.     results = soup.select("#section_body")
  16.     print(results)
  17.     #print(response)
  18. #    print(soup)
  19.     #print(URL)
  20. #    for result in results:
  21. #        print("제목 : ", result.attrs["title"])
  22. #        url_article = result.attrs["href"]
  23. #        response = urllib.request.urlopen(url_article)
  24. #        soup_article = BeautifulSoup(response, "html.parser")
  25. #        content = soup_article.select_one("#articleBodyContents")
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement