Advertisement
Guest User

Untitled

a guest
Jun 30th, 2016
65
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 1.18 KB | None | 0 0
  1. import sys
  2. reload(sys)
  3. sys.setdefaultencoding("utf-8")
  4. sys.path.insert(0, 'libs')
  5. import webapp2
  6. from bs4 import BeautifulSoup
  7. import math
  8. import urllib2
  9.  
  10. class MainPage(webapp2.RequestHandler):
  11. def get(self, args1, args2):
  12.  
  13. url = "http://emart.ssg.com/category/list.ssg?dispCtgId="
  14. url += str(args1)
  15. url += "&page="
  16. url += str(args2)
  17.  
  18. print("log_print" + url);
  19. data = ""
  20. source_code = urllib2.urlopen(url).read()
  21. plain_text = source_code
  22. soup = BeautifulSoup(plain_text, "html.parser")
  23.  
  24. for info_list in soup.find("tbody").find_all(class_="item w202"):
  25. title = info_list.find(class_="title").a["title"]
  26.  
  27. if title is None:
  28. continue
  29. else:
  30. data += title
  31. data += "t"
  32.  
  33. price = info_list.find(class_="price")
  34.  
  35. if price is None:
  36. continue
  37. else:
  38. data += price.strong.string
  39. data += "t"
  40.  
  41. img_url = info_list.find(class_="thm").a.img["src"]
  42.  
  43. if img_url is None:
  44. continue
  45. else:
  46. data += "http:" + img_url
  47. data += "t"
  48.  
  49. code = img_url.split("/")[7].split("_")[0]
  50.  
  51. data += code + "n"
  52.  
  53. self.response.write(data)
  54.  
  55. app = webapp2.WSGIApplication([('/emart_product_v2/(d+)_(d+)', MainPage),], debug=True)
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement