Advertisement
Guest User

Untitled

a guest
Jul 1st, 2015
179
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 0.87 KB | None | 0 0
  1. import argparse
  2. import requests
  3. import os
  4. from lxml import html
  5.  
  6. parser = argparse.ArgumentParser()
  7. parser.add_argument("url", type=str,
  8. help="download an slideshare presentation given the url")
  9. args = parser.parse_args()
  10.  
  11.  
  12. def slideshare_down(request_url):
  13. page = requests.get(request_url)
  14. tree = html.fromstring(page.text)
  15. counter = 1
  16.  
  17. all_images = tree.xpath('//img[@class="slide_image"]')
  18. print(("Downloading presentation images."))
  19. for img in all_images:
  20. file_url = img.get("data-full")
  21.  
  22. input_page = "slide_%d.jpg" % counter
  23. os.system('curl -s "%s" -o %s' % (file_url, input_page))
  24.  
  25. counter += 1
  26.  
  27. print("Merging images with ImageMagick, please wait.")
  28. os.system('convert -density 300 *.jpg -quality 100 presentation.pdf')
  29. os.system('rm slide_*.jpg')
  30. print("Done!")
  31.  
  32. slideshare_down(args.url)
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement