Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
- # Script to read a metalink XML file and pull down (via wget) the TED talks listed in it.
- import os
def box(num, low, up):
    """Classify ``num`` relative to the window bounded by ``low`` and ``up``.

    Args:
        num: The value to classify.
        low: Lower bound of the window (exclusive).
        up: Upper bound of the window (exclusive).

    Returns:
        1 if ``num`` is at or below ``low`` (window not reached yet),
        2 if ``num`` is at or above ``up`` (window already passed),
        0 otherwise, i.e. ``low < num < up``.
    """
    # NOTE(review): the original condition read ``low = num``, which is not
    # valid Python; ``>=`` is the presumed intent -- confirm against the
    # author's expected start/stop semantics.
    # The lower bound is tested first, so it wins when both bounds match.
    if low >= num:
        return 1
    if num >= up:
        return 2
    return 0
def main(ptr, start, stop):
    """Download files listed in a metalink-style XML file using wget.

    The file is scanned line by line. Every line containing ``file name=``
    increments a running counter (printed as progress). The entry is
    downloaded when ``box(count, start, stop)`` returns 0, and scanning stops
    when it returns 2, when a line containing ``</metalink>`` is seen, or at
    end of file.

    Args:
        ptr: Path of the XML file to read.
        start: Lower bound passed to ``box`` to select entries.
        stop: Upper bound passed to ``box`` to select entries.
    """
    # Imported locally so this function does not depend on a file-level
    # import being added elsewhere.
    import subprocess

    count = 0
    with open(ptr, "r") as f:
        # iter(f.readline, "") ends at EOF, so a file without a closing
        # </metalink> tag can no longer spin forever. Plain readline() is
        # kept (rather than ``for line in f``) because extra lines are
        # consumed inside the loop body.
        for s in iter(f.readline, ""):
            if "file name=" in s:
                count += 1
                print(count)
                position = box(count, start, stop)
                if position == 0:
                    # The quoted attribute value is the file name; keep the
                    # path component after the first "/".
                    fname = s.split('"')[1]
                    fname = fname.split("/")[1]
                    # Skip one line, then slice the URL out of the next one.
                    # NOTE(review): assumes a fixed layout where the URL is
                    # preceded by 33 characters and followed by 7 (including
                    # the newline) -- confirm against the input format.
                    f.readline()
                    u = f.readline()[33:-7]
                    # Argument list instead of a shell string: names and URLs
                    # come from the input file and must not be interpreted
                    # by a shell.
                    subprocess.call(
                        ["wget", "-c", "-O", "talks/%s" % fname, u]
                    )
                elif position == 2:
                    break
            elif "</metalink>" in s:
                break
if __name__ == "__main__":
    # Command-line entry point: <filename> <start> <stop>.
    import sys

    if len(sys.argv) != 4:
        # sys.exit with a string writes it to stderr and exits with status 1,
        # so a usage error is no longer reported as success.
        sys.exit("Expected 3 args. <filename> <start> <stop>")
    main(sys.argv[1], int(sys.argv[2]), int(sys.argv[3]))
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement