Advertisement
Guest User

Untitled

a guest
Oct 31st, 2014
141
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
Python 1.27 KB | None | 0 0
  1. #!/usr/bin/python
  2.  
  3. import wikitools as wt
  4. from wikitools import wiki
  5. from wikitools import api
  6. import simplejson as json
  7. from sets import Set
  8. import re
  9. import csv
  10.  
  11. # create a Wiki object
  12. site = wt.Wiki('http://en.wikipedia.org/w/api.php')
  13.  
  14. # default params for API requests
  15. savefile = '../enwiki_geotagged.txt'
  16. articlelist = '../enwiki_noredirect.txt'
  17.  
  18. # read oldids
  19. print "Importing article list..."
  20. rf = open(articlelist, "r")
  21. #k=rf.read().split('\n')
  22. k=rf.readlines()
  23.  
  24.  
  25. # create the request object
  26. def call(params):
  27.     req = wt.APIRequest(site, params)
  28.     try:
  29.         res = req.query()
  30.     except wt.APIError, e:
  31.         res = ''
  32.     return res
  33.  
  34. # default parameters
  35. par1 = {
  36.     'action':'query',
  37.     'prop': 'templates',
  38.     'tllimit':'1',
  39.     'tltemplates': 'Template:Coord'
  40. }
  41.  
  42. rdone = 1
  43. # iterate through rev list
  44. for rev in k:
  45.     rev = rev.strip()
  46.     if len(rev)>0:
  47.         par1['titles'] = rev
  48.         print "--- Checking article: " + rev + "("+ str(rdone) +"/"+ str(len(k)) +")"
  49.         res = call(par1)
  50.         if len(res)>0:
  51.             rv = res['query']['pages']
  52.             key = rv.keys()[0]
  53.             #reponse is kosher
  54.             if 'templates' in rv[key].keys():
  55.                 print rev
  56.                 f=open(savefile,"a")
  57.                 f.write(rev + "\n")
  58.                 f.close()
  59.         else:
  60.             print "Could not retrieve a response from the API"
  61.         rdone+=1
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement