Advertisement
Guest User

Untitled

a guest
Jan 23rd, 2017
132
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
Python 0.93 KB | None | 0 0
  def UrlConstructor(self, date_list, first_id=1485048700, last_id=1487000000,
                     out_path="listOfArticlePaths.txt"):
      """Scan a range of article ids and record every URL that validates.

      For each id in ``[first_id, last_id)`` a candidate URL of the form
      ``https://ria.ru/politics/<date without dashes>/<id>.html`` is built
      for the current date and passed to ``self.CheckValid``.  If that
      misses and a later date exists, the same id is tried under the next
      date; a hit there advances the current date.  Every validated URL is
      appended to ``out_path``, one per line.

      Args:
          date_list: Sequence of dates, in scan order.  Each entry is passed
              through ``str()`` and has its ``-`` characters removed
              (presumably ISO dates such as ``2017-01-23`` -- confirm
              against the caller).
          first_id: First article id to try (inclusive).
          last_id: End of the id range (exclusive).
          out_path: File that validated URLs are appended to.

      Returns:
          None.  Results are reported through ``out_path`` and stdout.

      Behaviour changes from the previous version:
          * A hit under the next date is now written out (it used to be
            validated and then dropped).
          * The date cursor really advances, so dates beyond the second
            entry of ``date_list`` can be reached.
          * A miss on the last date no longer aborts the whole scan.
          * An empty ``date_list`` returns immediately instead of raising
            IndexError.
          * Ids are generated lazily instead of building the whole list of
            formatted strings up front.
      """
      if not date_list:
          return

      urlcommon = "https://ria.ru/politics/"

      def build_url(day, id_text):
          # Dates are embedded without separators, e.g. 2017-01-23 -> 20170123.
          return urlcommon + str(day).replace("-", '') + "/" + id_text + ".html"

      index = 0
      article_id = first_id
      # A plain counter keeps the scan lazy on both Python 2 and Python 3
      # (xrange only exists on 2; range would build a full list there).
      while article_id < last_id:
          id_text = '{0:09d}'.format(article_id)
          article_id += 1
          # Single-argument print(...) behaves the same on Python 2 and 3.
          print(id_text)
          url = build_url(date_list[index], id_text)
          print(url)
          # CheckValid is defined elsewhere and its return type is not
          # visible here, so the original strict comparison is kept.
          found = self.CheckValid(url) == True  # noqa: E712
          if not found and index + 1 < len(date_list):
              # The id may belong to the following day; try it there.
              url = build_url(date_list[index + 1], id_text)
              found = self.CheckValid(url) == True  # noqa: E712
              if found:
                  index += 1
          if found:
              with codecs.open(out_path, 'a') as f:
                  f.write(url + "\n")
              print("я нашел статью и записал ее, вот: " + url)
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement