Advertisement
Guest User

Untitled

a guest
Oct 26th, 2016
283
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 4.09 KB | None | 0 0
  # Disabled earlier prototype, kept as a bare triple-quoted string (a no-op
  # expression statement). It read sqlerr.txt, fetched http://www.ya.ru and
  # printed YES/NO depending on whether the first error string was found in
  # the response text.
  1. '''import requests
  2.  
  3. file = open('sqlerr.txt' , 'r')
  4. err_list = file.readlines()
  5. file.close()
  6. resp = requests.get('http://www.ya.ru')
  7. #print resp.text
  8. #err = 'DOCTYPE'
  9. err = str(err_list[0])
  10. err = err.strip()
  11. print err
  12. if resp.text.find(err)>0:
  13. print 'YES'
  14. else:
  15. print 'NO'
  16.  
  17. '''
  18. import requests
  19. import re
  20. import os
  21. import string
  # Stage 1: collect candidate URLs.
  # Reads the error-string list from sqlerr.txt, prints a banner, empties
  # url_pars.txt, then for every line of dorks.txt requests Bing result pages
  # and appends each extracted result link to url_pars.txt.
  # NOTE(review): the paste lost its indentation, so the nesting of the loops
  # and try/except bodies below is inferred -- confirm against the original.
  # NOTE(review): Python 2 syntax (print statement, raw_input).
  22. #------------------------sqlerr.txt------------------------------
  23. file = open('sqlerr.txt' , 'r')
  24. err_list = file.readlines()
  25. file.close()
  26. print' ______________________________________'
  27. print'| |'
  28. print'| Parser dork from |'
  29. print'| _ |'
  30. print'| |_) o ._ _ _ _ ._ _ |'
  31. print'| |_) | | | (_| o (_ (_) | | | |'
  32. print'| _| |'
  33. print'|______________________________________|'
  34. print
  35. #--------------------------------------------------------------
  # Opening in 'w' mode and closing immediately truncates url_pars.txt, so
  # links left over from a previous run are discarded.
  36. file = open('url_pars.txt', 'w')
  37. file.close()
  38. #search = raw_input('Text of dork (example:index.php?id=):')
  39. #search = 'post.php?id='
  40. #------------------Dorks list----------------------------------
  41. dorks = open('dorks.txt' , 'r')
  42. dorks_list = dorks.readlines()
  43. dorks.close()
  44. #--------------------------------------------------------------
  # The entered number is multiplied by 10 and used as the upper bound for
  # 'count', which is sent as Bing's 'first' offset and advances by 10.
  # int() raises ValueError on non-numeric input; it is not handled here.
  45. pages = int(raw_input('Number of page: '))*10
  46. #pages = 10
  47. for i in range(len(dorks_list)):
  48. search = dorks_list[i].strip()
  49. #print 'Number of dorks: '+str(len(dorks_list))
  50. print 'Use dork: '+search
  51. count = 1
  52. while (count < pages):
  53. #http://www.bing.com/search?q=index.php?id=&go=&filt=all&first=1&FORM=PERE3
  # NOTE(review): 'search' is concatenated into the query string without
  # URL-encoding.
  54. req = ('http://www.bing.com/search?q=' + search + '&first='+str(count))
  # NOTE(review): the bare except only prints a message. If the first request
  # fails, 'response' is unbound when used below; on later failures the
  # previous page's response would be parsed again.
  55. try:
  56. response = requests.get(req)
  57. except:
  58. print 'Error get bing.com'
  59. #print response.text
  60. req = ''
  61. try:
  # Captures the href of every anchor that directly follows an <h2> tag.
  62. link = re.findall('<h2><a href="(.+?)"', response.text, re.DOTALL)
  # NOTE(review): this loop reuses 'i', the same name as the dork loop index.
  63. for i in range(len(link)):
  64. #print link[i]
  65. #if link[i].find('yandex'):
  66. # print 'YANDEX'
  67. #else:
  # str.find returns -1 (truthy) when the substring is absent and 0 (falsy)
  # when the link starts with it, so this test is false only for links that
  # begin with http://bs.yandex.ru.
  68. if link[i].find('http://bs.yandex.ru'):
  69. print 'url: '+link[i]
  # Appends the link followed by a literal single-quote character and a
  # newline. The file object is never explicitly closed.
  70. open('url_pars.txt', 'a+').write(link[i] +'\'' + '\n')
  71. #else:
  72. #print 'ya'
  73. #count = count+10
  74. #print count
  # NOTE(review): bare except -- any error in the parsing section is reported
  # only as this generic message.
  75. except:
  76. print 'Error parsing url'
  77. count = count+10
  78. #print count
  79. #---------------------Delete duplicates-------------------------
  80. def f7(seq):
  81. seen = set()
  82. seen_add = seen.add
  83. return [ x for x in seq if not (x in seen or seen_add(x))]
  84.  
  # Stage 2: de-duplicate and check.
  # Reads url_pars.txt, writes the de-duplicated lines (via f7) to url.txt,
  # then fetches every URL and searches the response text for each string
  # from sqlerr.txt; matching URLs are appended to good.txt.
  # NOTE(review): the paste lost its indentation, so the nesting below is
  # inferred -- confirm against the original.
  # NOTE(review): this sends a request to every harvested third-party URL;
  # only run it against hosts you are authorized to test.
  85. print 'Removing duplicates...'
  # NOTE(review): 'input' shadows the builtin of the same name.
  86. input = open('url_pars.txt', 'r')
  87. output = open('url.txt', 'w')
  88. linesarray = input.readlines()
  89. input.close()
  # The empty-list assignment is immediately overwritten by the f7 result.
  90. seen = []
  91. seen = f7(linesarray)
  92. print(seen)
  93. for i in range(len(seen)):
  94. output.write(seen[i])
  # The triple-quoted string below is a disabled earlier de-duplication
  # variant; as a bare string expression it has no effect at runtime.
  95. '''linesarray = input.readlines()
  96. input.close()
  97. seen = []
  98. for i in range(len(linesarray)):
  99. if seen.count(linesarray[i]) == 0:
  100. seen.append(linesarray[i])
  101. #if linesarray[i].find('http://bs.yandex.ru'):
  102. output.write(linesarray[i])'''
  103. #else:
  104. #print 'ya'
  105.  
  106. #os.remove('url_pars.txt')
  107. output.close()
  108. print 'Complete'
  109. print 'Checking error...'
  110. #-------------------------url.txt--------------------------------
  # NOTE(review): despite the section title, this re-reads url_pars.txt (the
  # file that still contains duplicates), not the url.txt written above --
  # confirm which file was intended.
  111. file = open('url_pars.txt' , 'r')
  112. url_list = file.readlines()
  113. file.close()
  114. #------------------------Proverka--------------------------------
  # ("Proverka" is transliterated Russian for "check".)
  115. err_page = 0
  116. good_page = 0
  117. for i in range(len(url_list)):
  118. page = url_list[i].strip()
  119. print page
  120. try:
  121. responce = requests.get(page)
  # Any exception raised by the request is counted in err_page; 'e' is unused.
  # NOTE(review): requests.get does not raise for 4xx/5xx status codes by
  # itself, so this counter likely reflects request failures rather than the
  # "404,403 pages" named in the summary below -- verify.
  122. except Exception, e:
  123. err_page = err_page+1
  124. else:
  # NOTE(review): the inner loop reuses 'i', the same name as the URL loop index.
  125. for i in range(len(err_list)):
  126. err = str(err_list[i])
  127. err = err.strip()
  # find(...) > 0 is false both when err is absent (-1) and when the text
  # starts with err (index 0); a blank line in sqlerr.txt also yields 0.
  128. if responce.text.find(err)>0:
  129. print 'FIND "'+err+'" in '+page
  # The good.txt handle is never explicitly closed.
  # NOTE(review): assuming the write and the counter sit inside this 'if',
  # a page matching several error strings is written and counted once per
  # match.
  130. open('good.txt', 'a+').write(page + '\n')
  131. good_page = good_page + 1
  132. #else:
  133. #print ''
  134. #-------------------------------------------------------------------
  135. print 'Good pages: '+str(good_page)
  136. print '404,403 pages: '+str(err_page)
  137. print 'Complete. Press any key...'
  # Blocks until the user presses Enter so the console window stays open.
  138. raw_input()
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement