Advertisement
Guest User

Untitled

a guest
Feb 20th, 2020
93
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 2.05 KB | None | 0 0
  1. from selenium import webdriver
  2. import selenium.webdriver
  3. from selenium.webdriver.common.by import By
  4. from selenium.webdriver.common.keys import Keys
  5. import time
  6. import pickle
  7. import os.path
  8. import schedule
  9. import sched, time
  10. import traceback
  11. import apscheduler.triggers.cron
  12. from apscheduler.schedulers.blocking import BlockingScheduler
  13. from selenium.webdriver.firefox.options import Options
  14.  
  15. def webscraper():
  16. print("by: nuno silva :p")
  17. options = Options()
  18. browser = webdriver.Firefox()
  19.  
  20. browser.get('https://www.expireddomains.net/login/')
  21. elem = browser.find_element_by_id('inputLogin')
  22. elem.send_keys('asjdioasd');
  23. time.sleep(2)
  24. elem = browser.find_element(By.XPATH, '//input[@type="password"]')
  25. elem.send_keys('DrSNVDwaLX');
  26. time.sleep(2)
  27.  
  28. browser.find_element(By.XPATH, '//button[text()="Login"]').click()
  29. time.sleep(2)
  30.  
  31. count = 0;
  32. with open('domains_com.txt', 'a') as file:
  33. for j in range(1,500):
  34. browser.get('https://member.expireddomains.net/domains/expiredcom/?start='+str(count))
  35. time.sleep(5)
  36. count = count + 25;
  37. for x in range(1,26):
  38. domainname = browser.find_element(By.XPATH, "//div[@id='content']/div/div[2]/table/tbody/tr["+str(x)+"]/td/a").text
  39. backlinks = browser.find_element(By.XPATH, "//div[@id='content']/div/div[2]/table/tbody/tr["+str(x)+"]/td[4]").text
  40. try:
  41. if int(backlinks)>10 or "K" in backlinks:
  42. file.write (domainname +" - "+ backlinks + "\n")
  43.  
  44. except:
  45. file.write (domainname +" - "+ backlinks + "\n")
  46. file.flush()
  47. os.fsync(file)
  48.  
  49.  
  50.  
  51.  
  52.  
  53.  
  54. webscraper();
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement