Ashies

ASSIGNMENT1 CODE

Jan 18th, 2019
42
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
Python 1.97 KB | None | 0 0
  # -*- coding: utf-8 -*-
"""
Created on Thu Jan 17 23:12:53 2019

@author: Ashishn

Collect faculty profile links from the IIT College of Science faculty
listing with Selenium, then open the first profile and print the elements
located on it.

The script runs top to bottom: imports and driver creation come first, the
listing page is scanned for profile links, and the browser is always shut
down in a ``finally`` clause, even when a lookup fails.
"""

import pandas as pd  # imported by the original script; not used yet
from selenium import webdriver
from selenium.common.exceptions import WebDriverException
from selenium.webdriver.common.by import By

FACULTY_LIST_URL = 'https://science.iit.edu/people/faculty'

# "%5Bpath%5D" is the URL-encoded text "[path]"; the original script treats
# this href as a trash link and skips it.
TRASH_LINK = "https://science.iit.edu/%5Bpath%5D"

# Raw string: "\P", "\G" and "\c" are not valid escape sequences, so the
# non-raw literal only worked by accident (and warns on newer Pythons).
CHROMEDRIVER_PATH = r'C:\Program Files (x86)\Google\chromedriver.exe'

# NOTE(review): this selector targets the faculty *image* field although the
# result is stored in TITLE -- confirm which field is actually wanted.
IMAGE_FIELD_SELECTOR = (
    ".field.field-name-field-faculty-image.field-type-image"
    ".field-label-hidden.view-mode-full"
)

# NOTE(review): `executable_path` is the Selenium 3 style this script was
# written for; newer Selenium releases expect a Service object instead.
driver = webdriver.Chrome(executable_path=CHROMEDRIVER_PATH)

try:
    driver.get(FACULTY_LIST_URL)

    # TODO: need a more specific class name for optimization; "views-field"
    # matches every field on the page, not only the faculty entries.
    elements = driver.find_elements(By.CLASS_NAME, "views-field")

    linkList = []
    for oneFaculty in elements:
        try:
            divs = oneFaculty.find_elements(By.TAG_NAME, "div")
            if not divs:
                continue
            anchors = divs[0].find_elements(By.TAG_NAME, "a")
            if not anchors:
                continue
            linkIs = anchors[0].get_attribute("href")
        except WebDriverException:
            # Best effort, as in the original: an element that cannot be
            # inspected is skipped instead of aborting the whole scan.
            continue

        # Skip anchors without an href as well as the trash link, so that
        # only values usable by driver.get() end up in the list.
        if linkIs and linkIs != TRASH_LINK:
            linkList.append(linkIs)

    for inDetails in linkList:
        # Reuse the same browser session for the detail page.
        driver.get(inDetails)
        name = driver.find_element(By.CLASS_NAME, "rdf-meta")
        NAME = name.get_attribute('content')
        TITLE = driver.find_element(By.CSS_SELECTOR, IMAGE_FIELD_SELECTOR)
        print(TITLE)
        print(name.text)

        # Only the first profile is processed for now.
        break
finally:
    # quit() ends the whole WebDriver session (browser and driver process),
    # and running it in `finally` avoids leaking them on errors.
    driver.quit()


#####################
# Scratch notes kept from the original paste. They were bare, non-runnable
# lines, so they are preserved here as comments only.
#
# Selector fragment, copied verbatim (NOTE(review): presumably the intended
# faculty-title selector; it looks truncated and is missing a "." -- confirm):
#   .field.field-name-field-faculty-title field-type-text.field-label-hidden.view-mode-ful
#
# Unfinished experiment; `HtmlResponse` is never imported and `source` is
# never assigned in this script:
#   response = HtmlResponse(url = 'https://science.iit.edu/people/faculty', body = source, encoding='utf-8')
Add Comment
Please, Sign In to add comment