Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
# -*- coding: utf-8 -*-
"""Scrape one author's posts from a forum.gamer.com.tw board into text.csv.

The script drives Chrome through Selenium. It opens the board, submits a
search for the author through the page's search box, then walks the
paginated result URLs from the highest page number down to page 1. On each
page it opens every listed post (last entry first), reads the article body,
and appends one record per post to ``text.csv``.

NOTE(review): the original paste had lost its indentation; the loop nesting
below is reconstructed (the page counter decrements once per page, and
``browser.back()`` runs once per opened post).
"""
from time import sleep

import pandas as pd
from selenium import webdriver
from selenium.webdriver.common.keys import Keys

BOARD_URL = "https://forum.gamer.com.tw/B.php?bsn=60076&subbsn=0"
# Result-page URL; only the page number varies between requests.
RESULT_PAGE_URL = (
    "https://forum.gamer.com.tw/Bo.php?page={page}&bsn=60076&q=j2492104&tnum=1342"
)
SEARCH_TERM = "j2492104"
# Highest result page to visit; pages are processed from here down to 1.
LAST_PAGE = 135
# XPath matching the post links on a result page.
POST_LINK_XPATH = "//a[@data-gtm='Bo頁文章列表']"
# Class of the cells whose text is stored under the "日期" (date) key.
POST_DATE_CLASS = "FM-blist6"
OUTPUT_CSV = "text.csv"
# Fixed pauses (seconds) between browser actions; presumably they give the
# page time to load, since no explicit waits are used.
SHORT_PAUSE = 0.3
LONG_PAUSE = 0.5

options = webdriver.ChromeOptions()
options.add_argument('disable-infobars')
# Add further Chrome command-line switches here.
browser = webdriver.Chrome(chrome_options=options)

try:
    browser.get(BOARD_URL)

    # Open the search UI, pick the second "gcse-sort-title" entry, and submit
    # the search term through the legacy search input.
    browser.find_element_by_class_name("material-icons").click()
    sleep(SHORT_PAUSE)
    browser.find_elements_by_class_name("gcse-sort-title")[1].click()
    sleep(SHORT_PAUSE)
    search_box = browser.find_element_by_id("old_search_input")
    search_box.send_keys(SEARCH_TERM)
    search_box.send_keys(Keys.ENTER)
    sleep(SHORT_PAUSE)

    for page in range(LAST_PAGE, 0, -1):
        print(page)
        browser.get(RESULT_PAGE_URL.format(page=page))
        sleep(SHORT_PAUSE)
        post_count = len(browser.find_elements_by_xpath(POST_LINK_XPATH))
        sleep(SHORT_PAUSE)

        # Visit the posts from the last list entry to the first.
        for idx in reversed(range(post_count)):
            sleep(LONG_PAUSE)
            # Look the elements up again on every pass: references obtained
            # before navigating into a post are no longer usable after
            # coming back to the list.
            dates = browser.find_elements_by_class_name(POST_DATE_CLASS)
            links = browser.find_elements_by_xpath(POST_LINK_XPATH)
            title = links[idx].text
            date_text = dates[idx].text
            links[idx].click()
            sleep(LONG_PAUSE)
            article = browser.find_element_by_class_name("c-article__content")

            # "==" and "=" are separator rows written around the title/date
            # pair in the output file.
            record = {
                "==": "======",
                "主題": title,
                "日期": date_text,
                "=": "======",
                "內容": article.text,
            }
            row = pd.Series(record, index=record.keys())
            # Append mode: every post adds its rows to the same file.
            row.to_csv(OUTPUT_CSV, mode='a', header=False)
            sleep(LONG_PAUSE)
            browser.back()
finally:
    # Always shut down the browser and its driver process, even when a
    # lookup above raises, so no Chrome/chromedriver instance is left behind.
    browser.quit()
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement