準備軟件
- python 環境
- 在 cmd 窗口中使用 pip 安裝 selenium:
pip install selenium
- 安裝谷歌瀏覽器驅動(chromedriver),並將代碼中的 executable_path 改為驅動的實際存放路徑
代碼
- 只需將代碼中的 url 修改為要訪問的今日頭條搜索頁地址即可運行
from selenium import webdriver
import time
# Search-result page whose article links are collected; edit this to target
# a different search.
url = 'https://www.toutiao.com/search/?keyword=%E6%A2%81%E8%80%81%E5%B8%88%E8%AE%B2%E7%B3%96'
# Local path to the chromedriver binary.
executable_path = "D://chromedriver_win32/chromedriver.exe"


def scroll_to(browser, offset):
    """Set the document's vertical scroll position to *offset* via JavaScript."""
    browser.execute_script(
        "var q=document.documentElement.scrollTop=%d" % offset
    )


try:
    driver = webdriver.Chrome(executable_path=executable_path)
except TypeError:
    # Newer Selenium releases no longer accept the ``executable_path``
    # keyword; the driver location is passed through a Service object instead.
    from selenium.webdriver.chrome.service import Service

    driver = webdriver.Chrome(service=Service(executable_path))

try:
    driver.get(url=url)
    time.sleep(5)

    # Scroll the result page several times with pauses in between
    # (presumably so that lazily loaded results get a chance to appear).
    scroll_to(driver, 100000000)
    for _ in range(4):
        time.sleep(2)
        scroll_to(driver, 10000)

    # ``find_elements("xpath", ...)`` is available in both Selenium 3 and 4,
    # unlike the removed ``find_elements_by_xpath`` shortcut.
    weblist = driver.find_elements("xpath", """//*[@class = 'link title']""")

    li = []
    for web in weblist:
        # A separate name keeps the search ``url`` above from being clobbered.
        href = web.get_attribute("href")
        print(href)
        if href:
            # Elements without an href cannot be navigated to; skip them.
            li.append(href)

    i = 0  # running count of page visits
    # Cycle through the collected links until interrupted (e.g. Ctrl-C).
    # ``while li`` avoids a busy loop that does nothing when no link matched.
    while li:
        for u in li:
            driver.get(u)
            time.sleep(1)
            scroll_to(driver, 10000)
            print(i)
            i += 1
            time.sleep(1)
finally:
    # Always shut the browser down, even on Ctrl-C or a WebDriver error;
    # previously this call sat after an endless loop and was never reached.
    driver.quit()