1、安裝selenium
pip install selenium
2、打開瀏覽器登錄獲取cookie
# Log in through a real Chrome window and save the session cookies to
# cookie.txt so that a later run can reuse the logged-in session.
import json
import time

from selenium import webdriver
from selenium.webdriver.common.by import By

driver = webdriver.Chrome()  # Start a Chrome instance driven by chromedriver.
try:
    driver.get('https://baidu.com')  # Load the login page (HTTP GET).
    time.sleep(5)  # Crude fixed wait for the page to finish rendering.

    # The find_element_by_* helpers were removed in Selenium 4.3;
    # find_element(By.<strategy>, value) works on old and new versions alike.
    username_input = driver.find_element(By.XPATH, "//input[@type='text']")
    username_input.send_keys('***********')
    time.sleep(2)

    password_input = driver.find_element(By.XPATH, "//input[@type='password']")
    password_input.send_keys('*****')
    time.sleep(2)

    login_button = driver.find_element(By.ID, "submit-login")
    login_button.click()
    time.sleep(2)  # Give the site time to process the login and set cookies.

    # Fetch the site's cookies first, then write them out as JSON. The
    # `with` block guarantees the file is closed even if json.dump raises.
    cookies = driver.get_cookies()
    with open('cookie.txt', 'w', encoding='utf-8') as cookie_file:
        json.dump(cookies, cookie_file)

    time.sleep(10)  # Keep the window visible briefly before shutting down.
finally:
    # Always close the browser; otherwise the chromedriver process stays
    # resident in memory after the script exits.
    driver.quit()
3、讀取使用cookie:
# Restore a logged-in session by loading the cookies previously saved in
# cookie.txt into a fresh Chrome instance.
import json
import time

from selenium import webdriver

driver = webdriver.Chrome()  # Start a Chrome instance driven by chromedriver.
try:
    # Selenium can only add cookies for the domain of the page currently
    # loaded, so open the site once before injecting them.
    driver.get('https://mp.qutoutiao.net')

    # `with` guarantees the file is closed even if the JSON is malformed.
    with open('cookie.txt', 'r', encoding='utf-8') as cookie_file:
        saved_cookies = json.load(cookie_file)

    for cookie in saved_cookies:
        driver.add_cookie(cookie)

    # Reload the page so the request is sent with the restored cookies.
    driver.get('https://mp.qutoutiao.net')
    time.sleep(1)
except BaseException:
    # On any failure (including Ctrl-C) shut the browser down so the
    # chromedriver process does not linger, then let the error propagate.
    driver.quit()
    raise

# The browser is intentionally left open on success so the logged-in
# session can be used. Call driver.quit() when finished; otherwise the
# chromedriver process stays resident in memory.
4、登錄完成，開始幹活
# -*- coding: utf-8 -*-
# Log in, save the session cookies, navigate to the content list and then
# repeatedly click the delete icon plus the confirmation button.
import json
import time

from selenium import webdriver
from selenium.common.exceptions import WebDriverException
from selenium.webdriver.common.by import By

# JavaScript snippets for scrolling the page.
js_top = "var q=document.documentElement.scrollTop=0"  # Scroll to the top.
js_bottom = "var q=document.documentElement.scrollTop=10000"  # Scroll to the bottom.
js_bottom2 = "window.scrollTo(0,document.body.scrollHeight)"  # Alternative scroll-to-bottom.

driver = webdriver.Chrome()  # Start a Chrome instance driven by chromedriver.
try:
    driver.maximize_window()
    driver.get('https://mp.***.net')  # Load the login page (HTTP GET).
    time.sleep(5)  # Crude fixed wait for the page to finish rendering.

    # The find_element_by_* helpers were removed in Selenium 4.3;
    # find_element(By.<strategy>, value) works on old and new versions alike.
    driver.find_element(By.XPATH, "//input[@type='text']").send_keys('****')
    time.sleep(2)
    driver.find_element(By.XPATH, "//input[@type='password']").send_keys('*****')
    time.sleep(2)
    driver.find_element(By.ID, "submit-login").click()
    time.sleep(2)

    # Fetch the site's cookies first, then write them out as JSON. The
    # `with` block guarantees the file is closed even if json.dump raises.
    cookies = driver.get_cookies()
    with open('cookie.txt', 'w', encoding='utf-8') as cookie_file:
        json.dump(cookies, cookie_file)

    # Dismiss the element with class "shadow-close"
    # (presumably a pop-up overlay shown after login -- confirm on the site).
    driver.find_element(By.CLASS_NAME, "shadow-close").click()
    time.sleep(2)

    driver.execute_script(js_top)

    # Walk through the navigation down to the list to be cleaned up.
    driver.find_element(By.CLASS_NAME, "sub-child-txt").click()
    time.sleep(2)
    driver.find_element(
        By.XPATH, '//div[@class="content-header"]/div/p[3]'
    ).click()
    time.sleep(2)

    # Original author's note: positions 1 and 3 are image-and-text
    # articles, positions 2 and 4 are videos.
    driver.find_element(
        By.XPATH, '//div[@class="content-article"]/div/p[4]'
    ).click()
    time.sleep(2)

    # Up to 99 attempts: click a delete icon, then the primary button
    # (presumably the confirmation dialog's OK button -- confirm on the site).
    for _ in range(1, 100):
        try:
            driver.find_element(By.CLASS_NAME, "icon-delete").click()
            time.sleep(2)
            driver.find_element(By.CLASS_NAME, "el-button--primary").click()
            time.sleep(2)
        except WebDriverException:
            # Best effort: a missing or unclickable element just skips this
            # attempt. Only Selenium errors are swallowed, so Ctrl-C still
            # interrupts the loop (a bare `except:` would have eaten it).
            continue

    time.sleep(10)  # Keep the window visible briefly before shutting down.
finally:
    # Always close the browser; otherwise the chromedriver process stays
    # resident in memory after the script exits.
    driver.quit()