写爬虫的时候免不了要操作 Cookies。使用 Selenium 可以很方便地读取浏览器中已有的 Cookies,保存和加载 Cookies 也同样方便。
1. 使用 Selenium 读取浏览器已有的 Cookies
from selenium import webdriver
# Start Chrome on top of an existing user profile directory so the cookies
# already stored in that profile are available to the automated session.
PROFILE_ARGUMENT = "user-data-dir=C:\\Users\\HN\\AppData\\Local\\Google\\Chrome\\User Data"
CHROMEDRIVER_PATH = "C:/chromedriver.exe"
START_URL = 'https://www.weibo.com'

options = webdriver.ChromeOptions()
options.add_argument(PROFILE_ARGUMENT)
# Ask chromedriver to leave the ignore-certificate-errors switch out of the
# Chrome command line it builds.
options.add_experimental_option(
    "excludeSwitches",
    ["ignore-certificate-errors"],
)

driver = webdriver.Chrome(
    executable_path=CHROMEDRIVER_PATH,
    options=options,
)
driver.maximize_window()
driver.get(START_URL)

# Print the cookies the browser reports for the page that was just opened.
profile_cookies = driver.get_cookies()
print(profile_cookies)
2. 使用 Selenium 保存 Cookies,并在之后重新加载
#coding=utf-8
from selenium import webdriver
import pickle
import time
# Open Douban, wait, then pickle the session's cookies to disk so that a
# later run can reuse them.
driver = webdriver.Chrome(executable_path="C:/chromedriver.exe")
try:
    driver.maximize_window()
    driver.get('https://www.douban.com')
    # Fixed 60-second pause before the cookies are read; presumably this is
    # the window for logging in by hand in the opened browser.
    time.sleep(60)
    cookies = driver.get_cookies()
    # The with-body must be indented; the context manager closes the file
    # even if pickling fails.
    with open('D:/test_cookies/db_cookie_1', 'wb') as f:
        pickle.dump(cookies, f)
    print('done')
finally:
    # Always release the browser and the chromedriver process, including
    # when navigation or the file write raises.
    driver.quit()
#coding=utf-8
from selenium import webdriver
import pickle
import time
# Restore previously pickled cookies into a fresh browser session and reopen
# Douban with them.
driver = webdriver.Chrome(executable_path="C:/chromedriver.exe")
# Visit Douban without cookies first: cookies can only be added for the
# domain of the page the browser is currently on.
driver.get('https://www.douban.com')
# Drop whatever cookies this first visit created.
driver.delete_all_cookies()
# NOTE: pickle.load can execute arbitrary code while deserializing; only
# load a cookie file that this machine wrote itself.
with open('D:/test_cookies/db_cookie_1', 'rb') as f:
    cookies = pickle.load(f)
for cookie in cookies:
    driver.add_cookie(cookie)
    print(cookie)
# Visit Douban again, this time carrying the saved cookies.
driver.get('https://www.douban.com')
print('done')
# The browser is intentionally left open so the resulting page can be
# inspected; call driver.quit() once finished.