Python Selenium与Requests session会话互相同步

一:背景

最近有朋友问,如何将selenium的session会话同步给requests,因此写一下selenium与request session会话互相同步。

二:Selenium同步到requests

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
import requests
from selenium import webdriver

webapi = webdriver.Chrome()
webapi.implicitly_wait(10)  #全局等待10s
webapi.get('https://book.douban.com/')   #通过selenium登录豆瓣读书首页
sel_cookies = webapi.get_cookies()  #获取selenium侧的cookies
print sel_cookies
jar = requests.cookies.RequestsCookieJar()  #先构建RequestsCookieJar对象
for i in sel_cookies:
    #将selenium侧获取的完整cookies的每一个cookie名称和值传入RequestsCookieJar对象
    #domain和path为可选参数,主要是当出现同名不同作用域的cookie时,为了防止后面同名的cookie将前者覆盖而添加的
    jar.set(i['name'], i['value'],domain=i['domain'],path=i['path'])  

session = requests.session()   #requests以session会话形式访问网站
session.cookies.update(jar) #将配置好的RequestsCookieJar对象加入到requests形式的session会话中
print session.cookies
url = 'https://book.douban.com/subject/4913064/'
headers = {'User-Agent':'Mozilla/5.0 (Windows NT 6.1; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/86.0.4240.75 Safari/537.36'}
req = requests.Request(method='GET', url=url, headers=headers)
rpe = session.send(session.prepare_request(req),
                    verify=False,# verify设置为False来规避SSL证书验证
                    timeout=10)  
print session.cookies    #此时的cookies同步为selenium侧的cookies

三:requests同步到Selenium

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
import requests
from selenium import webdriver

session = requests.session()   #requests以session会话形式访问网站
url = 'https://book.douban.com/subject/4913064/'
headers = {'User-Agent':'Mozilla/5.0 (Windows NT 6.1; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/86.0.4240.75 Safari/537.36'}
req = requests.Request(method='GET', url=url, headers=headers)
rpe = session.send(session.prepare_request(req),
                    verify=False,# verify设置为False来规避SSL证书验证
                    timeout=10)  
print session.cookies

webapi = webdriver.Chrome()
webapi.implicitly_wait(10)  #全局等待10min
webapi.get(url)  
print webapi.get_cookies()  #此时的selenium侧的cookies
webapi.delete_all_cookies() #删除selenium侧的所有cookies
for k,v in session.cookies.items(): #获取requests侧的cookies
    webapi.add_cookie({'name':k,'value':v})    #向selenium侧传入以requests侧cookies的name为键value为值的字典
print webapi.get_cookies()  #此时的cookies同步为requests侧的cookies