# For sites with anti-scraping measures, you can set request headers so that the request looks like it comes from a browser.
import urllib.request
# Fetch the Baidu home page with the standard-library opener and show the
# response headers.
url = "https://www.baidu.com/"

# Use the response as a context manager so the underlying connection is
# closed even if printing the headers raises.
with urllib.request.urlopen(url) as file:
    # Other handy accessors on the response: file.geturl() returns the URL
    # that was actually retrieved, and file.getcode() the HTTP status code.
    # file.info() returns the response headers.
    print('file.info 返回當前環境相關的信息:', file.info())
# Cookie retrieval, method 1: Selenium
# 導入模塊
from selenium import webdriver
# Raw string: the Windows path contains backslashes, and '\c' is an invalid
# escape sequence that newer Python versions warn about. The runtime value of
# the path is unchanged.
# NOTE(review): `executable_path` is deprecated in Selenium 4 — confirm the
# installed Selenium version before upgrading.
driver = webdriver.Chrome(executable_path=r'D:\chromedriver\chromedriver')
try:
    url = "https://www.baidu.com"
    driver.get(url)
    # Get the cookie list; each entry is indexed by 'name' and 'value' below.
    cookie_list = driver.get_cookies()
    # Flatten the list into a simple name -> value mapping and print it.
    cookie_dict = {entry['name']: entry['value'] for entry in cookie_list}
    print(cookie_dict)
finally:
    # Always shut the browser down, even if loading the page failed.
    driver.quit()
# Cookie retrieval, method 2: requests
import requests
def Get_Cookie(url, timeout=None):
    """Request *url* with a mobile Safari user agent and return its cookies.

    Args:
        url: Address to fetch with an HTTP GET.
        timeout: Optional timeout in seconds forwarded to ``requests``. The
            default ``None`` keeps the previous behaviour of waiting
            indefinitely.

    Returns:
        A plain ``dict`` mapping cookie names to cookie values held by the
        session after the request.
    """
    headers = {
        'user-agent': 'Mozilla/5.0 (iPhone; CPU iPhone OS 11_0 like Mac OS X) AppleWebKit/604.1.38 (KHTML, like Gecko) Version/11.0 Mobile/15A372 Safari/604.1',
    }
    # The context manager closes the session (and its pooled connections)
    # once the cookies have been copied out.
    with requests.Session() as session:
        session.get(url, headers=headers, verify=True, timeout=timeout)
        # get_dict() returns name -> value pairs and, unlike dict(jar), does
        # not raise when the same cookie name exists for several domains/paths.
        return session.cookies.get_dict()
# Fetch the cookies for the Baidu home page and print them as a single
# "name=value;" string.
coo = Get_Cookie('https://www.baidu.com/')
# join() builds the string in one pass instead of repeated concatenation.
# Every pair keeps its trailing ';', so the output format is unchanged, and an
# empty cookie dict still yields ''.
cookie = ''.join(f'{name}={value};' for name, value in coo.items())
print(cookie)
# Cookie retrieval, method 3: urllib + http.cookiejar
# python3.6環境
from urllib import request
from http import cookiejar
if __name__ == '__main__':
    # A CookieJar instance holds the cookies received by the opener.
    cookie = cookiejar.CookieJar()
    # HTTPCookieProcessor is the handler that stores response cookies in the
    # jar passed to it.
    handler = request.HTTPCookieProcessor(cookie)
    # Build an opener that routes requests through the cookie handler.
    opener = request.build_opener(handler)
    # Opening the page is what fills the jar. The body is not read, so the
    # response is closed straight away instead of being left open.
    with opener.open('https://blog.csdn.net/t8116189520/article/details/80319339') as response:
        pass
    # Print the name and value of every cookie collected in the jar.
    for item in cookie:
        print(f'Name = {item.name}')
        print(f'Value = {item.value}')