selenium模擬登陸,然後再用Requests爬取
阿新 • • 發佈:2021-08-24
selenium模擬登陸,然後再用Requests爬取
from urllib.parse import urljoin from selenium import webdriver import requests import time BASE_URL = 'https://login2.scrape.center/' LOGIN_URL = urljoin(BASE_URL, '/login/') INDEX_URL = urljoin(BASE_URL, '/page/1') USERNAME = 'admin' PASSWORD = 'admin' browser = webdriver.Chrome() browser.get(BASE_URL) browser.find_element_by_css_selector('input[name="username"]').send_keys(USERNAME) browser.find_element_by_css_selector('input[name="password"]').send_keys(PASSWORD) browser.find_element_by_css_selector('input[type="submit"]').click() time.sleep(10) # get cookies from selenium cookies = browser.get_cookies() print('Cookies', cookies) browser.close()# set cookies to requests session = requests.Session() for cookie in cookies: session.cookies.set(cookie['name'], cookie['value']) response_index = session.get(INDEX_URL) print('Response Status', response_index.status_code) print('Response URL', response_index.url)
來自拉勾教育52講輕鬆搞定網路爬蟲