Python 基于 JWT 的网站模拟登录和爬取
# Simulated login against a JWT-protected site, followed by one authenticated
# API request. Flow: POST credentials -> read the token from the JSON reply ->
# send the token in the Authorization header of the next request.
from urllib.parse import urljoin

import requests

BASE_URL = 'https://login3.scrape.cuiqingcai.com/'
LOGIN_URL = urljoin(BASE_URL, '/api/login')
INDEX_URL = urljoin(BASE_URL, '/api/book')
USERNAME = 'admin'
PASSWORD = 'admin'
# requests applies no timeout unless one is given, so an unresponsive server
# would otherwise block this script forever.
REQUEST_TIMEOUT = 10

# Step 1: submit the credentials as a JSON body.
response_login = requests.post(
    LOGIN_URL,
    json={
        'username': USERNAME,
        'password': PASSWORD,
    },
    timeout=REQUEST_TIMEOUT,
)
data = response_login.json()
print('Response JSON', data)

# Step 2: pull the token out of the login reply.
jwt = data.get('token')
print('JWT', jwt)
if not jwt:
    # Without a token the next request would be sent as "jwt None" and fail
    # in a confusing way; stop here with the login status instead.
    raise SystemExit(
        f'Login failed (HTTP {response_login.status_code}): '
        'no token in response'
    )

# Step 3: call the protected endpoint, presenting the token in the
# Authorization header using the "jwt <token>" scheme.
headers = {
    'Authorization': f'jwt {jwt}',
}
response_index = requests.get(
    INDEX_URL,
    params={
        'limit': 18,
        'offset': 0,
    },
    headers=headers,
    timeout=REQUEST_TIMEOUT,
)
print('Response Status', response_index.status_code)
print('Response URL', response_index.url)
print('Response Data', response_index.json())
目前这个例子可能运行不起来,因为网站的登录有问题。
来自拉勾教育《52讲轻松搞定网络爬虫》