• requests库的get请求(带headers、带get参数、带代理的请求)


    # coding: utf-8
    # Minimal example: send one request with the requests library and
    # inspect the response object.
    import requests

    # Target URL.
    url = 'http://www.baidu.com'

    # Send the request and keep the response.
    # A HEAD request asks for the status line and headers only (no body);
    # swap in the commented-out GET below to inspect the page source.
    # The timeout keeps the script from blocking forever when the server
    # does not answer (requests applies no timeout by default).
    # response = requests.get(url, timeout=5)
    response = requests.head(url, timeout=5)

    # Inspect the status code.
    # print(response.status_code)

    # Inspect the final URL.
    # print(response.url)

    # Inspect the headers that were sent with the request.
    # print(response.request.headers)

    # Inspect the headers returned by the server.
    # print(response.headers)

    # Inspect the body: raw bytes, then decoded text.
    # print(response.content)
    # print(response.content.decode())
    #
    # Alternatively set the encoding explicitly and read response.text.
    # response.encoding = 'utf-8'
    # print(response.text)
    # print(response.encoding)
    

      带headers的请求

    # coding: utf-8
    # Fetch the same page with and without a custom User-Agent header and
    # print the body length of each response for comparison.
    import time

    import requests

    # Target URL.
    url = 'http://www.baidu.com'

    # Request headers: present the client as a desktop Chrome browser.
    headers = {
        'User-Agent': 'Mozilla/5.0 (Macintosh; Intel Mac OS X 10_12_6) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/62.0.3202.89 Safari/537.36'
    }

    # Request 1: with the custom headers.
    # The timeout stops the script from hanging on an unresponsive server
    # (requests applies no timeout by default).
    response = requests.get(url, headers=headers, timeout=5)
    print(len(response.content))

    # Pause briefly between the two requests.
    time.sleep(2)

    # Request 2: library-default headers.
    # NOTE(review): presumably the server answers the default
    # python-requests User-Agent differently, hence the length comparison.
    response1 = requests.get(url, timeout=5)
    print(len(response1.content))
    

      

    带get传参的请求

    # coding: utf-8
    # Send a GET request with query-string parameters and save the
    # returned page to baidu.html.
    import requests

    # Base URL; the query string is built by requests from `params`.
    url = 'https://www.baidu.com/s'

    # Request headers: present the client as a desktop Chrome browser.
    headers = {
        'User-Agent': 'Mozilla/5.0 (Macintosh; Intel Mac OS X 10_12_6) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/62.0.3202.89 Safari/537.36'
    }

    # Query parameters; requests URL-encodes the non-ASCII value.
    params = {
        "wd": "深圳"
    }

    # Send the request. The timeout keeps the script from blocking forever
    # on an unresponsive server (requests applies no timeout by default).
    response = requests.get(url, headers=headers, params=params, timeout=5)

    # Check the final URL, including the encoded query string.
    # print(response.url)

    # content.decode() yields text decoded as UTF-8, so the file must be
    # written as UTF-8 too. Relying on the platform default encoding
    # (e.g. GBK on Chinese Windows) can raise UnicodeEncodeError or
    # produce a file that does not match the page's declared charset.
    with open('baidu.html', 'w', encoding='utf-8') as f:
        f.write(response.content.decode())
    

    get带有代理的请求:

    # coding: utf-8
    # Send a GET request through an HTTP proxy.
    import requests

    # Target URL.
    url = 'http://www.itcast.cn'

    # Request headers: present the client as a desktop Chrome browser.
    headers = {
        'User-Agent': 'Mozilla/5.0 (Macintosh; Intel Mac OS X 10_12_6) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/62.0.3202.89 Safari/537.36'
    }

    # Proxy mapping: URL scheme -> proxy address.
    # Free proxy (no authentication):
    # proxies = {
    #     "http": "http://106.14.51.145:8118",
    #     "https": "https://106.14.51.145:8118",
    # }
    # Paid proxy (user:password@host:port).
    # NOTE(review): credentials are hard-coded here; real code should load
    # them from configuration or the environment rather than from source.
    # NOTE(review): an "https://" proxy URL makes the client speak TLS to
    # the proxy itself; many HTTP proxies expect "http://" for both keys.
    # Confirm which one this proxy supports.
    proxies = {
        "http": "http://morganna_mode_g:ggc22qxp@117.48.199.230:16816",
        "https": "https://morganna_mode_g:ggc22qxp@117.48.199.230:16816",
    }

    # Send the request through the proxy.
    # The timeout bounds the wait: a dead or unreachable proxy raises
    # a requests exception instead of hanging the script indefinitely.
    response = requests.get(url, headers=headers, proxies=proxies, timeout=3)

    # Q: how can we verify that the proxy is actually usable?
    # Use a timeout and treat the raised exception as failure; the
    # original note suggests 0.5-1 second as a typical value.
    # response = requests.get(url, timeout=3)

      

  • 相关阅读:
    Python进程池
    Python进程间通信
    python编程中的if __name__ == '__main__'与windows中使用多进程
    Python进程-实现
    python进程join()函数理解
    python 进程池Pool
    python多进程打印字符,加锁(Lock加锁)
    python进程、多进程
    正则表达式统计字符串中数字的个数
    python 处理xml
  • 原文地址:https://www.cnblogs.com/andy9468/p/8306749.html
Copyright © 2020-2023  润新知