Python3 requests库基本使用

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
'''
    对urllib3库进行了封装,更简单的get,post请求方式
    json数据处理
    添加请求头headers
    POST,GET 请求发送
    文件上传
    跳过证书验证, 忽略警告
    网页需要登录用户名密码
    响应状态码
    请求响应异常处理
    response属性
    会话保持 (cookie保持)
'''
 
# 底层依赖urllib3
import requests
 
#########各种请求方式
# requests.post('http://httpbin.org/post')
# requests.put('http://httpbin.org/put')
# requests.delete('http://httpbin.org/delete')
# requests.head('http://httpbin.org/get')
# requests.options('http://httpbin.org/get')
######## 发送一个get请求,带参数
# data = {
#     'name': 'kaige',
#     'age': 22
# }
# response = requests.get('http://httpbin.org/get', params=data)
# print(response.text)  # 响应内容
# 如果返回json对象用 .json()接收
# response.json() # 等价于  json.loads(response.text)
# 获取二进制数据
# response.content
# 保存二进制数据
# with open('xxx.ico二进制是什么格式打开什么格式','wb') as f:
#     f.write(response.content)
#     f.close()
# -------------------------------------
# 添加headers ########
# response = requests.get('https://www.zhihu.com/explore')  # 拒绝访问
# print(response.text)
# headers = {
#     'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/65.0.3325.181 Safari/537.36'
# }
# response = requests.get('https://www.zhihu.com/explore',headers=headers)
# print(response.text)
 
# -------------------------post请求
# 基本请求带参, 加入headers 和get方式一样
# data = {
#     'name': 'kaige', 'age': 22
# }
# response = requests.post('http://httpbin.org/post', data=data)
# print(response.text)
 
# ---------------------------response 的属性
# response = requests.get('http://www.jianshu.com')
# print(type(response.status_code), response.status_code)  # 状态码
# print(type(response.headers), response.headers)  # 头
# print(type(response.cookies), response.cookies)  # cookie
# print(type(response.url), response.url)  # url
# print(type(response.history), response.history)
 
# ----------------------------状态码判断
import requests
# response = requests.get('http://www.jianshu.com/hello.html')
# exit() if not response.status_code == requests.codes.not_found else print('404 Not Found')
# exit() if not response.status_code == 404 else print('404 Not Found')
# print(response.status_code)  # 也可以直接判断状态码, 官网查询
 
 
 
# ------------------------- 文件上传
# import requests
# files = {'file': open('favicon.ico', 'rb')}
# response = requests.post('http://httpbin.org/post', files=files)
# print(response.text)
 
# ------------------------ 获取cookie
# import requests
# response = requests.get('https://www.baidu.com')
# print(response.cookies)
# for key,value in response.cookies.items():
#     print(key, value)
# -------------------------  会话维持
# import requests
# s = requests.Session()  # 发送一个post, s.post(), 相当于在同一个浏览器中操作
# s.get('http://httpbin.org/cookies/set/number/123456789')
# response = s.get('http://httpbin.org/cookies')
# print(response.text)
 
# -----------------------------证书验证
# import requests
# 证书不安全,访问失败, 设置verify=False,跳过证书验证, 但是还是有警告,可以先 from requests.packages import urllib3, 再调用 urllib3.disable_warnings() 消除警告
# from requests.packages import urllib3
#
# urllib3.disable_warnings()
# response = requests.get('https://www.12306.cn', verify=False)
# print(response.status_code)
 
# 指定证书验证
# requests.get('https://www.12306.cn', cert=('xxx.crt', 'xxx.key'))
 
 
# ----------------------------- 代理设置
# import requests
# proxies = {
#     'http': 'http://xxx.xx.xx.x:xxxx',
#     'https': 'https://111.1.1.1:2222',
# }
# response = requests.get('https://www.taobao.com', proxies=proxies)
# print(response.status_code)
######### 代理有用户名密码
# import requests
# proxies = {
#     'http': 'http://user:password@111.11.1.1:2222',
# }
# response = requests.get('https://www.taobao.com', proxies=proxies)
# print(response)
##########  socks代理
# pip install 'requests[socks]'
# proxies = {
#     'http': 'socks5://111.1.1.1:2222',
# } 同上
# ------------------------------ 超时设置timeout
# import requests
# from requests.exceptions import ReadTimeout,Timeout
# try:
#     response = requests.get('https://www.baidu.com', timeout= 0.01)
#     print(response.status_code)
# except Timeout:
#     print('Timeout')
 
# ---------------------- 认证设置(访问网站需要登录)
# import requests
# r = requests.get('http://120.27.34.24:9001', auth=('user', '123'), timeout=1)
# print(r.status_code)
 
# ---------------------------  异常处理
import requests
from requests.exceptions import HTTPError, RequestException, ReadTimeout, Timeout
# Exception-handling demo: send a GET with a deliberately tiny timeout and
# report which category of requests failure occurred. Handlers are ordered
# from most specific to the RequestException base class so the base class
# does not shadow the specific ones.
try:
    response = requests.get('http://httpbin.org/get', timeout=0.01)
    # requests does not raise for 4xx/5xx responses on its own; without this
    # call the HTTPError handler below could never be reached.
    response.raise_for_status()
except Timeout:
    print('TImeout')
except HTTPError:
    print('http err')
except RequestException:
    print('父类异常')
else:
    # Success path: the request completed and returned a non-error status.
    print(response.status_code)

  

posted @   qukaige  阅读(312)  评论(0编辑  收藏  举报
编辑推荐:
· .NET Core 中如何实现缓存的预热?
· 从 HTTP 原因短语缺失研究 HTTP/2 和 HTTP/3 的设计差异
· AI与.NET技术实操系列:向量存储与相似性搜索在 .NET 中的实现
· 基于Microsoft.Extensions.AI核心库实现RAG应用
· Linux系列:如何用heaptrack跟踪.NET程序的非托管内存泄露
阅读排行:
· TypeScript + Deepseek 打造卜卦网站:技术与玄学的结合
· 阿里巴巴 QwQ-32B真的超越了 DeepSeek R-1吗?
· 【译】Visual Studio 中新的强大生产力特性
· 【设计模式】告别冗长if-else语句:使用策略模式优化代码结构
· 10年+ .NET Coder 心语 ── 封装的思维:从隐藏、稳定开始理解其本质意义
点击右上角即可分享
微信分享提示