【python】爬虫

# 国外路径 pip install requests
# 国内源镜像路径(清华） pip install -i https://pypi.tuna.tsinghua.edu.cn/simple requests

import requests

# Fetch a web-search results page for a keyword typed by the user and print it.
key = input("请输入你要查询的内容:")
# NOTE(review): the host is spelled "sogo.com"; if the Sogou search engine was
# intended, its host is "sogou.com" -- confirm before relying on this script.
url = "http://www.sogo.com/web"
# Sending the keyword through `params` lets requests percent-encode it, so
# input containing "&", "#", spaces, etc. cannot corrupt the query string.
query = {"query": key}
header = {
    # Adjacent string literals are joined with nothing in between, so the
    # first piece must end with a space to keep the User-Agent well-formed.
    "user-agent": "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_13_6) AppleWebKit/537.36 (KHTML, like Gecko) "
                  "Chrome/99.0.4844.74 Safari/537.36"
}

# A browser-like User-Agent header works around a simple anti-scraping check.
# The `with` block closes the response even if printing raises.
with requests.get(url, params=query, headers=header) as resp:
    print(resp)
    print(resp.text)  # the page source

import requests as requests

# Send a keyword typed by the user to the Baidu Translate suggestion endpoint
# and print the decoded JSON reply.
url = "https://fanyi.baidu.com/sug"
value = input("请输入关键字：")
keyword = {
    "kw": value
}
# For a POST request the form data must be a dict passed via the `data`
# argument. The `with` block closes the response once it has been consumed,
# including when JSON decoding fails.
with requests.post(url, data=keyword) as resp:
    print(resp.json())  # parse the server's reply as JSON

import requests

# Download one page of the Douban movie chart and save the decoded JSON
# payload to a text file.
url = "https://movie.douban.com/j/chart/top_list"

# Query-string parameters; requests appends them to the URL.
param = {
    "type": 24,
    "interval_id": "100:90",
    "action": "",
    "start": 0,
    "limit": 20
}
headers = {
    # Adjacent string literals are joined with nothing in between, so the
    # first piece must end with a space to keep the User-Agent well-formed.
    "User-Agent": "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_13_6) AppleWebKit/537.36 (KHTML, like Gecko) "
                  "Chrome/99.0.4844.74 Safari/537.36"
}

# The `with` block always closes the response when scraping is done, even if
# JSON decoding or the file write raises.
with requests.get(url=url, params=param, headers=headers) as resp:
    # print(resp.request.url)   # uncomment to check the final URL

    # Save the result to a file. An explicit UTF-8 encoding keeps the write
    # from depending on the platform's default locale encoding. The inner
    # `with` closes the file on exit, so no separate f.close() is needed.
    with open("豆瓣喜剧电影.txt", mode="w", encoding="utf-8") as f:
        f.write(str(resp.json()))

posted @ 2022-05-14 17:55 hanyr 阅读(33) 评论(0) 编辑收藏举报

刷新页面返回顶部

登录后才能查看或发表评论，立即登录或者逛逛博客园首页

相关博文：

· 【python】爬虫

· 【爬虫】下载图片

· Python爬虫

· 爬虫-初试

· 03、Python爬虫程序说明

公告

昵称： hanyr
园龄： 9年11个月
粉丝： 0
关注： 2

+加关注

2025年3月

日

一

二

三

四

五

六

【python】爬虫

公告

搜索

常用链接

我的标签

随笔分类

随笔档案

阅读排行榜