简单 Python 爬虫(爬取小说网)


#https://blog.csdn.net/Isana_Yashiro/article/details/84582946
import requests
from bs4 import BeautifulSoup
# Download one page from biqukan and print the text of its ".showtxt" element.
target = 'https://www.biqukan.com/1_1094/5403177.html'
# A timeout keeps the script from hanging forever on an unresponsive server.
req = requests.get(url=target, timeout=10)
# Fail loudly on an HTTP error status instead of parsing an error page.
req.raise_for_status()
# Decode the body as GBK rather than whatever encoding requests guessed.
req.encoding = 'GBK'
html = req.text
soup = BeautifulSoup(html, 'html.parser')
texts = soup.select('.showtxt')
if not texts:
    # Without this guard an unexpected page layout surfaces as a bare IndexError.
    raise SystemExit('no .showtxt element found at ' + target)
# Turn single spaces and runs of eight non-breaking spaces into line breaks.
print(texts[0].text.replace(' ', '\n').replace('\xa0'*8, '\n'))


# Youdao Translate
import requests        #导入requests包
import json
def get_translate_date(word=None):
    """Translate *word* through the Youdao web endpoint and print the result.

    Posts a form to the Youdao translate URL, prints the decoded JSON
    response, then prints the ``tgt`` field of the first entry in
    ``translateResult``.

    Args:
        word: Text to translate; sent as the ``i`` form field.

    Raises:
        requests.RequestException: If the request times out, fails, or the
            server answers with an HTTP error status.
        KeyError: If the response JSON has no ``translateResult`` key.
    """
    url = 'http://fanyi.youdao.com/translate?smartresult=dict&smartresult=rule'
    # Form fields for the request.
    # NOTE(review): salt/sign/ts/bv are fixed literals; presumably captured
    # from a browser session - confirm the endpoint still accepts them.
    form_data = {
        'i': word,
        'from': 'AUTO',
        'to': 'AUTO',
        'smartresult': 'dict',
        'client': 'fanyideskweb',
        'salt': '15885798599693',
        'sign': 'f0571e9e3db6fecdcc228d7c7294e362',
        'ts': '1588579859969',
        'bv': '9d1e6a4f9d4241fb7947f623cc9e4efa',
        'doctype': 'json',
        'version': '2.1',
        'keyfrom': 'fanyi.web',
        'action': 'FY_BY_REALTIME',
        'typoResult': 'false',
    }
    # A timeout keeps the call from blocking forever on a stalled connection.
    response = requests.post(url, data=form_data, timeout=10)
    # Surface HTTP errors here rather than as a confusing JSON decode failure.
    response.raise_for_status()
    # Convert the JSON-formatted response text into a dict.
    content = json.loads(response.text)
    print(content)
    # Print the translated text.
    print(content['translateResult'][0][0]['tgt'])
if __name__ == '__main__':
    # Demo run: translate a sample Chinese sentence when executed as a script.
    get_translate_date('我爱中国')
posted @ 2020-05-04 19:29  杨广伟9527  阅读(620)  评论(0)  编辑  收藏  举报