PySide2,爬虫,笔趣阁小说下载神器,python
基于PySide2和requests库,自行编写了一个下载笔趣阁小说的小软件,主要是练习写程序用。这个小程序里用到的基本知识点很多
包括PySide2,爬虫,多线程等,这个小程输入小说网址和小说名后会自动下载全本小说,保存在目录中。程序的界面用Qtdesigner生成,程序运行效果如下 :
界面中各控件的变量名分别 是:小说网址--novelAddr; 小说名字---novelName; 开始下载按钮:start_Button;显示信息控件out_info
下面附上全部代码:
import requests from lxml import etree import os from PySide2.QtUiTools import QUiLoader from PySide2.QtCore import * from PySide2.QtWidgets import * from PySide2.QtGui import QIcon from threading import Thread class Novel(): def __init__(self): qfile_stats = QFile('novel.ui') qfile_stats.open(QFile.ReadOnly) qfile_stats.close() self.ui = QUiLoader().load(qfile_stats) self.ui.start_Button.clicked.connect(self.get_info) def get_info(self): self.addr_head = 'http://www.xbiquge.la' self.novel_name = self.ui.novelName.text() self.novel_addr = self.ui.novelAddr.text() # 自动创建小说文件夹并进入文件夹 if not os.path.exists(self.novel_name): os.makedirs(self.novel_name) os.chdir(os.getcwd() + '/' + self.novel_name) else: os.chdir(os.getcwd() + '/' + self.novel_name) self.start() def start(self): th = Thread(target=self.get_text) th.start() # 设置要攫取小说的函数功能 def get_text(self): # 设置请求头 headers = { 'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/88.0.4324.96 Safari/537.36 Edg/88.0.705.53'} response = requests.get(self.novel_addr, headers=headers) response.encoding = 'utf-8' # response.encoding = 'gbk' # 有的网站要求使用gbk编码 selector = etree.HTML(response.text) # 获取章节标题 title = selector.xpath('//*[@id="list"]/dl/dd/a/text()') # dd[0]是第1章....dd则是整个列表 # ('//*[@id="list"]/dl/dd[23]/a/text()') /text之前的内容是在网站上复制XPath得来的,加上/text()方法是获得此链接标题 # 获取各章具体链接 hrefs = selector.xpath('//*[@id="list"]/dl/dd/a/@href') # 获得href属性值的列表 web_list = [self.addr_head + i for i in hrefs] for i in range(len(web_list)): response = requests.get(web_list[i], headers=headers) response.encoding = 'utf-8' selector = etree.HTML(response.text) # 获取各章具体内容 contents = selector.xpath('//*[@id="content"]/text()') # 保存章节名称及内容 with open(self.novel_name + '.txt', 'a', encoding='utf-8') as f: self.ui.out_info.append(f'正在下载并保存 {title[i]}......') print(f'正在下载并保存 {title[i]}......') f.write('\n' + title[i] + '\n') for content in contents: content = content.replace("\r', '\r'", '') f.write(content) print('完成副本小说下载!!!') app = QApplication([]) app.setWindowIcon(QIcon('./E1.png')) first = Novel() first.ui.show() app.exec_()