import requests
from lxml import etree
import pandas as pd
import time
# Crawl the free-proxy listing pages on www.66ip.cn and export every proxy
# row (ip, port, location, type, verification time) to an Excel workbook.
#
# NOTE: the crawl runs only when this file is executed as a script; importing
# the module just defines the helpers below.

BASE_URL = "http://www.66ip.cn/"
HEADERS = {"User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/108.0.0.0 Safari/537.36"}
LAST_PAGE = 2990          # pages 1..2990 are crawled (page 1 is index.html)
REQUEST_TIMEOUT = 10      # seconds, per HTTP request
MAX_ATTEMPTS = 3          # tries per page before the page is skipped
PAGE_DELAY = 1            # seconds to wait between requests / retries
COLUMNS = ("ip", "端口号", "代理位置", "代理类型", "验证时间")
OUTPUT_PATH = r"C:\Users\44281\Desktop\海量IP.xlsx"


def page_url(num):
    """Return the listing URL for page *num*; page 1 lives at ``index.html``."""
    name = "index" if num == 1 else str(num)
    return BASE_URL + name + ".html"


def is_ipv4(text):
    """Return True if *text* is a dotted-quad IPv4 address (four octets 0-255)."""
    parts = text.split(".")
    return len(parts) == 4 and all(
        part.isascii() and part.isdigit() and int(part) <= 255
        for part in parts
    )


def select_proxy_rows(rows):
    """Filter raw table rows down to proxy records.

    *rows* is an iterable of lists of cell strings, one list per ``<tr>``.
    A row is kept when it has at least ``len(COLUMNS)`` cells and its first
    cell is an IPv4 address; this drops header rows and unrelated layout
    tables without relying on fixed positional offsets. Each kept row is
    returned as a tuple of stripped strings, so the columns of a record can
    never drift out of alignment with each other.
    """
    width = len(COLUMNS)
    kept = []
    for cells in rows:
        cleaned = [cell.strip() for cell in cells[:width]]
        if len(cleaned) == width and is_ipv4(cleaned[0]):
            kept.append(tuple(cleaned))
    return kept


def parse_rows(html):
    """Extract proxy records from one listing page's HTML text."""
    if not html.strip():
        return []
    tree = etree.HTML(html)
    if tree is None:  # nothing parseable came back
        return []
    raw_rows = [
        [td.xpath("string(.)") for td in tr.xpath("./td")]
        for tr in tree.xpath("//table/tr")
    ]
    return select_proxy_rows(raw_rows)


def fetch_page(url):
    """Download *url* and return its text decoded as GBK, or None on failure.

    Only network/HTTP errors are caught, and the number of attempts is
    bounded, so a dead page can no longer stall the crawl forever and
    Ctrl-C still interrupts the script.
    """
    for attempt in range(1, MAX_ATTEMPTS + 1):
        try:
            res = requests.get(url, headers=HEADERS, timeout=REQUEST_TIMEOUT)
            res.raise_for_status()
        except requests.RequestException as exc:
            print(f"attempt {attempt}/{MAX_ATTEMPTS} failed for {url}: {exc}")
            time.sleep(PAGE_DELAY)  # back off instead of hammering the site
            continue
        res.encoding = "gbk"  # decode the body as GBK rather than the guessed charset
        return res.text
    return None


def main():
    """Crawl every listing page and write the collected proxies to Excel."""
    records = []
    for num in range(1, LAST_PAGE + 1):
        url = page_url(num)
        html = fetch_page(url)
        if html is None:
            print("skipped " + url)
        else:
            records.extend(parse_rows(html))
            print(url)
        time.sleep(PAGE_DELAY)  # be polite between pages

    df = pd.DataFrame(records, columns=list(COLUMNS))
    df.to_excel(OUTPUT_PATH, index=False)


if __name__ == "__main__":
    main()
【推荐】国内首个AI IDE,深度理解中文开发场景,立即下载体验Trae
【推荐】编程新体验,更懂你的AI,立即体验豆包MarsCode编程助手
【推荐】抖音旗下AI助手豆包,你的智能百科全书,全免费不限次数
【推荐】轻量又高性能的 SSH 工具 IShell:AI 加持,快人一步
· 震惊!C++程序真的从main开始吗?99%的程序员都答错了
· 【硬核科普】Trae如何「偷看」你的代码?零基础破解AI编程运行原理
· 单元测试从入门到精通
· 上周热点回顾(3.3-3.9)
· Vue3状态管理终极指南:Pinia保姆级教程