返回顶部

自动构建并获取 USER_AGENT 和 PROXY_LIST

 # Build PROXY_LISTS.json from a scraped proxy list.
import json

# Workflow: open the proxy web page, save it as proxy_list.txt, then use a
# tool to convert that file into proxy_list.json before running this script.


def expand_proxy_entries(records):
    """Expand raw proxy records into one single-key dict per address.

    Args:
        records: Iterable of dicts, each providing the keys
            ``"export_address"``, ``"port"`` and ``"type"``.

    Returns:
        A list of dicts of the form ``{type: "address:port"}``. Addresses
        repeated inside one record are emitted once, in first-seen order.

    Raises:
        KeyError: If a record lacks one of the three required keys.
    """
    entries = []
    for record in records:
        addresses = record["export_address"]
        if isinstance(addresses, str):
            # A bare string would otherwise be de-duplicated character by
            # character; treat it as a single address instead.
            addresses = [addresses]
        port = str(record["port"])
        scheme = record["type"]
        # dict.fromkeys drops duplicates while keeping input order, so the
        # output is reproducible from run to run (a set's order is not).
        for address in dict.fromkeys(addresses):
            entries.append({scheme: address + ":" + port})
    return entries


def build_proxy_lists(source_path="proxy_list.json",
                      target_path="PROXY_LISTS.json"):
    """Add the entries derived from *source_path* to the list in *target_path*.

    The target file always ends up holding ONE JSON array. Writing in append
    mode would put a second array after the first on every rerun, which
    ``json.load`` rejects.

    Args:
        source_path: JSON file containing the list of raw proxy records.
        target_path: JSON file holding the accumulated proxy entries; it is
            created when missing.

    Returns:
        The list of entries generated from *source_path* during this call.
    """
    with open(source_path, "r", encoding="utf8") as f:
        new_entries = expand_proxy_entries(json.load(f))

    try:
        with open(target_path, "r", encoding="utf8") as f:
            previous_text = f.read()
    except FileNotFoundError:
        previous_text = ""
    # A missing or empty target simply means nothing was collected yet.
    existing = json.loads(previous_text) if previous_text.strip() else []

    with open(target_path, "w", encoding="utf8") as f:
        json.dump(existing + new_entries, f)
        print(len(new_entries))
    return new_entries


if __name__ == "__main__":
    build_proxy_lists()
View Code
 # De-duplicate the proxy entries stored in PROXY_LISTS.json, in place.
import json


def dedupe_entries(entries):
    """Return *entries* without repeats, keeping each first occurrence.

    Two entries count as the same when the concatenation of their first key
    and first value is equal. That concatenation is printed for every
    non-empty entry, duplicates included, as progress output.

    Args:
        entries: Iterable of dicts whose first key and first value are both
            strings, e.g. ``{"http": "1.2.3.4:8080"}``.

    Returns:
        A new list holding the first occurrence of each distinct entry, in
        the original order. Empty dicts are skipped.
    """
    seen = set()  # set membership is O(1); a list made the scan quadratic
    unique = []
    for entry in entries:
        if not entry:
            # An empty record has no key/value pair to fingerprint.
            continue
        scheme, address = next(iter(entry.items()))
        fingerprint = scheme + address
        print(fingerprint)
        if fingerprint in seen:
            continue
        seen.add(fingerprint)
        unique.append(entry)
    return unique


def dedupe_proxy_file(path="PROXY_LISTS.json"):
    """Rewrite the JSON list stored at *path* with duplicate entries removed.

    Args:
        path: JSON file containing a list of single-key proxy dicts.

    Returns:
        The de-duplicated list that was written back to *path*.
    """
    with open(path, "r", encoding="utf8") as f:
        entries = json.load(f)
    unique = dedupe_entries(entries)
    with open(path, "w", encoding="utf8") as f:
        json.dump(unique, f)
    return unique


if __name__ == "__main__":
    dedupe_proxy_file()
给 PROXY_LISTS.json 文件去重(重复的代理条目只保留第一次出现的那一条)。
 
 
 1 '''
 2 
 3 l1 = []
 4 l2 =[]
 5 l3 =[]
 6 s = []
 7 with open("a.txt","r",encoding="gbk") as f:
 8     for line in f:
 9         s.append(line.strip("\n"))
10 
11     print(s)
12     for j in range(0,18,3):
13         print(j)   #0 3 6 9
14 
15         a = 100*j
16         b = a +100
17         for i in range(a,b):
18             l1.append(s[i])
19         for i in range(b,b+100):
20             l2.append(s[i])
21         for i in range(b+100,b+200):
22             l3.append(s[i])
23 
24 
25     print(l1)
26     print(l2)
27     print(l3)
28 
29 {"http": "3.14.247.230:8080"}
30 
31 '''
32 # b =['49.70.48.72', '183.164.238.126', '223.198.17.183', ' 600 
33 # c = ['9999', '9999', '9999', '9999', '9999', '9999', '    600 
34 # d =['HTTP', 'HTTP', 'HTTP', 'HTTP', 'HTTP', 'HTTPS',      600 
35 
# Build one {scheme: "address:port"} dict per proxy from three parallel lists:
# b holds the addresses, c the ports (as strings) and d the scheme names.
# NOTE(review): b, c and d appear only as truncated comments in this snippet;
# they must be defined before this code runs.
if not (len(b) == len(c) == len(d)):
    # zip() would silently stop at the shortest list; fail loudly instead.
    raise ValueError("b, c and d must have the same length")

# Pair the lists element-wise instead of indexing a hard-coded 600 items, so
# the code works for any number of proxies.
data_dict = [  # a list of single-key dicts, despite the name
    {scheme: address + ":" + port}
    for address, port, scheme in zip(b, c, d)
]
print(data_dict)
View Code

 

posted @ 2019-12-16 02:05  Zcb0812  阅读(310)  评论(0)  编辑  收藏  举报