zoukankan      html  css  js  c++  java
  • 自动构建并获取 USER_AGENT 和 PROXY_LIST

     1 import json
     2 '''
     3 打开网页,直接保存网页proxy_list.txt ,然后用工具将其处理为 json 文件!   
     4 '''
     5 with open("proxy_list.json","r",encoding="utf8") as f:
     6     data_lists = json.load(f)
     7 
     8 final_data = []
     9 for data_dict in data_lists :
    10     address_sets = set(data_dict["export_address"])  #变为 set 去重
    11     port = data_dict["port"]
    12     type =data_dict["type"]
    13     # print(address_sets)
    14     for address in address_sets:
    15         temp = {type :address + ":" + str(port)}
    16         # print(temp)
    17         final_data.append(temp)
    18 with open("PROXY_LISTS.json","a+",encoding="utf8") as f:
    19     json.dump(final_data,f)
    20     print(len(final_data))
    View Code
     1 import json
     2 final_data = []
     3 with open("PROXY_LISTS.json","r",encoding="utf8") as f:
     4     temp = []
     5     data_lists = json.load(f)
     6     for data_dict in data_lists:
     7         key_str = list(data_dict.keys())[0]
     8         val_str = list(data_dict.values())[0]
     9         d = key_str + val_str
    10         print(d)
    11         if d in temp:
    12             continue
    13         temp.append(d)
    14         final_data.append(data_dict)
    15 with open("PROXY_LISTS.json","w",encoding="utf8") as f:
    16     json.dump(final_data,f)
    给PROXY_LISTS.json文件去重!
     
     
     1 '''
     2 
     3 l1 = []
     4 l2 =[]
     5 l3 =[]
     6 s = []
     7 with open("a.txt","r",encoding="gbk") as f:
     8     for line in f:
     9         s.append(line.strip("
    "))
    10 
    11     print(s)
    12     for j in range(0,18,3):
    13         print(j)   #0 3 6 9
    14 
    15         a = 100*j
    16         b = a +100
    17         for i in range(a,b):
    18             l1.append(s[i])
    19         for i in range(b,b+100):
    20             l2.append(s[i])
    21         for i in range(b+100,b+200):
    22             l3.append(s[i])
    23 
    24 
    25     print(l1)
    26     print(l2)
    27     print(l3)
    28 
    29 {"http": "3.14.247.230:8080"}
    30 
    31 '''
    32 # b =['49.70.48.72', '183.164.238.126', '223.198.17.183', ' 600 
    33 # c = ['9999', '9999', '9999', '9999', '9999', '9999', '    600 
    34 # d =['HTTP', 'HTTP', 'HTTP', 'HTTP', 'HTTP', 'HTTPS',      600 
    35 
    36 data_dict = []  # 里面元素是 {}
    37 for i in range(600):
    38     temp = {}
    39     temp[d[i]] = b[i] +":"+c[i]
    40     data_dict.append(temp)
    41 print(data_dict)
    View Code
  • 相关阅读:
    Dapper ORM 用法—Net下无敌的ORM(转)
    微軟将从 .NET 4 以后的版本弃用 System.Data.OracleClient 以及Oracle 的各种连接方法
    最火的.NET开源项目
    sql日期格式化
    项目失败总结
    C#,往线程里传参数的方法总结
    线程的几种用法
    小程序api-01-abcdefg
    cnpm
    关于mpvue和wafer2-client-sdk的 微信登录失败,请检查网络状态
  • 原文地址:https://www.cnblogs.com/zach0812/p/12046742.html
Copyright © 2011-2022 走看看