zoukankan      html  css  js  c++  java
  • 获取免费IP--代码--转

    #! /usr/bin/env python3
    from urllib import request
    import random
    import time
    import lxml
    import re



    # Pool of browser User-Agent strings handed to Proxy_read, which picks one
    # at random for each request. Every entry appears once so that
    # random.choice() weights them equally.
    user_agent_list = [
        # Adjacent string literals are concatenated: the next two lines form
        # a single entry.
        'Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) '
        'Chrome/45.0.2454.85 Safari/537.36 115Browser/6.0.3',
        'Mozilla/5.0 (Macintosh; U; Intel Mac OS X 10_6_8; en-us) AppleWebKit/534.50 (KHTML, like Gecko) Version/5.1 Safari/534.50',
        'Mozilla/5.0 (Windows; U; Windows NT 6.1; en-us) AppleWebKit/534.50 (KHTML, like Gecko) Version/5.1 Safari/534.50',
        'Mozilla/4.0 (compatible; MSIE 8.0; Windows NT 6.0; Trident/4.0)',
        'Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 6.0)',
        'Mozilla/5.0 (Windows NT 6.1; rv:2.0.1) Gecko/20100101 Firefox/4.0.1',
        'Opera/9.80 (Windows NT 6.1; U; en) Presto/2.8.131 Version/11.11',
        'Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_0) AppleWebKit/535.11 (KHTML, like Gecko) Chrome/17.0.963.56 Safari/535.11',
        'Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 5.1; Trident/4.0; SE 2.X MetaSr 1.0; SE 2.X MetaSr 1.0; .NET CLR 2.0.50727; SE 2.X MetaSr 1.0)',
        # The closing parenthesis was missing from this entry.
        'Mozilla/5.0 (compatible; MSIE 9.0; Windows NT 6.1; Trident/5.0)',
    ]

    # Running total of successful page fetches; incremented by Proxy_read.
    count = 0

    def Get_proxy_ip(url='http://www.xicidaili.com/nn/', timeout=10):
        """Download a proxy-list page and return its proxies as 'ip:port' strings.

        Args:
            url: Page to scrape. Defaults to the xicidaili listing page.
            timeout: Seconds to wait for the server before giving up.

        Returns:
            A list of 'ip:port' strings in page order; empty when the page
            contains no recognisable entries.

        Raises:
            urllib.error.URLError: The page could not be fetched.
            UnicodeDecodeError: The response body is not valid UTF-8.
        """
        # Function-scope import keeps this block self-contained.
        from urllib.parse import urlsplit

        parts = urlsplit(url)
        headers = {
            # No explicit 'Host' header: urllib derives it from the URL, so it
            # stays correct when a non-default url is passed.
            'User-Agent': 'Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 6.0)',
            'Accept': r'application/json, text/javascript, */*; q=0.01',
            # Site root of the requested page; for the default url this is
            # 'http://www.xicidaili.com/'.
            'Referer': '%s://%s/' % (parts.scheme, parts.netloc),
        }
        req = request.Request(url, headers=headers)
        # The context manager closes the connection even if read/decode fails.
        with request.urlopen(req, timeout=timeout) as response:
            html = response.read().decode('utf-8')

        # Dotted-quad addresses anywhere in the page. The escapes matter:
        # without them 'd' and '.' would match literally / as a wildcard.
        ip_list = re.findall(r'\d+\.\d+\.\d+\.\d+', html)
        # Table cells holding nothing but digits are taken to be port numbers.
        port_list = re.findall(r'<td>(\d+)</td>', html)
        # zip() stops at the shorter list, so a page with unequal numbers of
        # addresses and ports cannot trigger an IndexError.
        return ['%s:%s' % (ip, port) for ip, port in zip(ip_list, port_list)]

    def Proxy_read(proxy_list, user_agent_list, i, timeout=10):
        """Fetch the target blog page once through the i-th proxy.

        Prints progress messages, sleeps a random 1-3 seconds before the
        request, and increments the module-level ``count`` when the page is
        fetched and decoded successfully. Failures are reported and swallowed
        so a caller looping over many proxies keeps going.

        Args:
            proxy_list: Sequence of 'ip:port' proxy addresses.
            user_agent_list: Sequence of User-Agent strings to choose from.
            i: Index into proxy_list of the proxy to use.
            timeout: Seconds to wait on the proxy before counting the attempt
                as failed.

        Raises:
            IndexError: i is outside proxy_list.
        """
        global count

        target_url = r'http://blog.csdn.net/u010620031/article/details/51068703'

        proxy_ip = proxy_list[i]
        print('当前代理ip:%s'%proxy_ip)
        user_agent = random.choice(user_agent_list)
        print('当前代理user_agent:%s'%user_agent)
        sleep_time = random.randint(1,3)
        print('等待时间:%s s' %sleep_time)
        time.sleep(sleep_time)
        print('开始获取')
        headers = {
            # No explicit 'Host' header: the previous value named a different
            # host than the URL being requested; urllib fills in the right one.
            'Origin':'http://blog.csdn.net',
            'User-Agent': user_agent,
            'Accept': r'application/json, text/javascript, */*; q=0.01',
            'Referer': target_url,
        }

        # Use a private opener rather than request.install_opener(), which
        # would route every later urlopen() call in the process through this
        # proxy as well.
        proxy_support = request.ProxyHandler({'http':proxy_ip})
        opener = request.build_opener(proxy_support)

        req = request.Request(target_url, headers=headers)
        try:
            # The timeout stops an unresponsive proxy from blocking forever.
            with opener.open(req, timeout=timeout) as response:
                # The body is read and decoded only to confirm that a real
                # page came back; the text itself is not needed.
                response.read().decode('utf-8')
        except Exception as e:
            # Deliberate best-effort boundary: any failure just means this
            # proxy is unusable, but show the cause instead of hiding it.
            print('******打开失败!******')
            print('%s: %s' % (type(e).__name__, e))
        else:
            count +=1
            print('OK!总计成功%s次!'%count)

    if __name__ == '__main__':
        # Script entry point: scrape the proxy list, then try up to 100 of
        # the proxies, one request each.
        proxy_list = Get_proxy_ip()
        # Cap the loop at the number of proxies actually found; indexing past
        # the end of a shorter list would raise IndexError.
        for i in range(min(100, len(proxy_list))):
            Proxy_read(proxy_list, user_agent_list, i)

    代理网站

    https://link.jianshu.com?t=http://www.cz88.net/proxy/
    https://link.jianshu.com?t=http://www.66ip.cn/index.html 
    https://link.jianshu.com?t=http://www.xicidaili.com/
    https://link.jianshu.com?t=http://www.coobobo.com/
    https://link.jianshu.com?t=http://www.kuaidaili.com/
    https://link.jianshu.com?t=http://www.proxy360.cn/default.aspx
    https://link.jianshu.com?t=http://ip.zdaye.com/
    https://link.jianshu.com?t=https://www.us-proxy.org/
    https://link.jianshu.com?t=http://www.nianshao.me/
    https://link.jianshu.com?t=http://www.goubanjia.com/
    https://link.jianshu.com?t=http://www.iphai.com/
    https://link.jianshu.com?t=http://www.meiridaili.com/
    https://link.jianshu.com?t=http://www.swei360.com/free/
    https://link.jianshu.com?t=http://www.89ip.cn/
    https://link.jianshu.com?t=http://www.ip3366.net/
    https://link.jianshu.com?t=http://www.mimiip.com/
    https://link.jianshu.com?t=http://daili.wy96.com/page1.asp
    https://link.jianshu.com?t=http://ip.qiaodm.com/free/index.html
    https://link.jianshu.com?t=http://www.ip181.com/
    https://link.jianshu.com?t=http://www.httpsdaili.com/free.asp
    https://link.jianshu.com?t=http://proxy.mimvp.com/free.php
    https://link.jianshu.com?t=http://www.httpdaili.com/mfdl/
    https://link.jianshu.com?t=http://www.mayidaili.com/free
    https://link.jianshu.com?t=http://www.fengyunip.com/free/china-high.html
    https://link.jianshu.com?t=http://www.kxdaili.com/dailiip.html
    https://link.jianshu.com?t=http://www.xdaili.cn/freeproxy
    https://link.jianshu.com?t=http://www.superfastip.com/welcome/getips
    https://link.jianshu.com?t=http://www.chinabaike.com/t/10475/2016/0530/5239251.html

    纯真
    66免费代理网
    西刺免费代理IP
    酷伯伯HTTP代理
    快代理
    proxy360.cn
    站大爷
    Free Proxy List
    年少
    全网代理IP
    IP海
    每日代理
    360代理IP
    流年免费HTTP代理IP 24小时自助提取系统
    云代理
    秘密代理IP
    迷惘网络IP代理
    敲代码 免费代理IP网
    代理IP检测平台,100免费代理IP
    瑶瑶代理IP
    米扑代理
    httpdaili
    蚂蚁代理
    风云代理IP
    开心代理
    讯代理
    急速IP

  • 相关阅读:
    Ant学习-002-ant 执行 TestNG 测试用例时 [testng] java.lang.NoClassDefFoundError: com/beust/jcommander/ParameterException 解决方案
    Ant学习-001-ant 基础知识及windows环境配置
    Selenium2学习-032-WebUI自动化实战实例-030-JavaScript 在 Selenium 自动化中的应用实例之五(高亮标示元素)
    Selenium2学习-031-WebUI自动化实战实例-029-JavaScript 在 Selenium 自动化中的应用实例之四(获取元素位置和大小)
    Selenium2学习-030-WebUI自动化实战实例-028-获取元素位置及大小
    Selenium2学习-029-WebUI自动化实战实例-027-判断元素是否存在
    Selenium2学习-028-WebUI自动化实战实例-026-获取页面元素值或者元素属性值
    Selenium2学习-027-WebUI自动化实战实例-025-JavaScript 在 Selenium 自动化中的应用实例之三(页面滚屏,模拟鼠标拖动滚动条)
    Selenium2学习-026-WebUI自动化实战实例-024-获取页面元素
    Selenium2学习-025-WebUI自动化实战实例-023-页面快照截图应用之一 -- 常规截图(全页面)
  • 原文地址:https://www.cnblogs.com/jamnoble/p/10920047.html
Copyright © 2011-2022 走看看