zoukankan      html  css  js  c++  java
  • Python刷CSDN阅读数(仅供娱乐)

    #!/usr/bin/env python
    # -*- coding: utf-8 -*-
    """
    @File:csdn_reads.py    
    @E-mail:364942727@qq.com
    @Time:2020/4/16 10:03 下午 
    @Author:Nobita   
    @Version:1.0   
    @Description:None
    """
    
    import re
    import time
    import random
    import requests
    import urllib.request
    from bs4 import BeautifulSoup
    
    # Pool of browser User-Agent strings; one is picked at import time below.
    # Every entry must be latin-1 encodable, otherwise it cannot be sent as an
    # HTTP header value.
    user_agent_list = [
        "Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/68.0.3440.106 Safari/537.36",
        "Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/67.0.3396.99 Safari/537.36",
        # The platform details of this entry had been truncated to a non-ASCII
        # ellipsis; restored to the standard Firefox 61 on Windows 10 form.
        "Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:61.0) Gecko/20100101 Firefox/61.0",
        "Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/64.0.3282.186 Safari/537.36",
        "Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/62.0.3202.62 Safari/537.36",
        "Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/45.0.2454.101 Safari/537.36",
        "Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 6.0)",
        "Mozilla/5.0 (Macintosh; U; PPC Mac OS X 10.5; en-US; rv:1.9.2.15) Gecko/20110303 Firefox/3.6.15",
    ]
    # Request headers shared by the proxy-list fetch and the article requests.
    firefoxHead = {"User-Agent": random.choice(user_agent_list)}
    # Dotted-quad IPv4 pattern (each octet 0-255). The backslashes are required:
    # without them the pattern matches literal "d" characters, not digits/dots.
    IPRegular = r"(([1-9]?\d|1\d{2}|2[0-4]\d|25[0-5])\.){3}([1-9]?\d|1\d{2}|2[0-4]\d|25[0-5])"
    # Site root; PV requests it before each article request.
    host = "https://blog.csdn.net"
    # Article URL template; "{}" is filled with an article id from ``code``.
    url = "https://blog.csdn.net/hz90s/article/details/{}"
    # Article ids; main() uses the first entry.
    code = ["105518260"]
    
    
    def parseIPList(url="http://www.xicidaili.com/"):
        """Return the text of every ``<td>`` cell on ``url`` that matches ``IPRegular``.

        The page is requested with the module-level ``firefoxHead`` headers and
        parsed with BeautifulSoup's ``html.parser``.

        :param url: page to scrape for table cells.
        :return: list of cell strings (possibly empty) in document order.
        :raises urllib.error.URLError: if the page cannot be fetched.
        """
        request = urllib.request.Request(url, headers=firefoxHead)
        # Close the HTTP response as soon as it is parsed; PV calls this function
        # on every loop iteration, so an unclosed response would leak a socket
        # each time.
        with urllib.request.urlopen(request) as response:
            soup = BeautifulSoup(response, "html.parser")
        # ``td.string`` is None for cells with nested markup; str() turns that
        # into "None", which the pattern check then filters out.
        cell_texts = (str(td.string) for td in soup.find_all("td"))
        return [text for text in cell_texts if re.search(IPRegular, text)]
    
    
    def PV(code):
        """Request the article page for ``code`` in an endless loop.

        Each iteration re-scrapes the proxy list via ``parseIPList``, assigns one
        scraped address (with port 8080) as the session's "http" proxy, requests
        ``host`` and then the article URL, prints the text of the third ``<span>``
        of the article page, and sleeps 60-75 seconds.

        :param code: article id substituted into the module-level ``url`` template.
        :return: never returns; stop it with an interrupt or an uncaught exception.
        """
        s = requests.Session()
        # Merge into the session's header mapping. Assigning the bare User-Agent
        # string to ``s.headers`` replaces the mapping with a str, and the chosen
        # User-Agent is then not sent with the requests.
        s.headers.update(firefoxHead)
        count = 0
        while True:
            count += 1
            print("asking for {} times\t".format(count), end="\t")
            IPs = parseIPList()
            if IPs:
                # random.choice works for any list length; a fixed 0-40 index
                # raised IndexError whenever fewer than 41 addresses were scraped.
                # NOTE(review): only an "http" proxy is registered while ``host``
                # and ``url`` are https, so this proxy is presumably not applied
                # to the requests below - confirm intent before adding "https".
                s.proxies = {"http": "{}:8080".format(random.choice(IPs))}
            else:
                # Nothing scraped this round: make the requests without a proxy.
                s.proxies = {}
            s.get(host)
            r = s.get(url.format(code))
            soup = BeautifulSoup(r.text, "html.parser")
            spans = soup.find_all("span")
            # Pages with fewer than three spans print None instead of crashing
            # the loop.
            print(spans[2].string if len(spans) > 2 else None)
            time.sleep(random.randint(60, 75))
    
    
    def main():
        """Start the request loop for the first article id in ``code``."""
        first_article = code[0]
        PV(first_article)


    if __name__ == "__main__":
        # Run only when executed as a script, not when imported.
        main()
  • 相关阅读:
    IfElseActivity
    Tracking_自定义跟踪服务
    CallExternalMethodActivity
    在VSS2005中建立工作流项目(1)
    入门篇(2):了解一下WF是如何运行的
    WorkflowInstance类
    写了一个例子
    一个简单的态机模式工作流演示(2)(代码与实现)
    在产品中为用户提供流程设计器
    WorkflowRuntime
  • 原文地址:https://www.cnblogs.com/chenshengkai/p/12717397.html
Copyright © 2011-2022 走看看