zoukankan      html  css  js  c++  java
  • C#如何使用HttpWebRequest、HttpWebResponse模拟浏览器抓取网页内容

    /// <summary>
    /// Downloads the content at <paramref name="url"/> with an HTTP GET request that
    /// presents browser-like headers, and decodes the response body using
    /// <paramref name="ed"/>.
    /// </summary>
    /// <param name="url">Address of the page to fetch; also sent as the Referer header.</param>
    /// <param name="ed">Encoding used to decode the response body.</param>
    /// <returns>The full response body as a string.</returns>
    /// <exception cref="System.ArgumentNullException">
    /// <paramref name="url"/> or <paramref name="ed"/> is null.
    /// </exception>
    public string GetHtml(string url, Encoding ed)
            {
                // Validate before touching the network so a bad argument cannot
                // leave an open response behind.
                if (url == null)
                {
                    throw new System.ArgumentNullException("url");
                }
                if (ed == null)
                {
                    throw new System.ArgumentNullException("ed");
                }

                // Build the request with headers resembling a desktop Chrome browser.
                HttpWebRequest request = (HttpWebRequest)WebRequest.Create(url);

                request.KeepAlive = true;
                request.ProtocolVersion = HttpVersion.Version11;
                request.Method = "GET";
                request.Accept = "*/* ";
                request.UserAgent = "Mozilla/5.0 (Windows NT 6.1) AppleWebKit/536.5 (KHTML, like Gecko) Chrome/19.0.1084.56 Safari/536.5";
                // The requested URL itself is sent as the referrer.
                request.Referer = url;

                // The using statements dispose the reader, stream and response even
                // when reading throws, so the underlying connection is never leaked.
                using (HttpWebResponse response = (HttpWebResponse)request.GetResponse())
                using (Stream responseStream = response.GetResponseStream())
                using (StreamReader reader = new StreamReader(responseStream, ed))
                {
                    // Read the whole body; callers inspect the returned HTML per site.
                    return reader.ReadToEnd();
                }
            }
    
            /// <summary>
            /// Convenience overload that fetches <paramref name="url"/> and decodes
            /// the response body as UTF-8.
            /// </summary>
            /// <param name="url">Address of the page to fetch.</param>
            /// <returns>The response body returned by the two-argument overload.</returns>
            public string GetHtml(string url)
            {
                // Delegate to the encoding-aware overload with UTF-8 as the default.
                Encoding defaultEncoding = Encoding.UTF8;
                string html = GetHtml(url, defaultEncoding);
                return html;
            }
  • 相关阅读:
    字典常用操作复习
    列表常用方法复习
    爬虫流程复习
    协程解决素数
    yield 复习
    多线程复习2
    多线程复习1
    异常 巩固3
    logging日志基础示例
    2019最新百度网盘不限速下载教程
  • 原文地址:https://www.cnblogs.com/huangcong/p/4380644.html
Copyright © 2011-2022 走看看