zoukankan      html  css  js  c++  java
  • HttpWebResponse获取DOM数据注意之ContentEncoding

    public string GetKaiJ(string type = "ssq")
            {
                /*1.通过WebBrowser控件&HttpWebRequest获得网站信息*/
                switch (type)
                {
                    case "ssq":
                        req = (HttpWebRequest)HttpWebRequest.Create(url_ssq);
                        break;
                    case "dlt":
                        req = (HttpWebRequest)HttpWebRequest.Create(url_dlt);
                        break;
                    default:
                        req = (HttpWebRequest)HttpWebRequest.Create(url_ssq);
                        break;
                   }
    
                req.ContentType = "text/html";
                req.Method = "GET";
                req.Timeout = 1000;
                /*2.数据处理*/   
                HttpWebResponse response = (HttpWebResponse)req.GetResponse();
    
                /**在这里对接收到的页面内容进行处理
                 * 说明:HttpWebResponse.ContentEncoding会返回两种情况:ContentEncoding="";ContentEncoding="gzip";
                 * gzip的情况需要解压,就是第一种情况;注意gzip要小写;
                 * 如果不注意这两种情况,网站返回的数据有时候会间隔以这两种情况返回;造成有时候编码正常,有时乱码
                 * 对于这两种情况要进行分别的数据解析
                 */
                if (response.ContentEncoding == "gzip") {
                    //using (Stream resStream = response.GetResponseStream())
                    using (var resStream = new System.IO.Compression.GZipStream(response.GetResponseStream(), System.IO.Compression.CompressionMode.Decompress))
                    {
                        //using (StreamReader reader = new StreamReader(resStream,myEncoding))
                        using (var reader = new StreamReader(resStream, System.Text.Encoding.Default))
                        {
                            responseContent = reader.ReadToEnd().ToString();
    
                            // Read and display lines from the file until the end of
                            // the file is reached.
                            //string line;
                            //while ((line = reader.ReadLine()) != null)
                            //{
                            //    Console.WriteLine(line);
                            //}
                        }
                    }
                } else if (response.ContentEncoding == "") {
                    using (var resStream = response.GetResponseStream())
                    //using (Stream resStream = new System.IO.Compression.GZipStream(response.GetResponseStream(), System.IO.Compression.CompressionMode.Decompress))
                    {
                        //using (StreamReader reader = new StreamReader(resStream,myEncoding))
                        using (StreamReader reader = new StreamReader(resStream, myEncoding_default))
                        {
                            responseContent = reader.ReadToEnd().ToString();
    
                            // Read and display lines from the file until the end of
                            // the file is reached.
                            //string line;
                            //while ((line = reader.ReadLine()) != null)
                            //{
                            //    Console.WriteLine(line);
                            //}
                        }
                    }
                } else { }
                return $"{responseContent}
    responseContentEncoding:{response.ContentEncoding}"; 
            }
  • 相关阅读:
    为什么单个TCP连接很难占满带宽
    上传NUnit的单元测试结果和OpenCover的单元测试覆盖率到SonarQube服务中
    使用Visual Studio Code Coverage和nunit上传单元测试覆盖率和单元测试结果到SonarQube上
    java安装1.8的经验和Error: Registry key 'SoftwareJavaSoftJava Runtime Environment'CurrentVers问题处理
    NSubstitute.Analyzers检测NSubstitute用法冲突
    在TeamCity中执行gtest单元测试
    iOS OpenGL ES入门
    iOS 基础知识
    【内推】字节跳动-头条小说&番茄小说
    iOS开发小记(十四)
  • 原文地址:https://www.cnblogs.com/nick-jd/p/13559720.html
Copyright © 2011-2022 走看看