zoukankan      html  css  js  c++  java
  • 登陆抓取数据


              

                string url1 = @"http://login.vancl.com/Login/";                   //提交注册信息的网址
                string url2 = @"http://my.vancl.com/User/User_Order_List.aspx";    //需要下载的网页

                string indata = "mailto:Logintrue=true&UserName=jsycywm@hotmail.com&PassWord=我的密码&x=45&y=15";

                CookieContainer myCookieContainer = new CookieContainer();                      //新建一个CookieContainer来存放Cookie集合
                HttpWebRequest myHttpWebRequest = (HttpWebRequest)WebRequest.Create(url1);      //新建一个HttpWebRequest
                myHttpWebRequest.ContentType = "application/x-www-form-urlencoded";
                myHttpWebRequest.ContentLength = indata.Length;
                //myHttpWebRequest.ac
                myHttpWebRequest.Method = "POST";
                myHttpWebRequest.CookieContainer = myCookieContainer;                           //设置HttpWebRequest的CookieContainer为刚才建立的那个myCookieContainer
                Stream myRequestStream = myHttpWebRequest.GetRequestStream();
                StreamWriter myStreamWriter = new StreamWriter(myRequestStream, Encoding.GetEncoding("GB2312"));
                myStreamWriter.Write(indata);           //把数据写入HttpWebRequest的Request流

                myStreamWriter.Close();
                myRequestStream.Close();                //关闭打开对象


                HttpWebResponse myHttpWebResponse = (HttpWebResponse)myHttpWebRequest.GetResponse();        //新建一个HttpWebResponse
                myHttpWebResponse.Cookies = myCookieContainer.GetCookies(myHttpWebRequest.RequestUri);      //获取一个包含url的Cookie集合的CookieCollection
                Stream myResponseStream = myHttpWebResponse.GetResponseStream();
                StreamReader myStreamReader = new StreamReader(myResponseStream, Encoding.UTF8 );
                string outdata = myStreamReader.ReadToEnd();//把数据从HttpWebResponse的Response流中读出
                myStreamReader.Close();
                myResponseStream.Close();
                //Console.WriteLine(outdata);//显示"登录"
                //拿到了Cookie,再进行请求就能直接读取到登录后的内容了
                myHttpWebRequest = (HttpWebRequest)WebRequest.Create(url2);
                myHttpWebRequest.CookieContainer = myCookieContainer;//*
                //刚才那个CookieContainer已经存有了Cookie,把它附加到HttpWebRequest中则能直接通过验证
                myHttpWebResponse = (HttpWebResponse)myHttpWebRequest.GetResponse();
                myHttpWebResponse.Cookies = myCookieContainer.GetCookies(myHttpWebRequest.RequestUri);
                myResponseStream = myHttpWebResponse.GetResponseStream();
                myStreamReader = new StreamReader(myResponseStream, Encoding.UTF8);
                outdata = myStreamReader.ReadToEnd();
                myStreamReader.Close();
                myResponseStream.Close();
                //Response.Redirect(url2);
                //Console.WriteLine(outdata);
                //再次显示"登录"
                //如果把*行注释调,就显示"没有登录"
                string abc = outdata.Substring(413, outdata.Length - 413 - 11); //.Replace("title", "tag")
                //  abc = Regex.Replace(abc,"<!--User_Interface End-->.*?<!--Bottom-->" , "");//"title=\".*?\"|title='.*?'|<img.*?\">"
                Match mc = Regex.Match(abc, "<table>.*?/table>");//<div id=\"main\">.*?</div>  Regex.Matches(abc, "<table>.*?/table>")[0].Value
                abc = Regex.Replace(mc.Value, "<thead>.*?thead>", "");
             // MatchCollection results
     
                XmlDocument xmlDoc = new XmlDocument();
                xmlDoc.LoadXml(abc );
                XmlNode xn = xmlDoc.SelectSingleNode("table");
                XmlElement xe = (XmlElement)xn;
                //xn.ChildNodes[0].ChildNodes[1].InnerText 
                //xn.ChildNodes.Count
                string result = xe.InnerText;

  • 相关阅读:
    Sendkeys 和 Sendmessage 使用技巧一例
    和菜鸟一起学算法之二分法求极值问题
    和菜鸟一起学算法之三分法求极值问题
    和菜鸟一起学证券投资之国内生产总值GDP
    和菜鸟一起学OK6410之Led字符驱动
    和菜鸟一起学OK6410之最简单驱动模块hello world
    和菜鸟一起学OK6410之交叉编译hello world
    和菜鸟一起学android4.0.3源码之touchscreen配置+调试记录
    和菜鸟一起学android4.0.3源码之红外遥控器适配
    和菜鸟一起学OK6410之最简单字符驱动
  • 原文地址:https://www.cnblogs.com/winner/p/1444701.html
Copyright © 2011-2022 走看看