HttpWebRequest 模拟登录响应点击事件(分享自己用的HttpHelper类)

  平时也经常采集网站数据,也做模拟登录,但一般都是html控件POST到页面登录;还没有遇到用户服务器控件button按钮点击事件登录的,今天像往常一样POST传递参数,但怎么都能登录不了;最后发现还有两个参数需要传,__EVENTVALIDATION__VIEWSTATE

  在传的过程中需要对参数值进行URL编码

  System.Web.HttpUtility.UrlEncode(value)

  模拟登录代码:在本地写的一个测试的网站来模拟登录,原理都一样:

        Request request = new Request();
            request.Method = Method.POST;
            request.Add("UserName", "1");
            request.Add("PassWord", "1");
            request.Add("btnLogin", "Button");
            HtmlHelper html = new HtmlHelper();
            Response response = html.GetHTML("http://localhost:64554/Lgoin.aspx");
            Match math = Regex.Match(response.Html, "<input type=\"hidden\" name=\"__VIEWSTATE\" id=\"__VIEWSTATE\" value=\"(?<val>.*?)\" />", RegexOptions.Singleline | RegexOptions.IgnoreCase);
            string value = math.Groups["val"].Value;
            request.Add("__VIEWSTATE", System.Web.HttpUtility.UrlEncode(value));
            math = Regex.Match(response.Html, "<input type=\"hidden\" name=\"__EVENTVALIDATION\" id=\"__EVENTVALIDATION\" value=\"(?<val>.*?)\" />", RegexOptions.Singleline | RegexOptions.IgnoreCase);
            request.Add("__EVENTVALIDATION", System.Web.HttpUtility.UrlEncode(math.Groups["val"].Value));
            response = html.GetHTML("http://localhost:64554/Lgoin.aspx", true, request);

 

  这里发布哈,我平时用的HttpHelper类

 #region 发送方式
    public enum Method
    {
        GET, POST
    }
    #endregion

    #region 返回内容
    /// <summary>
    /// 返回内容
    /// </summary>
    public class Response
    {
        #region 远程服务器时间
        DateTime _RemoteDateTime = Convert.ToDateTime("1900-01-01 00:00:00.000");
        /// <summary>
        /// 远程服务器时间
        /// </summary>
        public DateTime RemoteDateTime
        {
            get { return _RemoteDateTime; }
            set { _RemoteDateTime = value; }
        }
        #endregion

        #region 返回内容
        string html = string.Empty;
        /// <summary>
        /// 返回内容
        /// </summary>
        public string Html
        {
            get { return html; }
            set { html = value; }
        }
        #endregion

        #region 返回的Cookies
        CookieContainer _Cookies = new CookieContainer();
        /// <summary>
        /// 返回的Cookies
        /// </summary>
        public CookieContainer Cookies
        {
            get { return _Cookies; }
            set { _Cookies = value; }
        }
        #endregion

        #region HTTP状态代码
        /// <summary>
        /// HTTP状态代码
        /// </summary>
        public HttpStatusCode StatusCode { get; set; }
        #endregion

        #region 返回的图片内容
        Image _Image = null;
        /// <summary>
        /// 返回的图片内容
        /// </summary>
        public Image Image
        {
            get { return _Image; }
            set { _Image = value; }
        }
        #endregion

        #region 当前URL
        string _Url = string.Empty;
        /// <summary>
        /// 当前URL
        /// </summary>
        public string Url
        {
            get { return _Url; }
            set { _Url = value; }
        }
        #endregion
    }
    #endregion

    #region 发送数据
    /// <summary>
    /// 发送数据
    /// </summary>
    [Serializable]
    public class Request
    {
        List<KeyValuePair<string, string>> sList = new List<KeyValuePair<string, string>>();
        Method _sendMethod = Method.GET;
        public Method Method
        {
            get { return _sendMethod; }
            set { _sendMethod = value; }
        }

        private CookieContainer _Cookies = new CookieContainer();
        public CookieContainer Cookies
        {
            get { return this._Cookies; }
            set { this._Cookies = value; }
        }
        public void Clear()
        {
            this.sList.Clear();
        }
        public void Add(string key, string value)
        {
            this.sList.Add(new KeyValuePair<string, string>(key, value));
        }
        public void Update(string key, string value)
        {
            int index = -1;
            for (int i = 0; i < this.List.Count; i++)
            {
                if (this.List[i].Key.Equals(key))
                {
                    index = i;
                    break;
                }
            }

            if (index > 0)  this.List.RemoveAt(index);

            this.List.Add(new KeyValuePair<string, string>(key, value));
        }
        public override string ToString()
        {
            string sRet = string.Empty;

            foreach (KeyValuePair<string,string> val in this.sList)
            {
                if (sRet.Length == 0)
                    sRet = string.Format("{0}={1}", val.Key, val.Value);
                else
                    sRet = string.Format("{0}&{1}={2}", sRet, val.Key, val.Value);
            }

            return sRet;
        }

        public byte[] ToBytes()
        {
            return Encoding.ASCII.GetBytes(this.ToString());
        }

        public List<KeyValuePair<string,string>> List
        {
            set
            {
                this.sList = value;
            }
            get
            {
                return this.sList;
            }
        }

        public string Find(string key)
        {
            string sRet = string.Empty;

            KeyValuePair<string, string> val = this.List.Find(delegate(KeyValuePair<string, string> k) { return k.Key.Equals(key); });

            sRet = val.Value;

            return sRet;
        }

    }
    #endregion

    public class HtmlHelper
    {
        public static HtmlHelper Init()
        {
            return new HtmlHelper();
        }



        #region Cookies
        CookieContainer _Cookies = new CookieContainer();
        /// <summary>
        /// Cookies
        /// </summary>
        public CookieContainer Cookies
        {
            get { return _Cookies; }
            set { _Cookies = value; }
        }
        #endregion

        #region 连接远程服务器超时触发事件
        public delegate void Connection_TimeOut_Handle(string sUrl, Request request, Exception ex);
        /// <summary>
        /// 连接远程服务器超时触发事件
        /// </summary>
        public event Connection_TimeOut_Handle Connection_TimeOut;
        #endregion

        #region 获取数据完毕触发事件
        public delegate void Connection_Complete_Handle(Response response);
        /// <summary>
        ///  获取数据完毕触发事件
        /// </summary>
        public event Connection_Complete_Handle Connection_Complete;
        #endregion

        #region 设置发送头信息
        /// <summary>
        /// 设置发送头信息
        /// </summary>
        /// <param name="request"></param>
        private void SetRequestHeader(ref HttpWebRequest request, string referer)
        {
            request.Timeout = 5000;
            request.Accept = "*/*";
            request.UserAgent = "Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.2; SV1; .NET CLR 2.0.50727;)";
            request.Headers["Accept-Encoding"] = "gzip, deflate";
            request.Headers["Accept-Language"] = "zh-cn";
            request.Headers["Accept-Charset"] = "utf-8;q=0.7,*;q=0.7";
            request.ContentType = "application/x-www-form-urlencoded";
            request.Referer = referer;
            request.KeepAlive = true;
        }
        #endregion

        #region 解压经过Gzip压缩的流
        /// <summary>
        /// 解压经过Gzip压缩的流
        /// </summary>
        /// <param name="contentEncoding">流编码</param>
        /// <param name="resonseStream">网页返回的流内容</param>
        /// <returns></returns>
        private string GzipStreame(string ecoding, Stream resonseStream)
        {
            return GzipStreame(ecoding, resonseStream, Encoding.UTF8);
        }
        private string GzipStreame(string ecoding, Stream resonseStream, Encoding coding)
        {
            string html = string.Empty;
            if (ecoding.ToLower().IndexOf("gzip") != -1)
            {
                html = new StreamReader(new GZipStream(resonseStream, CompressionMode.Decompress), coding).ReadToEnd();
            }
            else if (ecoding.ToLower().IndexOf("deflate") >= 0)
            {
                html = new StreamReader(new DeflateStream(resonseStream, CompressionMode.Decompress), coding).ReadToEnd();
            }
            else
            {
                html = new StreamReader(resonseStream, coding).ReadToEnd();
            }
            return html;
        }

        #endregion

        #region 获取远程HTML
        /// <summary>
        /// 获取远程HTML
        /// </summary>
        /// <param name="url">地址</param>
        /// <returns></returns>
        public Response GetHTML(string url)
        {
            return GetHTML(url, false, new Request(), new Uri(url).Host, Encoding.UTF8, null);
        }
        public Response GetHTML(string url, WebProxy proxy)
        {
            return GetHTML(url, false, new Request(), new Uri(url).Host, Encoding.UTF8, proxy);
        }
        public Response GetHTML(string url, Encoding coding)
        {
            return GetHTML(url, false, new Request(), new Uri(url).Host, coding, null);
        }
        public Response GetHTML(string url, Encoding coding, WebProxy proxy)
        {
            return GetHTML(url, false, new Request(), new Uri(url).Host, coding, proxy);
        }
        /// <summary>
        /// 获取远程HTML
        /// </summary>
        /// <param name="url">地址</param>
        /// <param name="send">是否自动重定向URL</param>
        /// <returns></returns>
        public Response GetHTML(string url, bool bAllowAutoRedirect)
        {
            return GetHTML(url, bAllowAutoRedirect, new Request() { }, new Uri(url).Host, Encoding.UTF8, null);
        }
        public Response GetHTML(string url, bool bAllowAutoRedirect, WebProxy porxy)
        {
            return GetHTML(url, bAllowAutoRedirect, new Request() { }, new Uri(url).Host, Encoding.UTF8, porxy);
        }
        /// <summary>
        /// 获取远程HTML
        /// </summary>
        /// <param name="sUrl">地址</param>
        /// <param name="send">发送内容</param>
        /// <returns></returns>
        public Response GetHTML(string url, Request request)
        {
            return GetHTML(url, request, Encoding.UTF8);
        }
        public Response GetHTML(string url, Request request, WebProxy porxy)
        {
            return GetHTML(url, false, request, new Uri(url).Host, Encoding.UTF8, porxy);
        }
        public Response GetHTML(string url, bool bAllowAutoRedirect, Request request)
        {
            return GetHTML(url, bAllowAutoRedirect, request, new Uri(url).Host, Encoding.UTF8, null);
        }
        public Response GetHTML(string url, bool bAllowAutoRedirect, Request request, WebProxy proxy)
        {
            return GetHTML(url, bAllowAutoRedirect, request, new Uri(url).Host, Encoding.UTF8, proxy);
        }
        public Response GetHTML(string url, Request request, Encoding coding)
        {
            return GetHTML(url, false, request, new Uri(url).Host, coding, null);
        }
        public Response GetHTML(string url, Request request, Encoding coding, WebProxy proxy)
        {
            return GetHTML(url, false, request, new Uri(url).Host, coding, proxy);
        }
        /// <summary>
        /// 获取远程HTML
        /// </summary>
        /// <param name="sUrl">地址</param>
        /// <param name="bAllowAutoRedirect">是否自动跳转</param>
        /// <param name="send">发送内容</param>
        /// <returns></returns>
        public Response GetHTML(string sUrl, bool bAllowAutoRedirect, Request request, string referer)
        {
            return GetHTML(sUrl, bAllowAutoRedirect, request, referer, Encoding.UTF8, null);
        }
        public Response GetHTML(string sUrl, bool bAllowAutoRedirect, Request request, string referer, WebProxy proxy)
        {
            return GetHTML(sUrl, bAllowAutoRedirect, request, referer, Encoding.UTF8, proxy);
        }
        /// <summary>
        /// 获取HTML页面内容
        /// </summary>
        /// <param name="url">地址</param>
        /// <param name="bAllowAutoRedirect">是否自动跳转</param>
        /// <param name="request">查询信息</param>
        /// <param name="referer">引用页</param>
        /// <param name="coding">编码格式</param>
        /// <returns></returns>
        public Response GetHTML(string url, bool bAllowAutoRedirect, Request request, string referer, Encoding coding, WebProxy proxy)
        {
            Response result = new Response();

            if (request.Method == Method.GET)
            {
                string sData = request.ToString();
                if (sData.Length > 0) url = string.Format("{0}?{1}", url, sData);
            }

            HttpWebRequest httpRequest = (HttpWebRequest)WebRequest.Create(url);
            if (proxy != null) httpRequest.Proxy = proxy;

            #region SSL方式
            if (url.Contains("https://"))
            {
                //这一句一定要写在创建连接的前面。使用回调的方法进行证书验证。
                ServicePointManager.ServerCertificateValidationCallback = new System.Net.Security.RemoteCertificateValidationCallback(CheckValidationResult);
                //创建证书文件
                X509Certificate objx509 = new X509Certificate();

                //添加到请求里
                httpRequest.ClientCertificates.Add(objx509);
            }
            #endregion

            // 设置发送头信息
            if (referer.Length == 0)
                SetRequestHeader(ref httpRequest, new Uri(url).Host);
            else
                SetRequestHeader(ref httpRequest, referer);
            // 自动重定向
            httpRequest.AllowAutoRedirect = bAllowAutoRedirect;
            httpRequest.Timeout = 60 * 1000;
            // 关联Cookies
            //if (httpRequest.CookieContainer == null)
            //    httpRequest.CookieContainer = new CookieContainer();
            httpRequest.CookieContainer = this.Cookies;

            try
            {

                if (request.Method == Method.POST)
                {
                    // 设置发送方式
                    httpRequest.Method = request.Method.ToString();
                    // 获取发送数据流
                    //HttpWebResponse response = httpRequest.GetResponse() as HttpWebResponse;

                    Stream strem = httpRequest.GetRequestStream();

                    // 写入发送数据
                    byte[] bs = request.ToBytes();
                    strem.Write(bs, 0, bs.Length);
                    strem.Close();
                }

                HttpWebResponse httpResponse = httpRequest.GetResponse() as HttpWebResponse;

                Stream responseStream = httpResponse.GetResponseStream();

                StreamReader sr = new StreamReader(responseStream, coding);

                //result.Html = sr.ReadToEnd();
                result.Html = System.Web.HttpUtility.HtmlDecode(GzipStreame(httpResponse.ContentEncoding, responseStream, coding));
                result.RemoteDateTime = Convert.ToDateTime(httpResponse.GetResponseHeader("Date"));

                result.Url = httpResponse.ResponseUri.OriginalString;

                this.Cookies.Add(httpResponse.Cookies);

                result.Cookies = this.Cookies;

                result.StatusCode = httpResponse.StatusCode;

                responseStream.Dispose();

                if (this.Connection_Complete != null)
                    this.Connection_Complete.Invoke(result);
            }
            catch (Exception ex)
            {
                if (this.Connection_TimeOut != null)
                    this.Connection_TimeOut.Invoke(url, request, ex);
            }
            return result;
        }

        private bool CheckValidationResult(object sender, X509Certificate certificate, X509Chain chain, SslPolicyErrors sslPolicyErrors)
        {
            return true;
        }

        #endregion

        #region 获取远程图片
        public Response GetImage(string sUrl)
        {
            return GetImage(sUrl, false, new Request());
        }
        public Response GetImage(string sUrl, WebProxy proxy)
        {
            return GetImage(sUrl, false, new Request(), proxy);
        }
        public Response GetImage(string sUrl, string referer)
        {
            return GetImage(sUrl, false, referer, null);
        }
        public Response GetImage(string sUrl, string referer, WebProxy proxy)
        {
            return GetImage(sUrl, false, referer, proxy);
        }
        public Response GetImage(string sUrl, bool bAllowAutoRedirect, string referer)
        {
            return GetImage(sUrl, bAllowAutoRedirect, new Request(), referer, null);
        }
        public Response GetImage(string sUrl, bool bAllowAutoRedirect, string referer, WebProxy proxy)
        {
            return GetImage(sUrl, bAllowAutoRedirect, new Request(), referer, null);
        }
        //public Image GetImage(string sUrl, bool bAllowAutoRedirect, Request request)
        //{
        //    return GetImage(sUrl, bAllowAutoRedirect, request, new CookieContainer(), "");
        ////}
        //public Image GetImage(string sUrl, bool bAllowAutoRedirect, Request request, string referer)
        //{
        //    return GetImage(sUrl, bAllowAutoRedirect, request,referer);
        //}
        /// <summary>
        /// 获取远程图片
        /// </summary>
        /// <param name="sUrl">图片地址</param>
        /// <param name="bAllowAutoRedirect">是否自动跳转</param>
        /// <param name="send">发送内容</param>
        /// <returns></returns>
        public Response GetImage(string sUrl, bool bAllowAutoRedirect, Request request)
        {
            return GetImage(sUrl, bAllowAutoRedirect, request, "", null);
        }
        public Response GetImage(string sUrl, bool bAllowAutoRedirect, Request request, string referer)
        {
            return GetImage(sUrl, bAllowAutoRedirect, request, referer, null);
        }
        public Response GetImage(string sUrl, bool bAllowAutoRedirect, Request request, WebProxy proxy)
        {
            return GetImage(sUrl, bAllowAutoRedirect, request, "", proxy);
        }
        /// <summary>
        /// 获取远程图片
        /// </summary>
        /// <param name="sUrl">图片地址</param>
        /// <param name="bAllowAutoRedirect">是否自动跳转</param>
        /// <param name="send">发送内容</param>
        /// <returns></returns>
        public Response GetImage(string url, bool bAllowAutoRedirect, Request request, string referer, WebProxy proxy)
        {
            Response response = new Response();

            if (request.Method == Method.GET)
            {
                string sData = request.ToString();
                if (sData.Length > 0) url = string.Format("{0}?{1}", url, sData);
            }

            HttpWebRequest httpRequest = (HttpWebRequest)WebRequest.Create(url);
            if (proxy != null) httpRequest.Proxy = proxy;

            #region SSL方式
            if (url.Contains("https://"))
            {
                //这一句一定要写在创建连接的前面。使用回调的方法进行证书验证。
                ServicePointManager.ServerCertificateValidationCallback = new System.Net.Security.RemoteCertificateValidationCallback(CheckValidationResult);
                //创建证书文件
                X509Certificate objx509 = new X509Certificate();

                //添加到请求里
                httpRequest.ClientCertificates.Add(objx509);
            }
            #endregion

            // 设置发送头信息
            if (referer.Length == 0)
                SetRequestHeader(ref httpRequest, new Uri(url).Host);
            else
                SetRequestHeader(ref httpRequest, referer);

            // 自动重定向
            httpRequest.AllowAutoRedirect = bAllowAutoRedirect;
            // 关联Cookies
            httpRequest.CookieContainer = this.Cookies;

            try
            {

                if (request.Method == Method.POST)
                {
                    // 设置发送方式
                    httpRequest.Method = request.Method.ToString();
                    // 获取发送数据流
                    //HttpWebResponse response = httpRequest.GetResponse() as HttpWebResponse;

                    Stream strem = httpRequest.GetRequestStream();

                    // 写入发送数据
                    byte[] bs = request.ToBytes();
                    strem.Write(bs, 0, bs.Length);
                    strem.Close();
                }

                HttpWebResponse httpResponse = httpRequest.GetResponse() as HttpWebResponse;

                Stream responseStream = httpResponse.GetResponseStream();

                //if (responseStream.CanSeek)
                //{
                response.Image = Image.FromStream(responseStream);
                //}
                //else
                //{
                //   response.Image = null;
                //}
                response.RemoteDateTime = Convert.ToDateTime(httpResponse.GetResponseHeader("Date"));

                this.Cookies.Add(httpResponse.Cookies);
                response.Cookies = this.Cookies;
                response.StatusCode = httpResponse.StatusCode;
                responseStream.Dispose();
                responseStream.Close();
            }
            catch (Exception ex)
            {
                if (this.Connection_TimeOut != null)
                    this.Connection_TimeOut.Invoke(url, request, ex);
            }

            return response;
        }
        #endregion

        #region 异步获取远程HTML
        /// <summary>
        /// 异步获取远程HTML
        /// </summary>
        /// <param name="sUrl">地址</param>
        /// <returns></returns>
        public void BeginGetHTML(string sUrl)
        {
            BeginGetHTML(sUrl, false, new Request() { });
        }
        /// <summary>
        /// 异步获取远程HTML
        /// </summary>
        /// <param name="sUrl">地址</param>
        /// <param name="send">是否自动重定向URL</param>
        /// <returns></returns>
        public void BeginGetHTML(string sUrl, bool bAllowAutoRedirect)
        {
            BeginGetHTML(sUrl, bAllowAutoRedirect, new Request() { });
        }
        /// <summary>
        /// 异步获取远程HTML
        /// </summary>
        /// <param name="sUrl">地址</param>
        /// <param name="send">发送内容</param>
        /// <returns></returns>
        public void BeginGetHTML(string sUrl, Request request)
        {
            BeginGetHTML(sUrl, false, request);
        }
        /// <summary>
        /// 异步获取远程HTML
        /// </summary>
        /// <param name="sUrl">地址</param>
        /// <param name="bAllowAutoRedirect">是否自动跳转</param>
        /// <param name="send">发送内容</param>
        /// <returns></returns>
        public void BeginGetHTML(string sUrl, bool bAllowAutoRedirect, Request request)
        {
            Response result = new Response();

            if (request.Method == Method.GET)
            {
                string sData = request.ToString();
                if (sData.Length > 0) sUrl = string.Format("{0}?{1}", sUrl, sData);
            }

            HttpWebRequest httpRequest = (HttpWebRequest)WebRequest.Create(sUrl);
            // 设置发送头信息
            SetRequestHeader(ref httpRequest, new Uri(sUrl).Host);
            // 自动重定向
            httpRequest.AllowAutoRedirect = bAllowAutoRedirect;

            if (request.Method == Method.POST)
            {
                // 设置发送方式
                httpRequest.Method = request.Method.ToString();

                // 获取发送数据流
                Stream stream = httpRequest.GetRequestStream();

                byte[] bs = request.ToBytes();
                stream.Write(bs, 0, bs.Length);
                stream.Close();
                //httpRequest.BeginGetRequestStream(new AsyncCallback(GetRequestStreamCallback),httpRequest);
                // 写入发送数据

            }

            //HttpWebResponse httpResponse = httpRequest.GetResponse() as HttpWebResponse;

            AsyncCallback callback = new AsyncCallback(GetResponseStreamCallback);
            try
            {
                httpRequest.BeginGetResponse(callback, httpRequest);
            }
            catch (WebException ex)
            {
                if (this.Connection_TimeOut != null)
                    this.Connection_TimeOut.Invoke(sUrl, request, ex);
            }
        }

        private void GetRequestStreamCallback(IAsyncResult ar)
        {
            //Request request = ar.AsyncState as Request;
            //Stream stream = async.EndGetRequestStream(ar);

            //byte[] bs = request.ToBytes();
            //stream.Write(bs, 0, bs.Length);
            //stream.Close();
        }

        private void GetResponseStreamCallback(IAsyncResult ar)
        {
            HttpWebRequest httpRequest = ar.AsyncState as HttpWebRequest;
            HttpWebResponse httpResponse = httpRequest.EndGetResponse(ar) as HttpWebResponse;

            Stream responseStream = httpResponse.GetResponseStream();

            Response response = new Response();

            response.Html = GzipStreame(httpResponse.ContentEncoding, responseStream);
            response.RemoteDateTime = Convert.ToDateTime(httpResponse.GetResponseHeader("Date"));
            //response.Cookies = httpResponse.Cookies;

            if (this.Connection_Complete != null)
                this.Connection_Complete.Invoke(response);
        }
        #endregion
    }

 

你可能感兴趣的:(request)