平時也常常採集網站數據,也作模擬登陸,但通常都是html控件POST到頁面登陸;尚未遇到用戶服務器控件button按鈕點擊事件登陸的,今天像往常同樣POST傳遞參數,但怎麼都能登陸不了;最後發現還有兩個參數須要傳,__EVENTVALIDATION和__VIEWSTATEhtml
在傳的過程當中須要對參數值進行URL編碼服務器
System.Web.HttpUtility.UrlEncode(value)
模擬登陸代碼:在本地寫的一個測試的網站來模擬登陸,原理都同樣:app
Request request = new Request(); request.Method = Method.POST; request.Add("UserName", "1"); request.Add("PassWord", "1"); request.Add("btnLogin", "Button"); HtmlHelper html = new HtmlHelper(); Response response = html.GetHTML("http://localhost:64554/Lgoin.aspx"); Match math = Regex.Match(response.Html, "<input type=\"hidden\" name=\"__VIEWSTATE\" id=\"__VIEWSTATE\" value=\"(?<val>.*?)\" />", RegexOptions.Singleline | RegexOptions.IgnoreCase); string value = math.Groups["val"].Value; request.Add("__VIEWSTATE", System.Web.HttpUtility.UrlEncode(value)); math = Regex.Match(response.Html, "<input type=\"hidden\" name=\"__EVENTVALIDATION\" id=\"__EVENTVALIDATION\" value=\"(?<val>.*?)\" />", RegexOptions.Singleline | RegexOptions.IgnoreCase); request.Add("__EVENTVALIDATION", System.Web.HttpUtility.UrlEncode(math.Groups["val"].Value)); response = html.GetHTML("http://localhost:64554/Lgoin.aspx", true, request);
這裏發佈哈,我平時用的HttpHelper類異步
#region 發送方式 public enum Method { GET, POST } #endregion #region 返回內容 /// <summary> /// 返回內容 /// </summary> public class Response { #region 遠程服務器時間 DateTime _RemoteDateTime = Convert.ToDateTime("1900-01-01 00:00:00.000"); /// <summary> /// 遠程服務器時間 /// </summary> public DateTime RemoteDateTime { get { return _RemoteDateTime; } set { _RemoteDateTime = value; } } #endregion #region 返回內容 string html = string.Empty; /// <summary> /// 返回內容 /// </summary> public string Html { get { return html; } set { html = value; } } #endregion #region 返回的Cookies CookieContainer _Cookies = new CookieContainer(); /// <summary> /// 返回的Cookies /// </summary> public CookieContainer Cookies { get { return _Cookies; } set { _Cookies = value; } } #endregion #region HTTP狀態代碼 /// <summary> /// HTTP狀態代碼 /// </summary> public HttpStatusCode StatusCode { get; set; } #endregion #region 返回的圖片內容 Image _Image = null; /// <summary> /// 返回的圖片內容 /// </summary> public Image Image { get { return _Image; } set { _Image = value; } } #endregion #region 當前URL string _Url = string.Empty; /// <summary> /// 當前URL /// </summary> public string Url { get { return _Url; } set { _Url = value; } } #endregion } #endregion #region 發送數據 /// <summary> /// 發送數據 /// </summary> [Serializable] public class Request { List<KeyValuePair<string, string>> sList = new List<KeyValuePair<string, string>>(); Method _sendMethod = Method.GET; public Method Method { get { return _sendMethod; } set { _sendMethod = value; } } private CookieContainer _Cookies = new CookieContainer(); public CookieContainer Cookies { get { return this._Cookies; } set { this._Cookies = value; } } public void Clear() { this.sList.Clear(); } public void Add(string key, string value) { this.sList.Add(new KeyValuePair<string, string>(key, value)); } public void Update(string key, string value) { int index = -1; for (int i = 0; i < this.List.Count; i++) { if (this.List[i].Key.Equals(key)) { index = i; break; } } if (index > 0) this.List.RemoveAt(index); this.List.Add(new KeyValuePair<string, string>(key, value)); } public override string ToString() { string sRet = string.Empty; foreach (KeyValuePair<string,string> val in this.sList) { if (sRet.Length == 0) sRet = string.Format("{0}={1}", val.Key, val.Value); else sRet = string.Format("{0}&{1}={2}", sRet, val.Key, val.Value); } return sRet; } public byte[] ToBytes() { return Encoding.ASCII.GetBytes(this.ToString()); } public List<KeyValuePair<string,string>> List { set { this.sList = value; } get { return this.sList; } } public string Find(string key) { string sRet = string.Empty; KeyValuePair<string, string> val = this.List.Find(delegate(KeyValuePair<string, string> k) { return k.Key.Equals(key); }); sRet = val.Value; return sRet; } } #endregion public class HtmlHelper { public static HtmlHelper Init() { return new HtmlHelper(); } #region Cookies CookieContainer _Cookies = new CookieContainer(); /// <summary> /// Cookies /// </summary> public CookieContainer Cookies { get { return _Cookies; } set { _Cookies = value; } } #endregion #region 鏈接遠程服務器超時觸發事件 public delegate void Connection_TimeOut_Handle(string sUrl, Request request, Exception ex); /// <summary> /// 鏈接遠程服務器超時觸發事件 /// </summary> public event Connection_TimeOut_Handle Connection_TimeOut; #endregion #region 獲取數據完畢觸發事件 public delegate void Connection_Complete_Handle(Response response); /// <summary> /// 獲取數據完畢觸發事件 /// </summary> public event Connection_Complete_Handle Connection_Complete; #endregion #region 設置發送頭信息 /// <summary> /// 設置發送頭信息 /// </summary> /// <param name="request"></param> private void SetRequestHeader(ref HttpWebRequest request, string referer) { request.Timeout = 5000; request.Accept = "*/*"; request.UserAgent = "Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.2; SV1; .NET CLR 2.0.50727;)"; request.Headers["Accept-Encoding"] = "gzip, deflate"; request.Headers["Accept-Language"] = "zh-cn"; request.Headers["Accept-Charset"] = "utf-8;q=0.7,*;q=0.7"; request.ContentType = "application/x-www-form-urlencoded"; request.Referer = referer; request.KeepAlive = true; } #endregion #region 解壓通過Gzip壓縮的流 /// <summary> /// 解壓通過Gzip壓縮的流 /// </summary> /// <param name="contentEncoding">流編碼</param> /// <param name="resonseStream">網頁返回的流內容</param> /// <returns></returns> private string GzipStreame(string ecoding, Stream resonseStream) { return GzipStreame(ecoding, resonseStream, Encoding.UTF8); } private string GzipStreame(string ecoding, Stream resonseStream, Encoding coding) { string html = string.Empty; if (ecoding.ToLower().IndexOf("gzip") != -1) { html = new StreamReader(new GZipStream(resonseStream, CompressionMode.Decompress), coding).ReadToEnd(); } else if (ecoding.ToLower().IndexOf("deflate") >= 0) { html = new StreamReader(new DeflateStream(resonseStream, CompressionMode.Decompress), coding).ReadToEnd(); } else { html = new StreamReader(resonseStream, coding).ReadToEnd(); } return html; } #endregion #region 獲取遠程HTML /// <summary> /// 獲取遠程HTML /// </summary> /// <param name="url">地址</param> /// <returns></returns> public Response GetHTML(string url) { return GetHTML(url, false, new Request(), new Uri(url).Host, Encoding.UTF8, null); } public Response GetHTML(string url, WebProxy proxy) { return GetHTML(url, false, new Request(), new Uri(url).Host, Encoding.UTF8, proxy); } public Response GetHTML(string url, Encoding coding) { return GetHTML(url, false, new Request(), new Uri(url).Host, coding, null); } public Response GetHTML(string url, Encoding coding, WebProxy proxy) { return GetHTML(url, false, new Request(), new Uri(url).Host, coding, proxy); } /// <summary> /// 獲取遠程HTML /// </summary> /// <param name="url">地址</param> /// <param name="send">是否自動重定向URL</param> /// <returns></returns> public Response GetHTML(string url, bool bAllowAutoRedirect) { return GetHTML(url, bAllowAutoRedirect, new Request() { }, new Uri(url).Host, Encoding.UTF8, null); } public Response GetHTML(string url, bool bAllowAutoRedirect, WebProxy porxy) { return GetHTML(url, bAllowAutoRedirect, new Request() { }, new Uri(url).Host, Encoding.UTF8, porxy); } /// <summary> /// 獲取遠程HTML /// </summary> /// <param name="sUrl">地址</param> /// <param name="send">發送內容</param> /// <returns></returns> public Response GetHTML(string url, Request request) { return GetHTML(url, request, Encoding.UTF8); } public Response GetHTML(string url, Request request, WebProxy porxy) { return GetHTML(url, false, request, new Uri(url).Host, Encoding.UTF8, porxy); } public Response GetHTML(string url, bool bAllowAutoRedirect, Request request) { return GetHTML(url, bAllowAutoRedirect, request, new Uri(url).Host, Encoding.UTF8, null); } public Response GetHTML(string url, bool bAllowAutoRedirect, Request request, WebProxy proxy) { return GetHTML(url, bAllowAutoRedirect, request, new Uri(url).Host, Encoding.UTF8, proxy); } public Response GetHTML(string url, Request request, Encoding coding) { return GetHTML(url, false, request, new Uri(url).Host, coding, null); } public Response GetHTML(string url, Request request, Encoding coding, WebProxy proxy) { return GetHTML(url, false, request, new Uri(url).Host, coding, proxy); } /// <summary> /// 獲取遠程HTML /// </summary> /// <param name="sUrl">地址</param> /// <param name="bAllowAutoRedirect">是否自動跳轉</param> /// <param name="send">發送內容</param> /// <returns></returns> public Response GetHTML(string sUrl, bool bAllowAutoRedirect, Request request, string referer) { return GetHTML(sUrl, bAllowAutoRedirect, request, referer, Encoding.UTF8, null); } public Response GetHTML(string sUrl, bool bAllowAutoRedirect, Request request, string referer, WebProxy proxy) { return GetHTML(sUrl, bAllowAutoRedirect, request, referer, Encoding.UTF8, proxy); } /// <summary> /// 獲取HTML頁面內容 /// </summary> /// <param name="url">地址</param> /// <param name="bAllowAutoRedirect">是否自動跳轉</param> /// <param name="request">查詢信息</param> /// <param name="referer">引用頁</param> /// <param name="coding">編碼格式</param> /// <returns></returns> public Response GetHTML(string url, bool bAllowAutoRedirect, Request request, string referer, Encoding coding, WebProxy proxy) { Response result = new Response(); if (request.Method == Method.GET) { string sData = request.ToString(); if (sData.Length > 0) url = string.Format("{0}?{1}", url, sData); } HttpWebRequest httpRequest = (HttpWebRequest)WebRequest.Create(url); if (proxy != null) httpRequest.Proxy = proxy; #region SSL方式 if (url.Contains("https://")) { //這一句必定要寫在建立鏈接的前面。使用回調的方法進行證書驗證。 ServicePointManager.ServerCertificateValidationCallback = new System.Net.Security.RemoteCertificateValidationCallback(CheckValidationResult); //建立證書文件 X509Certificate objx509 = new X509Certificate(); //添加到請求裏 httpRequest.ClientCertificates.Add(objx509); } #endregion // 設置發送頭信息 if (referer.Length == 0) SetRequestHeader(ref httpRequest, new Uri(url).Host); else SetRequestHeader(ref httpRequest, referer); // 自動重定向 httpRequest.AllowAutoRedirect = bAllowAutoRedirect; httpRequest.Timeout = 60 * 1000; // 關聯Cookies //if (httpRequest.CookieContainer == null) // httpRequest.CookieContainer = new CookieContainer(); httpRequest.CookieContainer = this.Cookies; try { if (request.Method == Method.POST) { // 設置發送方式 httpRequest.Method = request.Method.ToString(); // 獲取發送數據流 //HttpWebResponse response = httpRequest.GetResponse() as HttpWebResponse; Stream strem = httpRequest.GetRequestStream(); // 寫入發送數據 byte[] bs = request.ToBytes(); strem.Write(bs, 0, bs.Length); strem.Close(); } HttpWebResponse httpResponse = httpRequest.GetResponse() as HttpWebResponse; Stream responseStream = httpResponse.GetResponseStream(); StreamReader sr = new StreamReader(responseStream, coding); //result.Html = sr.ReadToEnd(); result.Html = System.Web.HttpUtility.HtmlDecode(GzipStreame(httpResponse.ContentEncoding, responseStream, coding)); result.RemoteDateTime = Convert.ToDateTime(httpResponse.GetResponseHeader("Date")); result.Url = httpResponse.ResponseUri.OriginalString; this.Cookies.Add(httpResponse.Cookies); result.Cookies = this.Cookies; result.StatusCode = httpResponse.StatusCode; responseStream.Dispose(); if (this.Connection_Complete != null) this.Connection_Complete.Invoke(result); } catch (Exception ex) { if (this.Connection_TimeOut != null) this.Connection_TimeOut.Invoke(url, request, ex); } return result; } private bool CheckValidationResult(object sender, X509Certificate certificate, X509Chain chain, SslPolicyErrors sslPolicyErrors) { return true; } #endregion #region 獲取遠程圖片 public Response GetImage(string sUrl) { return GetImage(sUrl, false, new Request()); } public Response GetImage(string sUrl, WebProxy proxy) { return GetImage(sUrl, false, new Request(), proxy); } public Response GetImage(string sUrl, string referer) { return GetImage(sUrl, false, referer, null); } public Response GetImage(string sUrl, string referer, WebProxy proxy) { return GetImage(sUrl, false, referer, proxy); } public Response GetImage(string sUrl, bool bAllowAutoRedirect, string referer) { return GetImage(sUrl, bAllowAutoRedirect, new Request(), referer, null); } public Response GetImage(string sUrl, bool bAllowAutoRedirect, string referer, WebProxy proxy) { return GetImage(sUrl, bAllowAutoRedirect, new Request(), referer, null); } //public Image GetImage(string sUrl, bool bAllowAutoRedirect, Request request) //{ // return GetImage(sUrl, bAllowAutoRedirect, request, new CookieContainer(), ""); ////} //public Image GetImage(string sUrl, bool bAllowAutoRedirect, Request request, string referer) //{ // return GetImage(sUrl, bAllowAutoRedirect, request,referer); //} /// <summary> /// 獲取遠程圖片 /// </summary> /// <param name="sUrl">圖片地址</param> /// <param name="bAllowAutoRedirect">是否自動跳轉</param> /// <param name="send">發送內容</param> /// <returns></returns> public Response GetImage(string sUrl, bool bAllowAutoRedirect, Request request) { return GetImage(sUrl, bAllowAutoRedirect, request, "", null); } public Response GetImage(string sUrl, bool bAllowAutoRedirect, Request request, string referer) { return GetImage(sUrl, bAllowAutoRedirect, request, referer, null); } public Response GetImage(string sUrl, bool bAllowAutoRedirect, Request request, WebProxy proxy) { return GetImage(sUrl, bAllowAutoRedirect, request, "", proxy); } /// <summary> /// 獲取遠程圖片 /// </summary> /// <param name="sUrl">圖片地址</param> /// <param name="bAllowAutoRedirect">是否自動跳轉</param> /// <param name="send">發送內容</param> /// <returns></returns> public Response GetImage(string url, bool bAllowAutoRedirect, Request request, string referer, WebProxy proxy) { Response response = new Response(); if (request.Method == Method.GET) { string sData = request.ToString(); if (sData.Length > 0) url = string.Format("{0}?{1}", url, sData); } HttpWebRequest httpRequest = (HttpWebRequest)WebRequest.Create(url); if (proxy != null) httpRequest.Proxy = proxy; #region SSL方式 if (url.Contains("https://")) { //這一句必定要寫在建立鏈接的前面。使用回調的方法進行證書驗證。 ServicePointManager.ServerCertificateValidationCallback = new System.Net.Security.RemoteCertificateValidationCallback(CheckValidationResult); //建立證書文件 X509Certificate objx509 = new X509Certificate(); //添加到請求裏 httpRequest.ClientCertificates.Add(objx509); } #endregion // 設置發送頭信息 if (referer.Length == 0) SetRequestHeader(ref httpRequest, new Uri(url).Host); else SetRequestHeader(ref httpRequest, referer); // 自動重定向 httpRequest.AllowAutoRedirect = bAllowAutoRedirect; // 關聯Cookies httpRequest.CookieContainer = this.Cookies; try { if (request.Method == Method.POST) { // 設置發送方式 httpRequest.Method = request.Method.ToString(); // 獲取發送數據流 //HttpWebResponse response = httpRequest.GetResponse() as HttpWebResponse; Stream strem = httpRequest.GetRequestStream(); // 寫入發送數據 byte[] bs = request.ToBytes(); strem.Write(bs, 0, bs.Length); strem.Close(); } HttpWebResponse httpResponse = httpRequest.GetResponse() as HttpWebResponse; Stream responseStream = httpResponse.GetResponseStream(); //if (responseStream.CanSeek) //{ response.Image = Image.FromStream(responseStream); //} //else //{ // response.Image = null; //} response.RemoteDateTime = Convert.ToDateTime(httpResponse.GetResponseHeader("Date")); this.Cookies.Add(httpResponse.Cookies); response.Cookies = this.Cookies; response.StatusCode = httpResponse.StatusCode; responseStream.Dispose(); responseStream.Close(); } catch (Exception ex) { if (this.Connection_TimeOut != null) this.Connection_TimeOut.Invoke(url, request, ex); } return response; } #endregion #region 異步獲取遠程HTML /// <summary> /// 異步獲取遠程HTML /// </summary> /// <param name="sUrl">地址</param> /// <returns></returns> public void BeginGetHTML(string sUrl) { BeginGetHTML(sUrl, false, new Request() { }); } /// <summary> /// 異步獲取遠程HTML /// </summary> /// <param name="sUrl">地址</param> /// <param name="send">是否自動重定向URL</param> /// <returns></returns> public void BeginGetHTML(string sUrl, bool bAllowAutoRedirect) { BeginGetHTML(sUrl, bAllowAutoRedirect, new Request() { }); } /// <summary> /// 異步獲取遠程HTML /// </summary> /// <param name="sUrl">地址</param> /// <param name="send">發送內容</param> /// <returns></returns> public void BeginGetHTML(string sUrl, Request request) { BeginGetHTML(sUrl, false, request); } /// <summary> /// 異步獲取遠程HTML /// </summary> /// <param name="sUrl">地址</param> /// <param name="bAllowAutoRedirect">是否自動跳轉</param> /// <param name="send">發送內容</param> /// <returns></returns> public void BeginGetHTML(string sUrl, bool bAllowAutoRedirect, Request request) { Response result = new Response(); if (request.Method == Method.GET) { string sData = request.ToString(); if (sData.Length > 0) sUrl = string.Format("{0}?{1}", sUrl, sData); } HttpWebRequest httpRequest = (HttpWebRequest)WebRequest.Create(sUrl); // 設置發送頭信息 SetRequestHeader(ref httpRequest, new Uri(sUrl).Host); // 自動重定向 httpRequest.AllowAutoRedirect = bAllowAutoRedirect; if (request.Method == Method.POST) { // 設置發送方式 httpRequest.Method = request.Method.ToString(); // 獲取發送數據流 Stream stream = httpRequest.GetRequestStream(); byte[] bs = request.ToBytes(); stream.Write(bs, 0, bs.Length); stream.Close(); //httpRequest.BeginGetRequestStream(new AsyncCallback(GetRequestStreamCallback),httpRequest); // 寫入發送數據 } //HttpWebResponse httpResponse = httpRequest.GetResponse() as HttpWebResponse; AsyncCallback callback = new AsyncCallback(GetResponseStreamCallback); try { httpRequest.BeginGetResponse(callback, httpRequest); } catch (WebException ex) { if (this.Connection_TimeOut != null) this.Connection_TimeOut.Invoke(sUrl, request, ex); } } private void GetRequestStreamCallback(IAsyncResult ar) { //Request request = ar.AsyncState as Request; //Stream stream = async.EndGetRequestStream(ar); //byte[] bs = request.ToBytes(); //stream.Write(bs, 0, bs.Length); //stream.Close(); } private void GetResponseStreamCallback(IAsyncResult ar) { HttpWebRequest httpRequest = ar.AsyncState as HttpWebRequest; HttpWebResponse httpResponse = httpRequest.EndGetResponse(ar) as HttpWebResponse; Stream responseStream = httpResponse.GetResponseStream(); Response response = new Response(); response.Html = GzipStreame(httpResponse.ContentEncoding, responseStream); response.RemoteDateTime = Convert.ToDateTime(httpResponse.GetResponseHeader("Date")); //response.Cookies = httpResponse.Cookies; if (this.Connection_Complete != null) this.Connection_Complete.Invoke(response); } #endregion }