asp.net C# 获取网页源码的几种方式
System.Net.WebClient aWebClient = new System.Net.WebClient(); aWebClient.Encoding = System.Text.Encoding.Default; Byte[] pageData = aWebClient.DownloadData(url); string nhtml = Encoding.GetEncoding("utf-8").GetString(pageData);
2方法
System.Net.WebClient aWebClient = new System.Net.WebClient(); aWebClient.Encoding = System.Text.Encoding.Default; string nhtml = aWebClient.DownloadString(goodstidurl);
3方法
WebBrowser webbrowser = new WebBrowser(); StreamReader sr = new StreamReader(this.webBTaobao.DocumentStream, Encoding.Default); html = sr.ReadToEnd(); html = html.Replace("\r\n", ""); html = html.Replace("\n", ""); html = html.Replace(" ", ""); html = html.Replace("(", ""); html = html.Replace(")", ""); string nurl = Regex.Match(html, "(?<=data-url=\").*?(?=\")").Value; //新建一个WebBrowser WebBrowser webAddress = new WebBrowser(); webAddress.Navigate(nurl); //等待加载完成 while (webAddress.ReadyState < WebBrowserReadyState.Complete) Application.DoEvents(); StreamReader sraddress = new StreamReader(webAddress.DocumentStream, Encoding.Default); jsonaddress = sraddress.ReadToEnd();
4方法
WebRequest hwr = WebRequest.Create(@"http://item.taobao.com/item.htm?id=" + row["urlId"].ToString());//向指定Url发出请求 HttpWebResponse hwp = hwr.GetResponse() as HttpWebResponse;//将hwr对HTTP的请求 string text; StreamReader sr; string code = hwp.ContentType;//请求响应得到的内容类型 //得到编码了 code = code.Split('=')[1]; Stream rep = hwp.GetResponseStream();//将请求得到的内容以流的形式读出 sr = new StreamReader(rep, Encoding.GetEncoding(code));//用指定的字符编码为指定的流初始化
郑重声明:本站内容如果来自互联网及其他传播媒体,其版权均属原媒体及文章作者所有。转载目的在于传递更多信息及用于网络分享,并不代表本站赞同其观点和对其真实性负责,也不构成任何其他建议。