1.
/// <summary>
/// Downloads the resource at <paramref name="url"/> and returns its body as text.
/// </summary>
/// <param name="url">Address of the page to download.</param>
/// <returns>
/// The raw response bytes decoded with <c>Encoding.Default</c>. The charset
/// declared by the server is not consulted, so pages in another encoding may
/// come back garbled.
/// </returns>
/// <remarks>
/// Exceptions thrown by <c>WebClient.DownloadData</c> are not caught here and
/// propagate to the caller.
/// </remarks>
private string getHtml(string url)
{
    // WebClient is IDisposable; the using block releases it even when the download throws.
    using (WebClient myWebClient = new WebClient())
    {
        byte[] myDataBuffer = myWebClient.DownloadData(url);
        return Encoding.Default.GetString(myDataBuffer);
    }
}
2.
/// <summary>
/// Fetches <paramref name="HttpUrl"/> with a GET request issued through the
/// MSXML2 XMLHTTP COM component and returns the response body as text.
/// </summary>
/// <param name="HttpUrl">Address to request.</param>
/// <param name="RefererUrl">Value sent in the <c>Referer</c> request header.</param>
/// <returns>
/// The response body decoded with <c>Encoding.Default</c>, or an empty string
/// if any step of the request fails (best-effort: failures are traced, not thrown).
/// </returns>
public string getHttp(string HttpUrl,string RefererUrl)
{
    string html = "";
    MSXML2.XMLHTTP Http = null;
    try
    {
        Http = new MSXML2.XMLHTTPClass();
        // Third argument is the async flag: false makes send() block until the
        // response arrives. "admin"/"admin" are the credentials passed to open().
        Http.open("GET",HttpUrl,false,"admin","admin");
        Http.setRequestHeader("Referer",RefererUrl);
        Http.setRequestHeader("Content-Type", "text/html;charset=gb2312");
        Http.send("");
        html = Encoding.Default.GetString((byte[])Http.responseBody);
    }
    catch (System.Exception ex)
    {
        // Keep the original best-effort contract (return "" on failure), but
        // leave a trace so failures are diagnosable instead of silently lost.
        System.Diagnostics.Trace.TraceWarning("getHttp failed for " + HttpUrl + ": " + ex.Message);
    }
    finally
    {
        // Assigning null does not release a COM object; release the runtime
        // callable wrapper explicitly so the underlying component is freed promptly.
        if (Http != null && System.Runtime.InteropServices.Marshal.IsComObject(Http))
        {
            System.Runtime.InteropServices.Marshal.ReleaseComObject(Http);
        }
    }
    return html;
}
本文介绍了两种不同的网页内容抓取方法。第一种方法使用WebClient类下载网页内容,并将其转换为字符串。第二种方法通过MSXML2.XMLHTTP发送HTTP请求,设置Referer头和Content-Type,获取并返回网页源代码。
889

被折叠的 条评论
为什么被折叠?



