/// <summary>
/// Downloads the resource at <paramref name="url"/> and returns its bytes decoded as UTF-8 text.
/// </summary>
/// <param name="url">Address of the resource to download.</param>
/// <returns>The downloaded content decoded with <see cref="Encoding.UTF8"/>.</returns>
private string getWebresourceFile1(string url)
{
    // WebClient is IDisposable: the using block releases it even when DownloadData throws.
    using (WebClient client = new WebClient())
    {
        byte[] downloaded = client.DownloadData(url);
        return Encoding.UTF8.GetString(downloaded);
    }
}
我不知道你要读什么,这段代码的作用是读取该网页的源代码。
{ WebClient myWebClient = new WebClient ( );
byte[] myDataBuffer = myWebClient.DownloadData ( url );
string SourceCode = Encoding.UTF8.GetString ( myDataBuffer );
return SourceCode;
}
我不知道你要读什么,这段代码的作用是读取该网页的源代码。
怎么可能读不出来。我看了一下,能读出来,而且超简单,并没有防采集。
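我这里有一段自己写的采集程序:
/// <summary>
/// Requests a page and keeps retrying when the request fails.
/// </summary>
/// <param name="PageUrl">URL of the page to request.</param>
/// <returns>The text read from the response; an empty string after a protocol error.</returns>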
/// <remarks>
/// Fetches <c>PageUrl</c> through the proxy at index <c>proxy</c> of the list <c>al</c> and
/// returns the response text. The request is repeated with the next proxy when the response
/// is empty, when it contains the text "refresh", or when a <see cref="WebException"/> other
/// than a protocol error occurs. A protocol error ends the attempts and yields an empty string.
/// Retries run in a loop (not by recursion), so the text obtained by a successful retry is
/// what the caller receives and repeated failures do not deepen the call stack.
/// </remarks>
public string ToServer(string PageUrl)
{
    while (true)
    {
        try
        {
            WebRequest request = WebRequest.Create(PageUrl);
            // Route the request through the currently selected proxy entry.
            request.Proxy = new WebProxy(al[proxy].ToString(), true);
            request.Timeout = 1000 * 45; // milliseconds

            string responseFromServer;
            // using blocks close the response, stream and reader even when reading throws.
            using (HttpWebResponse response = (HttpWebResponse)request.GetResponse())
            using (Stream dataStream = response.GetResponseStream())
            using (StreamReader reader = new StreamReader(dataStream, System.Text.Encoding.Default))
            {
                responseFromServer = reader.ReadToEnd();
            }

            // A usable page is non-empty and does not contain "refresh"; anything else is retried.
            if (!responseFromServer.Contains("refresh") && responseFromServer != "")
            {
                return responseFromServer;
            }
        }
        catch (WebException ex)
        {
            // A protocol error is not retried; the caller gets an empty result.
            if (ex.Status == WebExceptionStatus.ProtocolError)
            {
                return "";
            }
            // Any other WebException falls through to the next proxy below.
        }

        MoveToNextProxy();
    }
}

/// <summary>
/// Advances to the next proxy entry and reloads the proxy list once the index runs past its end.
/// </summary>
private void MoveToNextProxy()
{
    proxy++;
    if (proxy >= al.Count)
    {
        // NOTE(review): the index is not reset here (unchanged from the original code).
        // Presumably ReadIPproxy or another member resets it; confirm, otherwise al[proxy]
        // is out of range on the next attempt.
        al = ReadIPproxy("e:\\test.txt"); // (re)initialise the proxy IP list
    }
}
using System;
using System.Collections;
using System.ComponentModel;
using System.Data;
using System.Drawing;
using System.Web;
using System.Web.SessionState;
using System.Web.UI;
using System.Web.UI.WebControls;
using System.Web.UI.HtmlControls;
using System.IO;
using System.Net;
using System.Text;
using System.Text.RegularExpressions;

/// <summary>
/// Page that fetches a remote URL and writes the fetched text into its own response.
/// </summary>
public partial class _Default : System.Web.UI.Page
{
    /// <summary>
    /// Writes a marker string followed by the text fetched from the book-store URL.
    /// </summary>
    /// <param name="sender">Event source (unused).</param>
    /// <param name="e">Event data (unused).</param>
    protected void Page_Load(object sender, EventArgs e)
    {
        Response.Write("what is this?");
        Response.Write(ToServer("http://www.qidian.com/Book/BookStore.aspx"));
    }

    /// <summary>
    /// Requests <paramref name="PageUrl"/> and returns the response body as text.
    /// </summary>
    /// <param name="PageUrl">URL of the page to request.</param>
    /// <returns>
    /// The response text decoded with <see cref="System.Text.Encoding.Default"/>, or an empty
    /// string when a <see cref="WebException"/> occurs.
    /// </returns>
    public string ToServer(string PageUrl)
    {
        string responseFromServer = "";
        try
        {
            WebRequest request = WebRequest.Create(PageUrl);
            // using blocks close the response, stream and reader even when reading throws.
            using (HttpWebResponse response = (HttpWebResponse)request.GetResponse())
            using (Stream dataStream = response.GetResponseStream())
            // NOTE(review): Encoding.Default is the machine's ANSI code page; if the page is
            // served in another charset the text will be garbled. Confirm the site's encoding.
            using (StreamReader reader = new StreamReader(dataStream, System.Text.Encoding.Default))
            {
                responseFromServer = reader.ReadToEnd();
            }
        }
        catch (WebException ex)
        {
            // Best-effort fetch: still return "" on failure, but record why instead of
            // swallowing the error silently.
            System.Diagnostics.Trace.TraceWarning("ToServer failed for " + PageUrl + ": " + ex.Message);
        }
        return responseFromServer;
    }
}
经过测试,http://www.qidian.com/Book/BookStore.aspx 网页的内容还是保存不回来,其它的网站都可以;