获取网页的源码

来源:互联网 发布:泡利矩阵 编辑:程序博客网 时间:2024/05/20 03:42

方法一(使用 HttpWebRequest):

 public  System.Text.StringBuilder GetPageSource(string url)
  {
   HttpWebRequest request = (HttpWebRequest) WebRequest.Create(url);
   request.Timeout = 15000;
   request.KeepAlive = false;
   StreamReader sr = null;
   HttpWebResponse response = null;
   Stream res = null;
   System.Text.StringBuilder sb = new StringBuilder();
   try
   {
    response = (HttpWebResponse) request.GetResponse();
    res = response.GetResponseStream();
    sr = new StreamReader(res,System.Text.Encoding.Default);
    sb.Append(sr.ReadToEnd().ToLower());
   }
   catch
   {  }
   finally
   {
    if(sr!=null)
     sr.Close();
    if(res!=null)
     res.Close();
   }
   return sb;
  }

方法二(使用 MSXML2 的 XMLHTTP 组件):

 public  StringBuilder GetPageXML(string url,string startStr,string endStr)
  {
   System.Text.StringBuilder sb = new StringBuilder();
   baseClass bc = new baseClass();
   try
   {
    MSXML2.XMLHTTP60Class  _xmlhttp = new MSXML2.XMLHTTP60Class();
    _xmlhttp.open("GET",url,false,null,null);
    _xmlhttp.setRequestHeader("CONTENT-TYPE","text/xml;charset=gb2312");         
    _xmlhttp.setRequestHeader("USER-AGENT","China89bot/1.0+(+http://www.55125.cn/bots/bot.html)Sam/20070205");           
    _xmlhttp.send("");
    if(_xmlhttp.status==200)
    {
     string str = System.Text.Encoding.GetEncoding("gb2312").GetString((byte[])_xmlhttp.responseBody);
     sb.Append(cutString(str.ToLower(),startStr,endStr));
    }
    else
    {
     sb.Append("");
    }
   }
   catch
   { sb.Append(""); }
   return sb;
  }