2013-05-01 21:42

[C#] 取得 URL 頁面上的 title 內容

  // Namespaces this snippet relies on:
  //using System.Net;
  //using System.IO;
  //using System.Text;
  //using System.Text.RegularExpressions;

  // Downloads the beginning of the page at `url` and extracts the text of its
  // <title> element. `title` stays empty when the request fails or when no
  // complete <title>...</title> pair occurs within the first 4096 characters.
  string url = @"http://msdn.microsoft.com/en-us/library/az24scfc.aspx";
  string title = String.Empty;

  WebRequest request = WebRequest.Create(url);

  // Request timeout, in milliseconds.
  request.Timeout = 10000;

  try {
      // Fetch the page; both the response and the reader are disposed on exit,
      // including when reading or matching throws.
      // NOTE(review): the body is always decoded as UTF-8 regardless of the
      // charset the server declares - confirm this is acceptable for the target pages.
      using (WebResponse response = request.GetResponse())
      using (StreamReader reader = new StreamReader(
          response.GetResponseStream(), Encoding.UTF8)) {

          // Only the first 4096 characters are inspected. ReadBlock keeps reading
          // until the buffer is full or the stream ends, whereas a single Read
          // call may return after the first network chunk.
          char[] buf = new char[4096];
          int charsRead = reader.ReadBlock(buf, 0, buf.Length);

          // Build the text from the characters actually read so that unused
          // buffer slots ('\0') do not end up in the searched text.
          string pageText = new String(buf, 0, charsRead);

          // Look for the title text: whatever sits between <title ...> and </title>.
          string pattern = @"(?<=<title[^>]*>)([^<]*)(?=</title>)";
          title = Regex.Match(pageText, pattern, RegexOptions.IgnoreCase)
                       .Value.Trim();
      }
  } catch (WebException e) {
      // Best effort: leave `title` empty, but report the failure instead of
      // silently swallowing it.
      Console.Error.WriteLine("Failed to fetch " + url + ": " + e.Message);
  }

  // Dump() is not defined in this snippet - presumably LINQPad's output extension.
  title.Dump();

0 回應: