/// <summary>
/// Fetches the resource at the given URL with an HTTP GET request and returns
/// the response body decoded as text.
/// </summary>
/// <param name="URL">Absolute URL of the page to fetch. The created request is cast to
/// <see cref="HttpWebRequest"/>, so a non-HTTP scheme fails with an invalid cast.</param>
/// <param name="charset">Name of the encoding used to decode the response body, e.g. gb2312 or utf-8.</param>
/// <returns>The full response body decoded with the requested encoding.</returns>
public static string GetPageSource(string URL,string charset)
{
    Uri uri = new Uri(URL);
    // Resolve the encoding before any network I/O so an unknown charset name
    // fails fast instead of after a response has already been opened.
    System.Text.Encoding encoding = System.Text.Encoding.GetEncoding(charset);

    HttpWebRequest hwReq = (HttpWebRequest)WebRequest.Create(uri);
    // Request options must be set BEFORE GetResponse(); once the request has
    // been sent, changing them no longer affects it.
    hwReq.Method = "GET";
    hwReq.KeepAlive = false;

    // Dispose the response and reader deterministically so the underlying
    // connection and stream are released even if reading throws.
    using (HttpWebResponse hwRes = (HttpWebResponse)hwReq.GetResponse())
    using (StreamReader reader = new StreamReader(hwRes.GetResponseStream(), encoding))
    {
        return reader.ReadToEnd();
    }
}
/// <summary>
/// Finds every match of a regular expression in the given HTML text.
/// The pattern is evaluated with <see cref="RegexOptions.Singleline"/>, so '.' also matches newlines.
/// </summary>
/// <param name="Htmlstr">Text to search.</param>
/// <param name="Restr">Regular expression pattern to apply.</param>
/// <returns>The collection of matches found in <paramref name="Htmlstr"/>.</returns>
public static MatchCollection GetNewsLink(string Htmlstr,string Restr)
{
    return Regex.Matches(Htmlstr, Restr, RegexOptions.Singleline);
}