110,539
社区成员
发帖
与我相关
我的任务
分享
/// <summary>
/// Extracts the paper title from the "citation_title" meta tag of an HTML page.
/// </summary>
/// <param name="strHTML">HTML source to search; may be null or empty.</param>
/// <returns>
/// The text of the tag's content attribute, or an empty string when the
/// input is null/empty or the tag is not found.
/// </returns>
private string GetPaperName(string strHTML)
{
    if (string.IsNullOrEmpty(strHTML))
    {
        return string.Empty;
    }

    // The look-behind anchors on the opening of the content attribute; the lazy
    // ".*?" plus the look-ahead stops at the first closing quote. (A "\b" written
    // in a regular C# string is a backspace character, not a regex word boundary,
    // so it must not be used here.)
    Regex re = new Regex("(?<=<meta name=\"citation_title\" content=\").*?(?=\")");
    Match ma = re.Match(strHTML);
    return ma.Success ? ma.Value : string.Empty;
}
/// <summary>
/// Downloads the source of a web page with an HTTP GET request and returns it as text.
/// </summary>
/// <param name="url">Absolute URL of the page to fetch.</param>
/// <returns>The response body decoded as UTF-8.</returns>
/// <exception cref="UriFormatException">Thrown when <paramref name="url"/> is not a valid URI.</exception>
/// <exception cref="WebException">Thrown when the request fails.</exception>
private string GetHttpWebRequest(string url)
{
    Uri uri = new Uri(url);
    HttpWebRequest myReq = (HttpWebRequest)WebRequest.Create(uri);

    // The UserAgent property takes only the header VALUE; the previous text
    // repeated the "User-Agent:" header name and was missing its closing ')'.
    myReq.UserAgent = "Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.2; .NET CLR 1.0.3705)";
    myReq.Accept = "*/*";
    myReq.KeepAlive = true;
    myReq.Headers.Add("Accept-Language", "zh-cn,en-us;q=0.5");

    // "using" guarantees the response, stream and reader are released even when
    // reading throws, so a failed read does not leak the connection.
    using (HttpWebResponse result = (HttpWebResponse)myReq.GetResponse())
    using (Stream receiveStream = result.GetResponseStream())
    using (StreamReader readerOfStream = new StreamReader(receiveStream, System.Text.Encoding.UTF8))
    {
        return readerOfStream.ReadToEnd();
    }
}
// Returns the content attribute of the "citation_title" meta tag found in the
// given HTML, or an empty string when no such tag is present.
private string GetPaperName(string strHTML)
{
    // Look-behind pins the start of the attribute value; the lazy match ends
    // at the first closing quote.
    Match titleMatch = Regex.Match(
        strHTML,
        "(?<=<meta name=\"citation_title\" content=\").*?(?=\")");

    if (!titleMatch.Success)
    {
        return "";
    }

    return titleMatch.Value;
}