110,530
社区成员
发帖
与我相关
我的任务
分享
// Sample HTML fragment: two list rows (class "listrow2" and "listrow1"), each holding
// an icon cell, a cell with a link, and a cell with a date, followed by a separator row.
string html="<tr height=\"23\" class=\"listrow2\">\n <td>\n <div align=\"center\">\n <img "
+"height=\"9\" width=\"10\"\n src=\"/public/search/zbw/images/cio_pic.jpg\" "
+"/>\n <!-- <img height=\"9\" width=\"10\"\n "
+"src=\"http://www.baidu.com/zbw/images/cio_pic.jpg\" /> -->\n </div>\n <input "
+"type=\"hidden\" value=\"VIPXM\" name=\"table_nam"
+"e2\">\n </td>\n <td>\n <a target=\"_blank\" "
+"href=\"http://www.baidu.com/cblcn/InfoShow/zbgg?record_id=BwRe\">标题a</a>\n "
+"</td>\n <td>\n 2012-04-06\n </td>\n </tr>\n <tr>\n <td height=\"3\" "
+"background=\"/public/search/zbw/images/cio.jpg\"\n class=\"tit_bg\" "
+"colspan=\"3\">\n <!-- background=\"http://www.baidu.com/zbw/images/cio.jpg\" "
+"-->\n </td>\n </tr>\n \n <tr height=\"23\" class=\"listrow1\">\n <td>\n "
+" <div align=\"center\">\n <img height=\"9\" width=\"10\"\n "
+"src=\"/public/search/zbw/images/cio_pic.jpg\" />\n <!-- <img height=\"9\" "
+"width=\"10\"\n src=\"http://www.baidu.com/zbw/images/cio_pic.jpg\" /> -->\n "
+"</div>\n <input type=\"hidden\" value=\"VIPXM\" name=\"table_name2\">\n "
+"</td>\n <td>\n <a target=\"_blank\" "
+"href=\"http://www.baidu.com/cblcn/InfoShow/zbgg?record_id=BwRU\">标题b</a>\n "
+"</td>\n <td>\n 2012-04-06\n </td>\n </tr>\n <tr>\n <td height=\"3\" background=\"/public/search/zbw/images/cio.jpg\"\n class=\"tit_bg\" "
+"colspan=\"3\">\n <!-- background=\"http://www.baidu.com/zbw/images/cio.jpg\" "
+ "-->\n </td>\n </tr>\n \n ";

// Pattern for a <td> that contains an <a> element, immediately followed by a <td>
// that contains a yyyy-MM-dd date. Named groups:
//   url  - the href value; the optional opening delimiter (quote or whitespace) is
//          captured as group 1 and must be repeated after the value via \1
//   text - the anchor's inner text (lazy, so it stops at the first </a>)
//   date - the date found in the following cell
const string linkRowPattern = @"<td>\s*<a[^>]*?href=(['""\s]?)(?<url>[^'""\s]+)\1[^>]*?>(?<text>.*?)</a>\s*</td>\s*<td>\s*(?<date>\d{4}-\d{2}-\d{2})\s*</td>";
Regex linkRow = new Regex(linkRowPattern);

// Print one "url text date" line per matching row.
MatchCollection hits = linkRow.Matches(html);
for (int i = 0; i < hits.Count; i++)
{
    GroupCollection parts = hits[i].Groups;
    Console.WriteLine("{0} {1} {2}", parts["url"].Value, parts["text"].Value, parts["date"].Value);
}
/*
Expected output:
http://www.baidu.com/cblcn/InfoShow/zbgg?record_id=BwRe 标题a 2012-04-06
http://www.baidu.com/cblcn/InfoShow/zbgg?record_id=BwRU 标题b 2012-04-06
*/