网页源代码截取
using System;
using System.Collections.Generic;
using System.ComponentModel;
using System.Data;
using System.Drawing;
using System.Text;
using System.Windows.Forms;
using System.Net;
using System.IO;
namespace WindowsApplication2
{
/// <summary>
/// Form that downloads the HTML source of a fixed URL and displays it as text.
/// </summary>
public partial class Form1 : Form
{
    /// <summary>
    /// Creates the form and runs the designer-generated initialization.
    /// </summary>
    public Form1()
    {
        InitializeComponent();
    }

    /// <summary>
    /// Click handler: issues a synchronous HTTP GET to the hard-coded URL, reads the
    /// whole response body decoded as gb2312, and assigns it to <c>richTextBox1.Text</c>.
    /// </summary>
    /// <param name="sender">Event source (unused).</param>
    /// <param name="e">Event data (unused).</param>
    private void button1_Click(object sender, EventArgs e)
    {
        string url = "http://www.baidu.com";
        HttpWebRequest req = (HttpWebRequest)WebRequest.Create(url);

        // Dispose the response and the reader deterministically; leaving them open
        // keeps the underlying connection and stream alive until finalization.
        using (HttpWebResponse res = (HttpWebResponse)req.GetResponse())
        using (StreamReader strm = new StreamReader(res.GetResponseStream(), Encoding.GetEncoding("gb2312")))
        {
            // The body is always decoded as gb2312, independent of any charset the
            // server reports.
            richTextBox1.Text = strm.ReadToEnd();
        }
    }
}
}
我现在已经得到了网页的源代码，想从中提取有用的部分，
例如 <title> 和 </title> 之间的内容。
这个该如何写呢？