抓取一网页的数据,但这个网页需要登录后才能获得页面数据
问题是这样的:我需要抓取一个网页的数据,但这个网页需要登录后才能获得页面数据。
具体需求:
有一个登录页面 a。
输入用户名、密码并登录后,进入页面 b;在 b 页面上有一个查询框,输入关键字后可以查到所需的资料。
现在我想抓取输入关键字后查到的这些资料,应该如何实现?
a页面HTML代码:
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
<HTML xmlns="http://www.w3.org/1999/xhtml" >
<head>
<!-- Document metadata for the login page. The GENERATOR / CODE_LANGUAGE / vs_* entries are
     Visual Studio designer metadata. -->
<title>登录</title>
<meta content="Microsoft Visual Studio 7.0" name="GENERATOR" />
<meta content="C#" name="CODE_LANGUAGE" />
<meta content="JavaScript" name="vs_defaultClientScript" />
<meta content="http://schemas.microsoft.com/intellisense/ie5" name="vs_targetSchema" />
<style type="text/css">
/* Thin-bordered, fixed-size look used by the text inputs that carry class="box".
   sans-serif is left unquoted on purpose: quoted, it would name a font called
   "sans-serif" instead of selecting the generic fallback family. */
.box {
  border: 1px solid #00000e;
  width: 95px;
  height: 18px;
  color: black;
  font-family: Verdana, Arial, Helvetica, sans-serif;
}
</style>
</head>
<body background="Images/bg.jpg" style="font-family:宋体; font-size:12px;">
<form name="Form1" method="post" action="Default.aspx" id="Form1" onsubmit="return CheckForm()">
<!-- Hidden ASP.NET Web Forms state fields, submitted with every POST of Form1.
     __EVENTTARGET and __EVENTARGUMENT start empty and are filled in by __doPostBack()
     right before it submits the form. __VIEWSTATE holds an opaque value (presumably
     issued by the server for this page; confirm) that is sent back unchanged.
     __LASTFOCUS is not referenced by any script visible in this page. -->
<div>
<input type="hidden" name="__LASTFOCUS" id="__LASTFOCUS" value="" />
<input type="hidden" name="__EVENTTARGET" id="__EVENTTARGET" value="" />
<input type="hidden" name="__EVENTARGUMENT" id="__EVENTARGUMENT" value="" />
<input type="hidden" name="__VIEWSTATE" id="__VIEWSTATE" value="/wEPDwUKLTM4NDEzMjcxOA9kFgICAQ9kFgQCAQ9kFgJmD2QWAmYPZBYCAgEPEGRkFgFmZAIDDxYCHgdWaXNpYmxlaGRku2Xu3swCz7Do+clUU0V1cnHylvQ=" />
</div>
<script type="text/javascript">
//<![CDATA[
// Resolve the page's form once: take it from the document.forms collection,
// and fall back to the named-property lookup when that yields nothing.
var theForm = document.forms['Form1'] || document.Form1;
/**
 * Posts the form back to the server on behalf of a control.
 *
 * When the form has an onsubmit handler it is run first, and the post-back is
 * abandoned if that handler returns a value loosely equal to false. Otherwise
 * the event target and argument are written to the hidden fields and the form
 * is submitted.
 *
 * @param eventTarget   value written to the __EVENTTARGET hidden field
 * @param eventArgument value written to the __EVENTARGUMENT hidden field
 */
function __doPostBack(eventTarget, eventArgument) {
    // Guard: a present handler that vetoes the submit ends the post-back here.
    if (theForm.onsubmit && theForm.onsubmit() == false) {
        return;
    }

    theForm.__EVENTTARGET.value = eventTarget;
    theForm.__EVENTARGUMENT.value = eventArgument;
    theForm.submit();
}
//]]>
</script>
<!-- External script resources served through WebResource.axd. The ampersand between the
     query parameters is written as &amp;, as XHTML requires inside attribute values;
     the browser decodes it back to the same URL. -->
<script src="/Web/WebResource.axd?d=VL6BGXIlsSRn1JfExdojlQ2&amp;t=633911728051406250" type="text/javascript"></script>
<script src="/Web/WebResource.axd?d=899UgtWKK1ld1MgTOEjycQ2&amp;t=633911728051406250" type="text/javascript"></script>
<!-- Hidden __EVENTVALIDATION field: an opaque value submitted together with Form1.
     NOTE(review): presumably issued by the server and checked on post-back; confirm
     against the server-side page. -->
<div>
<input type="hidden" name="__EVENTVALIDATION" id="__EVENTVALIDATION" value="/wEWCgK8trP/CAKJm9GxDwLnrY36DgL6/rDvCQLlpoTSDALC7/GkAwKQ6qicBQKl1bK4CQK1qbSRCwLCi9reAwJ38okiwmFdHJ81o5upMrWijfO/" />
</div>
<script language="javascript">
/**
 * onsubmit handler of Form1; it always lets the submission proceed.
 *
 * The empty-username / empty-password checks that followed the leading
 * `return true;` could never run and have been removed as dead code.
 * Do not simply re-add them here: __doPostBack() also invokes the form's
 * onsubmit handler, so rejecting empty fields in this function would block
 * the post-back triggered by changing the ddlSystem drop-down until both
 * fields are filled in.
 *
 * @returns {boolean} always true
 */
function CheckForm()
{
    return true;
}
/**
 * Points Form1 at the local test endpoint and overwrites the value of the
 * __VIEWSTATE hidden field with a fixed string.
 *
 * Both elements are looked up by id with document.getElementById rather than
 * through the deprecated document.all collection.
 *
 * NOTE(review): nothing in the markup shown here calls this function; it looks
 * like a leftover debugging helper. Confirm before relying on it.
 */
function OnSubmit()
{
    document.getElementById("Form1").action = "http://localhost/webtest/default.aspx";
    document.getElementById("__VIEWSTATE").value = "/wEPDwULLTE3MjkyOTU5NTgPZBYCAgEPZBYCAgMPFgIeB1Zpc2libGVoZGRMic+N6noF8f8g3IIOTEa0lsUeBw==";
}
</script>
<!-- Login panel: an outer full-size table centres the bordered "tableLogin" table, which holds
     a three-column grid (caption, control, action) for the system selector, user name and
     password. Element and attribute names are lower-case so every closing tag matches its
     opening tag, and each caption is a label bound to its control by id. -->
<table height="100%" cellspacing="0" cellpadding="0" width="100%" border="0">
  <tbody>
    <tr>
      <td style="height: 472px">
        <table id="tableLogin" align="center" cellspacing="0" cellpadding="0" width="550" height="264" background="Images/main.jpg" border="1" bordercolor="#000099">
          <tr>
            <td>
              <div align="center">
                <table cellspacing="0" cellpadding="2" width="100%" border="0">
                  <tbody align="center">
                    <!-- Spacer row above the controls. -->
                    <tr align="center">
                      <td style="height: 35px"></td>
                      <td width="150" style="height: 35px"></td>
                      <td width="78" style="height: 35px"></td>
                    </tr>
                    <!-- System selector: changing it posts the form back through __doPostBack. -->
                    <tr align="center">
                      <td style="height: 32px">
                        <p align="right"><label for="ddlSystem">系 统:</label></p>
                      </td>
                      <td width="150">
                        <select name="ddlSystem" onchange="javascript:setTimeout('__doPostBack(\'ddlSystem\',\'\')', 0)" id="ddlSystem" style="width:152px;">
                          <option selected="selected" value="A">A</option>
                          <option value="B">B</option>
                          <option value="C">C</option>
                          <option value="D">D</option>
                          <option value="E">E</option>
                        </select>
                      </td>
                      <td width="78" style="height: 32px"></td>
                    </tr>
                    <tr align="center">
                      <td>
                        <p align="right"><label for="txtUsername">用户名:</label></p>
                      </td>
                      <td width="150">
                        <input name="txtUsername" type="text" id="txtUsername" class="box" style="width:150px;" />
                      </td>
                      <td width="78"></td>
                    </tr>
                    <tr>
                      <td>
                        <p align="right"><label for="txtPassword">密 码:</label></p>
                      </td>
                      <td width="150">
                        <input name="txtPassword" type="password" id="txtPassword" class="box" style="width:150px;" />
                      </td>
                      <td width="78">
                        <input type="submit" name="btnSubmit" value="登录" id="btnSubmit" style="color:White;background-color:#8080FF;width:60px;" />
                      </td>
                    </tr>
                  </tbody>
                </table>
              </div>
            </td>
          </tr>
        </table>
      </td>
    </tr>
  </tbody>
</table>
<script type="text/javascript">
//<![CDATA[
// Calls WebForm_AutoFocus with the id of the user-name input. The function is not defined
// in the markup shown here; presumably it is supplied by one of the WebResource.axd
// scripts and moves initial focus to that field (TODO confirm).
WebForm_AutoFocus('txtUsername');//]]>
</script>
</form>
</body>
</HTML>