Python 抓取 Web 页面
retval=urlretrieve(url)[0] 不知道是什么意思,能不能解释一下?
from urllib import urlretrieve
def firstNonBlank(lines):
    """Return the first line in *lines* that is not blank.

    A line counts as blank when ``strip()`` leaves an empty string, i.e.
    the line is empty or consists only of whitespace.

    Args:
        lines: An iterable of strings.

    Returns:
        The first non-blank string, unmodified (leading/trailing
        whitespace and any newline are kept), or ``None`` when *lines* is
        empty or contains only blank lines.
    """
    for eachline in lines:
        if eachline.strip():
            return eachline
    # No non-blank line was found; say so explicitly rather than relying
    # on the implicit fall-through return value.
    return None
def firstlast(webpage):
    """Print the first and the last non-blank line of a file.

    The file is read completely, then ``firstNonBlank`` is applied once to
    the lines in file order and once to the lines in reverse order. Each
    line found is written to standard output exactly as it was read, with
    nothing appended. If the file has a single non-blank line, that line
    is written twice; if it has none, nothing is written.

    Args:
        webpage: Path of the file to read.

    Errors raised while opening or reading the file are not caught here.
    """
    # Function-scope import keeps this block independent of the file's
    # import section.
    import sys

    # The context manager closes the file even if reading raises.
    with open(webpage) as f:
        lines = f.readlines()

    first = firstNonBlank(lines)
    # Scanning the reversed list from its start yields the last non-blank
    # line of the file.
    lines.reverse()
    last = firstNonBlank(lines)

    for line in (first, last):
        # firstNonBlank gives None when no non-blank line exists; skip it
        # instead of printing the text "None".
        if line is not None:
            sys.stdout.write(line)
def download(url='http://www.xiaonei.com',
             process=firstlast):
    """Download *url* to a local file and pass that file's path to *process*.

    ``urlretrieve(url)`` returns a ``(filename, headers)`` tuple, where
    ``filename`` is the path of the local file the content was saved to.
    The ``[0]`` index therefore selects that local path, which is what
    *process* receives.

    Args:
        url: Address of the page to fetch.
        process: Callable invoked with the local file path after a
            successful download.

    Returns:
        None. If the download raises ``IOError`` the error is swallowed
        and *process* is not called.
    """
    try:
        # Keep only element 0 of the (filename, headers) result.
        retval = urlretrieve(url)[0]
    except IOError:
        # Best effort: a failed download is silently ignored.
        return
    if retval:
        process(retval)
if __name__ == '__main__':
    # Run the default download only when executed as a script, not when
    # the module is imported.
    download()