class Spider(object):
def Get(cls,url,pattern):
info = requests.get(url).content
result = re.findall(pattern,info)
for i in result:
print i
return result
MySpider =Spider()
result = MySpider.Get('http://www.xiachufang.com/',u"<a href=\"(.*?)title=\"(.*?)\" .*><span")
print info 可以正常显示中文
可是result中文都显示成了\xe4\xb8\x80\xe7\xa2\x97\xe7\xba\xa2\xe8\xb1\x86\xe6\xb2\x99
研究一天了,头都痛