37,720
社区成员
发帖
与我相关
我的任务
分享
#-*-coding:utf8-*-
import requests
import sys
from lxml import etree
# Fetch one course-listing page and print the text of the <a> nodes matched by
# the XPath below.
#
# The reload(sys) / sys.setdefaultencoding('gbk') hack is intentionally gone:
# sys.setdefaultencoding() does not exist on Python 3 and reload() is no longer
# a builtin there. print() of text encodes for the output stream on its own.
# Every print() call below takes a single argument, so it behaves the same on
# Python 2 and Python 3.
url = 'http://www.jikexueyuan.com/course/902_2.html?ss=1'

# A timeout keeps the script from blocking forever on an unresponsive server.
html = requests.get(url, timeout=10)
# Fail loudly on an HTTP error instead of silently scraping an error page.
html.raise_for_status()

# Hand lxml the raw response bytes rather than pre-decoded text.
selector = etree.HTML(html.content)

# Extract the text
content = selector.xpath('//*[@id="pager"]/div[3]/div[2]/div[2]/ul/li[1]/div/h2/a/text()')

# Show the whole result list first, then each matched string on its own line.
print(content)
for each in content:
    print(each)
不要再调用 sys.setdefaultencoding 了：Python 3 已经取消了这个功能（字符串默认就是 Unicode），reload 也不再是内置函数。