爬虫爬取中国最好大学这个网页得出中国最好大学的排名,初入python,谢谢大佬
import requests
from bs4 import BeautifulSoup
import bs4
def getHTmlText(url):
try:
r = requests.get(url, timeout=30)
r.raise_for_status()
r.encoding = r.apparent_encoding
return r.text
except:
return ""
def fillUnivList(ulist, html):
soup = BeautifulSoup(html, "html.parser")
for tr in soup.find('tbody').children:
if isinstance(tr, bs4.element.Tag):
tds = tr('td')
ulist.append([tds[0].string, tds[1].string, tds[2].string])
def printUnivList(ulist, num):
tplt = "{0:^10}\t{1:{3}^10}\t{2:^10}"
print(tplt.format("排名","学校名称","总分",chr(12288)))
for i in range(num):
u = ulist[i]
print(tplt.format(u[0],u[1],u[2],chr[12288]))
def main():
uinfo = []
url = 'http://www.zuihaodaxue.cn/zuihaodaxuepaiming2017.html'
html = getHTmlText(url)
fillUnivList(uinfo,html)
printUnivList(uinfo,20)
main()
以下是error(共三处):
Traceback (most recent call last):
File "G:/Python练习/untitled1/爬虫中国大学排名.py", line 38, in <module>
main()
File "G:/Python练习/untitled1/爬虫中国大学排名.py", line 37, in main
printUnivList(uinfo,20)
File "G:/Python练习/untitled1/爬虫中国大学排名.py", line 29, in printUnivList
print(tplt.format(u[0],u[1],u[2],chr[12288]))
TypeError: 'builtin_function_or_method' object is not subscriptable
排名 学校名称 总分
Process finished with exit code 1
番外:请大佬指教,初入python,谢谢