37,719
社区成员
发帖
与我相关
我的任务
分享
import urllib.request
from lxml import etree
# Scrape listing titles and prices from the Ganji Shanghai "fang1" page using
# only urllib for the download and lxml for the HTML parsing.
url = "http://sh.ganji.com/fang1/"

# The context manager closes the HTTP response even if read() raises, and the
# timeout keeps the script from blocking forever on an unresponsive server.
with urllib.request.urlopen(url, timeout=10) as response:
    resp = response.read()

mystr = resp.decode("utf-8")  # decode the raw bytes into text
print(mystr)  # dump the downloaded page so the markup can be inspected

# The parser is given the raw bytes rather than the decoded string
# (presumably so lxml can do its own encoding detection -- TODO confirm).
selector = etree.HTML(resp)
titles = selector.xpath('//*[@class="f-list-item ershoufang-list"]/dl/dd/a/text()')
prices = selector.xpath('//*[@class="price"]/span[1]/text()')

# Print both lengths: zip() below stops at the shorter list, so a mismatch
# here means some titles or prices are silently left unpaired.
print("titleslen:", len(titles))
print("priceslen:", len(prices))

# NOTE: dict keys are unique, so listings that share the same title collapse
# into a single entry (the last price wins).
print(dict(zip(titles, prices)))
import requests
from lxml import etree
# Same scrape as a requests-based script: download the listing page, extract
# titles and prices with XPath, and print them pair by pair.
# A plain GET request; the timeout prevents the call from hanging forever,
# since requests applies no timeout by default.
r = requests.get(url='http://sh.ganji.com/fang1/', timeout=10)
selector = etree.HTML(r.text)
titles = selector.xpath('//*[@class="f-list-item ershoufang-list"]/dl/dd/a/text()')
prices = selector.xpath('//*[@class="price"]/span[1]/text()')

# Print both lengths: zip() below stops at the shorter list, so a mismatch
# here means some titles or prices are silently left unpaired.
print("titleslen:", len(titles))
print("priceslen:", len(prices))

# The loop body must be indented under the `for`; without the indentation the
# script fails with an IndentationError before anything runs.
for title, price in zip(titles, prices):
    print(title, price)