From 08d2540a27939c0b8e4264d54abc06d1cfb08a27 Mon Sep 17 00:00:00 2001 From: boystray <67718273@qq.com> Date: Wed, 24 May 2017 23:20:00 +0800 Subject: [PATCH] Update lianjia.py MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit 链家网站上的houselist位置发生的变化,更新xpath The XPath for the houselist changed in the latest version of lianjia.com, so update the XPath. --- LianJia/LianJia/spiders/lianjia.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/LianJia/LianJia/spiders/lianjia.py b/LianJia/LianJia/spiders/lianjia.py index 5182f64..908b38d 100644 --- a/LianJia/LianJia/spiders/lianjia.py +++ b/LianJia/LianJia/spiders/lianjia.py @@ -24,7 +24,7 @@ def parse(self, response): headers = {'User-Agent': user_agent} lists = response.body.decode('utf-8') selector = etree.HTML(lists) - area_list = selector.xpath('/html/body/div[3]/div[2]/dl[2]/dd/div[1]/div/a') + area_list = selector.xpath('/html/body/div[3]/div[1]/dl[2]/dd/div[1]/div/a') for area in area_list: try: area_han = area.xpath('text()').pop() # 地点