|
马上注册,结交更多好友,享用更多功能^_^
您需要 登录 才可以下载或查看,没有账号?立即注册
x
本帖最后由 L嘉 于 2020-8-5 20:26 编辑
@Twilight6
- # -*- coding: utf-8 -*-
- from lxml import etree
- import requests
- import csv
- import time
def writecsv(item):
    """Append one row to ``ershou.csv`` in the current working directory.

    Args:
        item: Iterable of field values that make up a single CSV row.

    A row that cannot be serialised or encoded is reported on stdout with
    ``write error!`` and skipped, so one bad record does not stop the caller.
    """
    # newline='' leaves line endings to the csv module. Without it, text-mode
    # newline translation on Windows turns the writer's "\r\n" into "\r\r\n",
    # which shows up as an empty line after every row.
    with open('ershou.csv', 'a', encoding='utf-8', newline='') as f:
        writer = csv.writer(f)
        try:
            writer.writerow(item)
        except (csv.Error, UnicodeError):
            # Only serialisation/encoding failures are treated as best-effort;
            # anything else is a real bug and is allowed to propagate.
            print('write error!')
-
if __name__ == '__main__':
    # Fetch listing pages 1-75 of the ke.com second-hand housing index and
    # append one CSV row per listing (name, info, average price, total price).
    headers = {'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/81.0.4044.92 Safari/537.3'}

    start_url = 'https://cd.ke.com/ershoufang/damian/pg'
    for x in range(1, 76):
        url = start_url + str(x)
        html = requests.get(url, headers=headers)
        # Pause between requests so the site is not hit in a tight loop.
        time.sleep(3)
        selector = etree.HTML(html.text)

        # Listing entries on this page
        xiaoqulist = selector.xpath('//*[@id="beike"]/div[1]/div[4]/div[1]/div[4]/ul/li')
        for xiaoqu in xiaoqulist:
            # Property name
            mingcheng = xiaoqu.xpath('div/div[2]/div[1]/div/a/text()')

            # Property info (the second text node of the info div)
            xinxi = xiaoqu.xpath('div/div[2]/div[2]/text()')

            # Average price
            junjia = xiaoqu.xpath('div/div[2]/div[5]/div[2]/span/text()')

            # Total price. The leading '.' keeps the search inside the current
            # <li>; a bare '//' starts at the document root and would return
            # the first listing's price for every row.
            zongjia = xiaoqu.xpath('.//div/div[5]/div[@class="totalPrice"]/span/text()')

            # An <li> that lacks any of the four fields is skipped rather
            # than aborting the whole crawl with IndexError.
            if not mingcheng or len(xinxi) < 2 or not junjia or not zongjia:
                continue

            item = [mingcheng[0], xinxi[1], junjia[0], zongjia[0]]
            writecsv(item)
            print('londing:', mingcheng[0])
-
复制代码
试试看?
- # -*- coding: utf-8 -*-
- from lxml import etree
- import requests
- import csv
- import time
def writecsv(item):
    """Append one row to ``ershou.csv`` in the current working directory.

    Args:
        item: Iterable of field values that make up a single CSV row.

    Raises:
        csv.Error: If ``item`` cannot be written as a CSV row.
    """
    # newline='' leaves line endings to the csv module. Without it, text-mode
    # newline translation on Windows turns the writer's "\r\n" into "\r\r\n",
    # which shows up as an empty line after every row.
    with open('ershou.csv', 'a', encoding='utf-8', newline='') as f:
        csv.writer(f).writerow(item)
if __name__ == '__main__':
    # Fetch listing pages 1-75 of the ke.com second-hand housing index and
    # append one CSV row per listing (name, info, average price, total price).
    headers = {
        'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/81.0.4044.92 Safari/537.3',
        'referer': 'https://cd.ke.com/ershoufang/damian/pg/'}
    start_url = 'https://cd.ke.com/ershoufang/damian/pg'
    for x in range(1, 76):
        url = start_url + str(x)
        html = requests.get(url, headers=headers)
        # Pause between requests so the site is not hit in a tight loop.
        time.sleep(3)
        selector = etree.HTML(html.text)
        # Referer sent with the NEXT request.
        # NOTE(review): this is page x-1, i.e. two pages behind the next
        # page fetched -- confirm whether page x was intended.
        headers['referer'] = f'https://cd.ke.com/ershoufang/damian/pg{x-1}/'
        # Listing entries on this page
        xiaoqulist = selector.xpath('//*[@id="beike"]/div[1]/div[4]/div[1]/div[4]/ul/li')
        for xiaoqu in xiaoqulist:
            # Property name
            mingcheng = xiaoqu.xpath('div/div[2]/div[1]/div/a/text()')
            # Property info (the second text node of the info div)
            xinxi = xiaoqu.xpath('div/div[2]/div[2]/text()')
            # Average price
            junjia = xiaoqu.xpath('div/div[2]/div[5]/div[2]/span/text()')
            # Total price. The leading '.' keeps the search inside the current
            # <li>; a bare '//' starts at the document root and would return
            # the first listing's price for every row.
            zongjia = xiaoqu.xpath('.//div/div[5]/div[@class="totalPrice"]/span/text()')
            # An <li> that lacks any of the four fields is skipped rather
            # than aborting the whole crawl with IndexError.
            if not mingcheng or len(xinxi) < 2 or not junjia or not zongjia:
                continue
            item = [mingcheng[0], xinxi[1], junjia[0], zongjia[0]]
            writecsv(item)
            print('londing:', mingcheng[0])
复制代码
|
|