python_爬蟲爬取庫房無憂網的庫房數量

原創不易,轉發請帶本文鏈接
爬蟲爬取庫房無憂網每個城市的庫房數量
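爬取前請到高德地圖找到自己城市的起始經緯度和終止經緯度,並用它們替換 count() 請求參數中的 longitudeStart、latitudeStart、longitudeEnd、latitudeEnd(同時把 city 改成自己城市的行政區劃代碼)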

import os

import requests
from utils.read_write import writeOneCSV, writeOneJSON, readJson

# This file scrapes warehouse data from the kufangwuyou.com site.

# Browser-like User-Agent header sent with every request.
headers = {
    'User-Agent': (
        'Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko)'
        ' Chrome/49.0.2623.221 Safari/537.36 SE 2.X MetaSr 1.0'
    ),
}

# Switch the working directory to the project folder at import time.
os.chdir(r'D:\project\jianguiyuan\\')

def count(district, houseType):
    """Query the warehouse count endpoint and save a non-empty result as JSON.

    Posts a query for city code ``440300`` with a fixed longitude/latitude
    window to ``/house/count``. When the response contains data, its
    ``result`` object is written to ``<json_dir><houseType>_<district>_.json``.

    Args:
        district: Area id; currently used only in the output file name.
        houseType: House-type code; sent to the API (as a string) and used
            in the output file name.

    Relies on the module-level names ``headers`` and ``json_dir``.
    """
    url = 'http://sz.kufangwuyou.com/house/count'
    data = {
        "level": 3,
        # Previously hard-coded to "5", so every house type passed in by the
        # caller fetched the same data under a different file name.
        "houseType": str(houseType),
        "city": "440300",
        "start": 0,
        "pageSize": 1000,
        "longitudeStart": 113.33913,
        "latitudeStart": 22.046212,
        "longitudeEnd": 114.83276,
        "latitudeEnd": 23.045959,
    }
    # NOTE(review): ``district`` is not part of the request payload; the API
    # field that would filter by district is not visible here -- confirm
    # whether the query should be narrowed per district.

    # A timeout keeps an unresponsive server from hanging the whole crawl.
    r = requests.post(url, headers=headers, json=data, timeout=30)
    response = r.json()

    # Tolerate error payloads that lack 'result' or 'data' instead of
    # raising KeyError.
    result = response.get('result') or {}
    if result.get('data'):
        file = f'{houseType}_{district}_.json'
        writeOneJSON(result, json_dir + file)


if __name__ == "__main__":
    # Output directory for the level-3 count results; ``count`` reads this
    # module-level name. Backslashes are escaped explicitly: the previous
    # literal relied on invalid escape sequences such as ``\d`` and ``\c``,
    # which emit a SyntaxWarning on recent Python versions.
    json_dir = 'D:\\data\\深圳政府數據\\深圳庫房數據\\count\\json\\level3\\'
    # Area list, resolved relative to the current working directory.
    child_json = 'data\\child.json'
    child = readJson(child_json)
    result = child['result']
    # One request per (house type, area) pair.
    for houseType in [1, 2, 5]:
        for one in result:
            district = one['areaId']
            # Only the top-level area id is used; nested ``one['child']``
            # entries are not crawled here.
            count(district, houseType)

如需幫忙抓取數據,請私聊我,我這裡暫時只有深圳的數據

發表評論
所有評論
還沒有人評論,想成為第一個評論的人麼? 請在上方評論欄輸入並且點擊發布.
相關文章