# -*- coding: UTF-8 -*-
# Recovered from the git patch "Add getdata.py" (commit 3e05480a).
"""Query places by administrative region and append them to a CSV file.

One request URL is built per result page. Each page is fetched as JSON and
every entry of the response's ``results`` list becomes one CSV row of
(full name, uid, street id, latitude, longitude, address, telephone).
"""
import csv
import json  # not used below; retained from the original import list
import sys  # not used below; retained from the original import list
import time

# NOTE(review): the search term is appended directly to this address with no
# "?query=" separator, and the address does not look like a JSON search
# endpoint -- confirm the intended endpoint before relying on the results.
BASE_URL = 'https://mp.weixin.qq.com/s/K0u_qPFQtWuH4hk5K2xWfQ'
AK = '您申请的KEY码'  # API key placeholder ("the key you applied for")
QUERY = '避险场所'
TAG = '露天停车场'
REGION = '郑州'
PAGE_SIZE = 20
PAGE_COUNT = 20
OUTPUT_PATH = 'j_str.csv'
REQUEST_DELAY_SECONDS = 5  # pause between requests to avoid rate alarms
REQUEST_TIMEOUT_SECONDS = 30  # never wait forever on a stalled connection


def build_urls(page_count=PAGE_COUNT):
    """Return the request URLs for pages ``0 .. page_count - 1``.

    The parameters are joined by plain string concatenation, exactly as the
    original script did, except that the region parameter is spelled
    ``&region=`` (it had been corrupted to the single character ``®``).
    """
    return [
        BASE_URL + QUERY
        + '&tag=' + TAG
        + '&region=' + REGION
        + '&page_size=' + str(PAGE_SIZE)
        + '&page_num=' + str(page_num)
        + '&output=json&ak=' + AK
        for page_num in range(page_count)
    ]


def item_to_row(item):
    """Flatten one entry of the ``results`` list into a CSV row tuple.

    ``province``, ``city``, ``area``, ``name``, ``uid``, ``location`` and
    ``address`` are required (``KeyError`` if absent); ``street_id`` and
    ``telephone`` are optional and become ``None`` when missing.
    """
    full_name = item['province'] + item['city'] + item['area'] + item['name']
    uid = item['uid']
    street_id = item.get('street_id')
    location = item['location']
    return (
        full_name,
        uid,
        street_id,
        str(location['lat']),
        str(location['lng']),
        item['address'],
        item.get('telephone'),
    )


def main():
    """Fetch every page and append its rows to ``OUTPUT_PATH``."""
    # Third-party HTTP client. Imported here so the pure helpers above can
    # be imported without the package being installed.
    import requests

    # The context manager guarantees buffered rows are flushed and the file
    # is closed even if a request or a malformed response raises.
    with open(OUTPUT_PATH, 'a', newline='') as out:
        csv_write = csv.writer(out, dialect='excel')
        print(time.time())
        print('开始')
        urls = build_urls()
        print('url列表读取完成')
        for url in urls:
            time.sleep(REQUEST_DELAY_SECONDS)
            print(url)
            response = requests.get(url, timeout=REQUEST_TIMEOUT_SECONDS)
            response.raise_for_status()  # fail loudly on HTTP errors
            data = response.json()
            print(data)
            for item in data['results']:
                row = item_to_row(item)
                print(row)
                csv_write.writerow(row)
            # NOTE(review): the original nesting of the next two prints was
            # lost; they are emitted once per page here -- confirm.
            print("write over")
            print(time.time())
    print('完成')


if __name__ == '__main__':
    main()