一份完美的封装成函数的爬取并存储国内疫情概况的代码

dev_kfq
Chinaholmesfans 5 years ago
parent 1dab372b20
commit 423815b295

@ -1,12 +1,12 @@
import re
import json
import requests
import pymysql
import datetime
##################################################################################################
#爬取数据
# 国内疫情数据概况
class InsideSummary:
#######################################################################################################################
#爬取国内疫情数据概况
def InsideSummary():
class class_InsideSummary:
def __init__(self):
self.curConfirm = 0 # 现有确诊
self.curConfirmRelative = 0 # 较昨日新增确诊
@ -25,29 +25,30 @@ class InsideSummary:
self.died = 0 # 累计死亡
self.diedRelative = 0 # 较昨日累计死亡新增
self.updatedTime = 0 # 发布时间
# 数据库接口
# 返回元组
def get_inside_summary_tuple(self):
return ((self.curConfirm, self.curConfirmRelative, self.asymptomatic, self.asymptomaticRelative, \
self.unconfirmed, self.unconfirmedRelative, self.icu, self.icuRelative, self.confirmed, \
self.confirmedRelative, self.overseasInput, self.overseasInputRelative, self.cured, self.curedRelative, \
self.confirmedRelative, self.overseasInput, self.overseasInputRelative, self.cured,
self.curedRelative, \
self.died, self.diedRelative, self.updatedTime))
# 输出接口
def __str__(self):
return '%s %s %s %s %s %s %s %s %s %s %s %s %s %s %s %s %s' % (
self.curConfirm, self.curConfirmRelative, self.asymptomatic, self.asymptomaticRelative, self.unconfirmed,
self.curConfirm, self.curConfirmRelative, self.asymptomatic, self.asymptomaticRelative,
self.unconfirmed,
self.unconfirmedRelative, self.icu, self.icuRelative, self.confirmed, self.confirmedRelative,
self.overseasInput, self.overseasInputRelative, self.cured, self.curedRelative, self.died, self.diedRelative,
self.overseasInput, self.overseasInputRelative, self.cured, self.curedRelative, self.died,
self.diedRelative,
self.updatedTime)
#######################################################################################################
#业务逻辑类
# 爬取国内疫情数据
def get_text():# 爬取国内疫情数据文本
res = requests.get('https://view.inews.qq.com/g2/getOnsInfo?name=disease_h5')
#解码
res = res.content.decode('utf-8')
dict = json.loads(res) # str->dict
# 规范数据
for key in dict:
try:
@ -55,70 +56,72 @@ for key in dict:
key = key.replace('\\', '')
except:
pass
#新生成data字典
data = json.loads(dict['data'])
# 国内疫情数据实例化
# # #赋值
def fetch_inside_summary(data):
insideSummary = InsideSummary()
insideSummary.curConfirm = int(data['chinaTotal']['nowConfirm'])
insideSummary.curConfirmRelative = int(data['chinaAdd']['nowConfirm'])
insideSummary.asymptomatic = int(data['chinaTotal']['noInfect'])
insideSummary.asymptomaticRelative = int(data['chinaAdd']['noInfect'])
insideSummary.unconfirmed = int(data['chinaTotal']['suspect'])
insideSummary.unconfirmedRelative = int(data['chinaAdd']['suspect'])
insideSummary.icu = int(data['chinaTotal']['nowSevere'])
insideSummary.icuRelative = int(data['chinaAdd']['nowSevere'])
insideSummary.confirmed = int(data['chinaTotal']['confirm'])
insideSummary.updatedTime = data['lastUpdateTime']
insideSummary.confirmedRelative = int(data['chinaAdd']['confirm'])
insideSummary.overseasInput = int(data['chinaTotal']['importedCase'])
insideSummary.overseasInputRelative = int(data['chinaAdd']['importedCase'])
insideSummary.cured = int(data['chinaTotal']['heal'])
insideSummary.curedRelative = int(data['chinaAdd']['heal'])
insideSummary.died = int(data['chinaTotal']['dead'])
insideSummary.diedRelative = int(data['chinaAdd']['dead'])
return data
# 国内疫情数据赋值
def fetch_inside_summary():
dataf=get_text()
insideSummary = class_InsideSummary()
insideSummary.curConfirm = int(dataf['chinaTotal']['nowConfirm'])
insideSummary.curConfirmRelative = int(dataf['chinaAdd']['nowConfirm'])
insideSummary.asymptomatic = int(dataf['chinaTotal']['noInfect'])
insideSummary.asymptomaticRelative = int(dataf['chinaAdd']['noInfect'])
insideSummary.unconfirmed = int(dataf['chinaTotal']['suspect'])
insideSummary.unconfirmedRelative = int(dataf['chinaAdd']['suspect'])
insideSummary.icu = int(dataf['chinaTotal']['nowSevere'])
insideSummary.icuRelative = int(dataf['chinaAdd']['nowSevere'])
insideSummary.confirmed = int(dataf['chinaTotal']['confirm'])
insideSummary.updatedTime = dataf['lastUpdateTime']
insideSummary.confirmedRelative = int(dataf['chinaAdd']['confirm'])
insideSummary.overseasInput = int(dataf['chinaTotal']['importedCase'])
insideSummary.overseasInputRelative = int(dataf['chinaAdd']['importedCase'])
insideSummary.cured = int(dataf['chinaTotal']['heal'])
insideSummary.curedRelative = int(dataf['chinaAdd']['heal'])
insideSummary.died = int(dataf['chinaTotal']['dead'])
insideSummary.diedRelative = int(dataf['chinaAdd']['dead'])
return insideSummary
##########################################################################################################
#存储数据于数据库
#保存国内疫情概况数据
# 保存国内疫情概况数据
def insert(res):
# 创建连接,并且返回连接对象
conn =pymysql.connect(host='localhost',user='root',db='covid19_datas_guangxi',passwd='kfq991122',charset='utf8')
conn = pymysql.connect(host='localhost', user='root', db='covid19', passwd='kfq991122')
# 创建游标对象
cursor = conn.cursor()
date = data['lastUpdateTime'].split(' ',1)[0]
print(date)
date = data['lastUpdateTime']
sql = 'delete from home_realtime_datas where updatedTime like "%s"' % (date + '%')
print('The update was successful')
print('delete old_insidesummary_datas successful')
try:
cursor.execute(sql)
conn.commit()
except Exception as e:
print(e)
sql = 'insert into home_realtime_datas(curConfirm,curConfirmRelative,asymptomatic,asymptomaticRelative,unconfirmed,unconfirmedRelative,icu,icuRelative,confirmed,confirmedRelative,overseasInput,overseasInputRelative,cured,curedRelative,died,diedRelative,updatedTime) values(%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s)'
try:
cursor.execute(sql, res)
conn.commit()
print("+++ save_insidesummary_datas successful")
print('+++ save_outsideSummary_datas, data len: %d' % len(res))
except Exception as e:
print(e)
print('+++ save_province_datas is over.')
print('+++ save_insidesummary_datas fail.')
print('+++ save_insidesummary_datas is over.')
cursor.close()
conn.close()
insert(fetch_inside_summary(data).get_inside_summary_tuple())
########InsideSummary__main__####################
data = get_text()
insert(fetch_inside_summary().get_inside_summary_tuple())
conn = pymysql.connect('localhost','root','kfq991122','covid19_datas_guangxi')
cursor = conn.cursor()
sql = 'select * from home_realtime_datas'
cursor.execute(sql)
results = cursor.fetchall()
print(results)
InsideSummary()
Loading…
Cancel
Save