You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
p4fkfpicj/OS.ipynb

203 lines
7.0 KiB

{
"cells": [
{
"cell_type": "markdown",
"metadata": {},
"source": [
"# 定义实体类"
]
},
{
"cell_type": "code",
"execution_count": 3,
"metadata": {
"scrolled": true
},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"+++ [MyDB] delete from outsideSummary_realtime_datas\n",
"+++ save_outsideSummary_datas, data len: 1\n",
"+++ save_outsideSummary_datas is over.\n"
]
}
],
"source": [
"# 国外疫情实时概况\n",
"def OutsideSummary(dsin):\n",
" class OutsideSummary:\n",
" def __init__(self):\n",
" self.currentConfirmedCount = 0\n",
" self.confirmedCount = 0\n",
" self.suspectedCount = 0\n",
" self.curedCount = 0\n",
" self.deadCount = 0\n",
" self.suspectedIncr = 0\n",
" self.currentConfirmedIncr = 0\n",
" self.confirmedIncr = 0\n",
" self.curedIncr = 0\n",
" self.deadIncr = 0\n",
" self.updatedTime = datetime.datetime.now().strftime('%Y-%m-%d %H:%M:%S')\n",
"\n",
"\n",
" def get_info_tuple(self):\n",
" return (self.currentConfirmedCount, self.confirmedCount, self.suspectedCount, self.curedCount,\n",
" self.deadCount, self.suspectedIncr, self.currentConfirmedIncr, self.confirmedIncr, self.curedIncr,\n",
" self.deadIncr, self.updatedTime)\n",
"\n",
"\n",
" def __str__(self):\n",
" return 'currentConfirmedCount:%s, confirmedCount:%s, suspectedCount:%s, curedCount:%s, deadCount:%s, suspectedIncr:%s, currentConfirmedIncr:%s, confirmedIncr:%s, curedIncr:%s, deadIncr:%s, updatedTime:%s' % (\n",
" self.currentConfirmedCount, self.confirmedCount, self.suspectedCount, self.curedCount, self.deadCount,\n",
" self.suspectedIncr, self.currentConfirmedIncr, self.confirmedIncr, self.curedIncr, self.deadIncr, self.updatedTime)\n",
"\n",
" # 数据库实体类\n",
"\n",
" #数据库实体类\n",
" import pymysql\n",
" class MyDB:\n",
" def __init__(self, host, user, passwd, db):\n",
" self.conn = pymysql.connect(host, user, passwd, db)\n",
" self.cursor = self.conn.cursor()\n",
"\n",
"\n",
" def get_outsideSummary_list_tuple(self, outsideSummary):\n",
" info_tuple = []\n",
" info_tuple.append(outsideSummary.get_info_tuple())\n",
" return info_tuple\n",
"\n",
"\n",
" # 保存数据\n",
" def save_outsideSummary_datas(self, outsideSummary):\n",
" print('+++ [MyDB] delete from outsideSummary_realtime_datas') \n",
" self.cursor.execute('delete from outsideSummary_realtime_datas') \n",
" self.conn.commit()\n",
"\n",
" sql = 'insert into outsideSummary_realtime_datas(currentConfirmedCount,confirmedCount,suspectedCount,curedCount,deadCount,suspectedIncr,currentConfirmedIncr,confirmedIncr,curedIncr,deadIncr,updatedTime) values(%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s)'\n",
" res = self.get_outsideSummary_list_tuple(outsideSummary)\n",
" print('+++ save_outsideSummary_datas, data len: %d' % len(res))\n",
" try:\n",
" self.cursor.executemany(sql, res)\n",
" self.conn.commit()\n",
" except Exception as e:\n",
" print(e)\n",
" print('+++ save_outsideSummary_datas is over.')\n",
"\n",
"\n",
" def __del__(self):\n",
" if self.conn is not None:\n",
" self.conn.close()\n",
"\n",
" # 业务逻辑类\n",
"\n",
" #业务逻辑类\n",
" import datetime\n",
" import requests\n",
" import re\n",
" from bs4 import BeautifulSoup\n",
" import json\n",
"\n",
"\n",
"\n",
" class DataService:\n",
" def __init__(self,ds):\n",
" self.db = MyDB(host = ds[0],user = ds[1],passwd = ds[2],db = ds[3])\n",
"\n",
"\n",
" # 爬取页面\n",
" res = requests.get('https://ncov.dxy.cn/ncovh5/view/pneumonia')\n",
"\n",
" # 重新解码\n",
" res = res.content.decode('utf-8')\n",
"\n",
" # 构建soup对象\n",
" soup = BeautifulSoup(res, 'html.parser')\n",
"\n",
" # 使用soup对象查找国外疫情数据标签\n",
" tag = soup.find('script', attrs={'id': 'getStatisticsService'})\n",
"\n",
" # 转成字符串\n",
" tagstr = tag.string\n",
" # 使用正则表达式查找所有内容\n",
" result = re.findall('\\{\"currentConfirmedCount\".*?\"deadIncr\".*?\\}', tagstr)\n",
"\n",
" # 获取国外疫情数据\n",
" #print(result[0])\n",
" obj = json.loads(result[0])\n",
"\n",
"\n",
"\n",
" #print(obj)\n",
" def fetch_outside_summary(obj):\n",
" outsideSummary = OutsideSummary()\n",
" outsideSummary.currentConfirmedCount = int(obj['currentConfirmedCount'])\n",
" outsideSummary.confirmedCount = int(obj['confirmedCount'])\n",
" outsideSummary.suspectedCount = int(obj['suspectedCount'])\n",
" outsideSummary.curedCount = int(obj['curedCount'])\n",
" outsideSummary.deadCount = int(obj['deadCount'])\n",
" outsideSummary.suspectedIncr = int(obj['suspectedIncr'])\n",
" outsideSummary.currentConfirmedIncr = int(obj['currentConfirmedIncr'])\n",
" outsideSummary.confirmedIncr = int(obj['confirmedIncr'])\n",
" outsideSummary.curedIncr = int(obj['curedIncr'])\n",
" outsideSummary.deadIncr = int(obj['deadIncr'])\n",
" outsideSummary.updatedTime = datetime.datetime.now().strftime('%Y-%m-%d %H:%M:%S')\n",
" return outsideSummary\n",
"\n",
"\n",
"\n",
" # 创建Dataservice对象\n",
" ds = DataService(dsin)\n",
" outsideSummary=fetch_outside_summary(obj)\n",
" ds.db.save_outsideSummary_datas(outsideSummary)\n",
" \n",
"ds=['localhost','root','20Z00t10x28_my','covid19']\n",
"OutsideSummary(ds)\n"
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": []
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": []
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": []
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.8.3"
}
},
"nbformat": 4,
"nbformat_minor": 4
}