# Recovered from a git patch that had been flattened onto a single line.
# Original patch header, kept for provenance:
#   From 037a358fff577004c19fe6435016baa8fca32e4b Mon Sep 17 00:00:00 2001
#   From: hnu202111020211
#   Date: Fri, 31 Dec 2021 18:18:45 +0800
#   Subject: [PATCH] Update README.md
#   README.md | 47 insertions(+)
#   diff --git a/README.md b/README.md
#   index cfe1150..28d11f1 100644
#   @@ -1,2 +1,49 @@ # 1
"""Scrape the COVID-19 table from bitpush.news, save it as CSV, and chart it.

Pipeline: download the page, extract the name / case / death columns with
XPath, write them to ``content.csv``, read the file back with pandas, keep the
15 rows with the most cases (after skipping a fixed number of leading rows),
and draw a bar chart of deaths for those rows.
"""
import csv

import pandas as pd

URL = "https://www.bitpush.news/covid19/"
HEADERS = {
    "user-agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/95.0.4638.69 Safari/537.36"
}
CSV_PATH = "content.csv"
COLUMNS = ["states", "person", "death"]
ROW_XPATH = '//div[@class="table_container"]//tbody/tr'

# The original script discarded the first 101 scraped rows before ranking.
# NOTE(review): presumably those rows come from a different table on the page
# than the one being charted -- confirm against the live markup.
SKIP_ROWS = 101
TOP_N = 15


def strip_thousands(values):
    """Return *values* with thousands separators (commas) removed."""
    return [value.replace(",", "") for value in values]


def fetch_rows(url=URL, headers=HEADERS, timeout=30):
    """Download the page and return ``(state, cases, deaths)`` string tuples.

    Raises:
        requests.HTTPError: if the server answers with an error status.
        ValueError: if the response body cannot be parsed into a document.
    """
    # Imported lazily so the pure data helpers in this module remain usable
    # without the scraping stack installed.
    import requests
    from lxml import etree

    response = requests.get(url, headers=headers, timeout=timeout)
    response.raise_for_status()

    # Feed raw bytes to a parser with an explicit encoding, so decoding does
    # not depend on what requests guesses from the HTTP headers.
    parser = etree.HTMLParser(encoding="utf-8")
    doc = etree.HTML(response.content, parser=parser)
    if doc is None:
        raise ValueError(f"no parsable HTML returned by {url}")

    states = doc.xpath(ROW_XPATH + "/td/span/text()")
    person = strip_thousands(doc.xpath(ROW_XPATH + "/td[2]/text()"))
    death = strip_thousands(doc.xpath(ROW_XPATH + "/td[3]/text()"))
    # zip() stops at the shortest list, as in the original script.
    return list(zip(states, person, death))


def save_rows(rows, path=CSV_PATH):
    """Write *rows* to *path* as CSV (no header row)."""
    # newline="" is what the csv module requires to avoid blank lines between
    # rows on Windows.
    with open(path, "w", newline="", encoding="utf-8") as f:
        csv.writer(f).writerows(rows)


def select_top_states(df, skip=SKIP_ROWS, top_n=TOP_N):
    """Return the *top_n* rows with the highest ``person`` count.

    The first *skip* rows are dropped positionally; a frame shorter than
    *skip* yields an empty result instead of raising. ``person`` and ``death``
    are coerced to numbers (unparsable cells become NaN and sort last) so the
    ordering is numeric rather than lexicographic.
    """
    ranked = df.iloc[skip:].copy()
    for column in ("person", "death"):
        ranked[column] = pd.to_numeric(ranked[column], errors="coerce")
    # sort_values returns a new frame; the result must be kept.
    ranked = ranked.sort_values(by="person", ascending=False, ignore_index=True)
    return ranked.head(top_n)


def plot_deaths(df):
    """Show a bar chart of ``death`` per ``states`` for the rows in *df*."""
    import matplotlib.pyplot as plt

    # SimHei is selected so CJK labels can render.
    plt.rcParams["font.sans-serif"] = ["SimHei"]
    plt.rcParams["figure.figsize"] = (10, 5)
    plt.bar(df["states"].values, df["death"].values)
    plt.xlabel("states")
    plt.ylabel("death")
    plt.show()


def main():
    """Run the scrape -> CSV -> rank -> plot pipeline."""
    rows = fetch_rows()
    save_rows(rows)
    print(CSV_PATH)

    # Read the data back
    df = pd.read_csv(CSV_PATH, names=COLUMNS)
    print(df)

    top = select_top_states(df)
    print(top)
    plot_deaths(top)


if __name__ == "__main__":
    main()