"""Export the most frequent AI-related danmaku (bullet comments) to Excel.

Reconstructed from a git format-patch that adds ``GetAI.py``
(commit 07056695f2e29c533899cc29ae5b4fe9445e2ea7, author phmycqkit,
2024-09-18). Original subject, translated: "Get the top 8 danmaku, by
count, related to AI technology applications".
"""

from collections import Counter
from typing import Optional

import pandas as pd

# Lowercase needles; every line is lowercased before comparison so that all
# casings ("ai", "Ai", "aI", "AI") are recognised.
# NOTE(review): this is a plain substring match, so any text that merely
# contains the letters "ai" (e.g. "said") also counts as AI-related. That
# mirrors the original behaviour; tighten it only if false positives matter.
_AI_KEYWORDS = ('ai',)


def _is_ai_related(text: str) -> bool:
    """Return True when *text* contains any AI keyword, ignoring case."""
    lowered = text.lower()
    return any(keyword in lowered for keyword in _AI_KEYWORDS)


def GetAI(
    input_path: str = 'danmu.csv',
    output_path: Optional[str] = 'ai_danmu_most_common.xlsx',
    top_n: int = 8,
) -> pd.DataFrame:
    """Count AI-related danmaku and export the most frequent ones.

    Each line of the input file is treated as one danmaku message; the file
    is read as raw text lines, not parsed as CSV columns.

    Args:
        input_path: UTF-8 (optionally BOM-prefixed) text file with one
            danmaku per line.
        output_path: Destination Excel file. Pass ``None`` to skip the
            export and only get the returned table.
        top_n: How many of the most frequent messages to keep.

    Returns:
        A DataFrame with the columns ``弹幕`` (message text) and ``数量``
        (occurrence count), ordered from most to least frequent.

    Raises:
        FileNotFoundError: If *input_path* does not exist.
    """
    # Read the danmaku file. Line terminators are stripped so that they do
    # not end up in the exported text and so that a final line without a
    # trailing newline is counted together with its identical duplicates.
    with open(input_path, 'r', encoding='utf-8-sig') as f:
        danmus = [line.rstrip('\r\n') for line in f]

    # Keep only the danmaku related to AI technology applications.
    ai_danmu = [danmu for danmu in danmus if _is_ai_related(danmu)]

    # Tally identical messages and keep the most frequent ones.
    ai_danmu_most_common = Counter(ai_danmu).most_common(top_n)

    df = pd.DataFrame(ai_danmu_most_common, columns=['弹幕', '数量'])

    # Save as an Excel file.
    if output_path is not None:
        df.to_excel(output_path, index=False)

    return df


if __name__ == '__main__':
    GetAI()