"""Extract AI-related danmu (bullet comments) and export frequency tables."""

from collections import Counter
from collections.abc import Iterable

import pandas as pd


def count_ai_danmu(lines: Iterable[str], keywords: Iterable[str] = ('ai',)) -> Counter:
    """Count how often each keyword-matching danmu occurs.

    Args:
        lines: Raw danmu lines, with or without trailing line terminators.
        keywords: Substrings to look for. Matching is case-insensitive, so
            the default ``'ai'`` also matches ``'AI'``, ``'Ai'`` and ``'aI'``.

    Returns:
        A ``Counter`` mapping each matching danmu (line terminator removed)
        to its number of occurrences. Blank lines are ignored.
    """
    needles = tuple(keyword.casefold() for keyword in keywords)
    counts = Counter()
    for raw_line in lines:
        # Drop the line terminator so that a final line lacking '\n' is
        # counted together with identical earlier lines, and so exported
        # cells do not carry a stray line break.
        text = raw_line.rstrip('\r\n')
        if not text:
            continue
        folded = text.casefold()
        if any(needle in folded for needle in needles):
            counts[text] += 1
    return counts


def GetAI():
    """Read ``danmu.csv`` and write the most frequent AI-related danmu to Excel.

    Two workbooks are written to the current working directory:
    ``ai_danmu_most_common.xlsx`` with the 8 most frequent matching danmu and
    ``ai_danmu.xlsx`` with up to the 100 most frequent ones. Both have the
    columns ``弹幕`` (danmu text) and ``数量`` (count).
    """
    # 'utf-8-sig' transparently strips a leading BOM if the file has one.
    with open('danmu.csv', 'r', encoding='utf-8-sig') as f:
        ai_danmu_counter = count_ai_danmu(f)

    # Rank once; the top-8 table is a prefix of the top-100 ranking.
    ai_danmu_all = ai_danmu_counter.most_common(100)
    ai_danmu_most_common = ai_danmu_all[:8]

    columns = ['弹幕', '数量']
    exports = (
        ('ai_danmu_most_common.xlsx', ai_danmu_most_common),
        ('ai_danmu.xlsx', ai_danmu_all),
    )
    for filename, rows in exports:
        pd.DataFrame(rows, columns=columns).to_excel(filename, index=False)


if __name__ == '__main__':
    GetAI()