# -*- coding: utf-8 -*-
"""
Group CSV rows by the index embedded in their id and export one row per group.

Every data row is read as ``<id>, <text>``.  The id is split on ``_``: the
second piece is used as the group index and the last piece as the speaker
label.  All texts that share an index are collected, in read order, as
``"<speaker> : <text>"`` strings and finally written out joined by newlines.

Originally added as Code_Reticent/ReadData.py.

Created on Fri Apr 18 08:11:13 2025

@author: 缄默
"""
import csv

##################config###################
trainDataPath = ["train1.csv", "train2.csv"]
# Encoding used to read the input files.  ``None`` keeps the platform default,
# i.e. exactly what a bare ``open(path)`` does; set it to e.g. "utf-8" or
# "gbk" when the encoding of the input files is known.
trainDataEncoding = None
###########################################

# Maps group index -> list of "<speaker> : <text>" strings, in read order.
DataDic = {}


def ReadFile(paths=None):
    """Read the input CSV files and accumulate their rows into ``DataDic``.

    The first row of every file is treated as a header and skipped.  Blank
    rows are ignored.  Results are appended to the module-level ``DataDic``,
    so calling this function twice adds every row twice.

    Args:
        paths: Iterable of CSV file paths to read.  Defaults to the
            module-level ``trainDataPath`` when omitted or ``None``.

    Raises:
        OSError: If one of the files cannot be opened.
        IndexError: If a non-blank row has fewer than two columns, or its
            first column contains no ``_`` separator.
    """
    if paths is None:
        paths = trainDataPath

    for path in paths:
        # ``with`` closes the handle (the bare ``open`` used before leaked
        # it); ``newline=''`` is what the csv module requires so that quoted
        # fields containing line breaks are parsed correctly.
        with open(path, newline='', encoding=trainDataEncoding) as f:
            reader = csv.reader(f)
            next(reader, None)  # skip the header row; no-op on an empty file
            for row in reader:
                if not row:
                    # csv.reader yields [] for blank lines (e.g. a trailing
                    # empty line); there is nothing to index into.
                    continue
                parts = row[0].split('_')
                idx, speaker, sentence = parts[1], parts[-1], row[1]
                DataDic.setdefault(idx, []).append(speaker + ' : ' + sentence)


def Data2csv(path):
    """Write the contents of ``DataDic`` to ``path`` as a UTF-8 CSV file.

    The file gets an ``id,text`` header followed by one row per key of
    ``DataDic``; the text column is that key's entries joined with ``"\\n"``.
    An existing file at ``path`` is overwritten.

    Args:
        path: Destination file path.

    Raises:
        OSError: If the file cannot be opened for writing.
    """
    # NOTE: an earlier draft skipped groups with <= 3 or >= 10 entries; that
    # filter was disabled in the original, so every group is written.
    with open(path, 'w', newline='', encoding='utf-8') as f:
        writer = csv.writer(f)  # one writer is enough for the whole file
        writer.writerow(["id", "text"])
        writer.writerows(
            [idx, "\n".join(entries)] for idx, entries in DataDic.items()
        )


# Runs on import as well as when executed as a script, as in the original.
# NOTE(review): consider moving these two calls under
# ``if __name__ == "__main__":`` once it is confirmed that no importer relies
# on ``DataDic`` being populated at import time.
ReadFile()
Data2csv('./output.csv')