From 16c3c880915634c111e3d5e7a5fe1741fb1ef4d3 Mon Sep 17 00:00:00 2001
From: p5rqvkz4o <493566904@qq.com>
Date: Fri, 18 Apr 2025 08:53:45 +0800
Subject: [PATCH] =?UTF-8?q?=E8=AF=BB=E5=85=A5=E6=95=B0=E6=8D=AE=E5=B9=B6?=
 =?UTF-8?q?=E5=86=99=E5=85=A5csv=20=20=E5=9F=BA=E7=A1=80id+text?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 Code_reticent/ReadData.py | 66 +++++++++++++++++++++++++++++++++++++++
 1 file changed, 66 insertions(+)
 create mode 100644 Code_reticent/ReadData.py

diff --git a/Code_reticent/ReadData.py b/Code_reticent/ReadData.py
new file mode 100644
index 0000000..1838981
--- /dev/null
+++ b/Code_reticent/ReadData.py
@@ -0,0 +1,66 @@
+# -*- coding: utf-8 -*-
+"""
+Group "speaker : sentence" lines from the training CSV files by id and
+write them to a CSV file with the columns id,text.
+
+Created on Fri Apr 18 08:11:13 2025
+
+@author: 缄默
+"""
+import csv
+
+##################config###################
+trainDataPath = ["train1.csv","train2.csv"]
+###########################################
+
+# Maps an id (second '_'-separated piece of column 0) to the list of
+# "speaker : sentence" strings collected for it, in reading order.
+DataDic = {}
+
+
+def ReadFile(encoding=None):
+    """Load every file listed in trainDataPath into DataDic.
+
+    The first row of each file is skipped as a header. For every other
+    non-empty row, column 0 is split on '_': the second piece is the id
+    and the last piece is the speaker; column 1 is the sentence.
+
+    encoding: text encoding of the input files. None keeps the platform
+        default, which is what open(path) used before this parameter
+        existed.
+
+    Raises IndexError if a non-empty row has fewer than two columns or
+    its first column contains no '_'.
+    """
+    for path in trainDataPath:
+        # The csv module asks for newline='' so line breaks inside quoted
+        # fields are parsed correctly; the with-block closes the file.
+        with open(path, newline='', encoding=encoding) as f:
+            reader = csv.reader(f)
+            next(reader, None)  # skip the header row; no-op if file is empty
+            for row in reader:
+                if not row:
+                    continue  # csv.reader yields [] for blank lines
+                parts = row[0].split('_')
+                idx, speaker, sentence = parts[1], parts[-1], row[1]
+                DataDic.setdefault(idx, []).append(speaker + ' : ' + sentence)
+
+
+def Data2csv(path):
+    """Write DataDic to path as a UTF-8 CSV file with the columns id,text.
+
+    Each id becomes one row whose text cell holds that id's collected
+    lines joined with newline characters. Every id is written; nothing is
+    filtered out.
+    """
+    with open(path, 'w', newline='', encoding='utf-8') as f:
+        writer = csv.writer(f)
+        writer.writerow(["id", "text"])
+        # NOTE: the author left a disabled variant here that skipped ids
+        # with <=3 or >=10 collected lines; it was never active.
+        for key, lines in DataDic.items():
+            writer.writerow([key, "\n".join(lines)])
+
+
+ReadFile()
+Data2csv('./output.csv')