parent
cb058a7d10
commit
a744889753
@ -0,0 +1,32 @@
|
||||
import csv
|
||||
import Snt2Int
|
||||
|
||||
|
||||
# Data is currently loaded from CSV files; this module can also be imported by other scripts (like a header file).
|
||||
|
||||
##################config###################
|
||||
# CSV files that ReadFile() loads, in the order listed here.
trainDataPath = ["train1.csv","train2.csv"]
|
||||
###########################################
|
||||
# Filled by ReadFile(): maps the second '_'-separated segment of a row's first
# column to the list of that row's second-column values, in read order.
DataDic = {}
|
||||
|
||||
|
||||
def ReadFile():
    """Load every CSV listed in ``trainDataPath`` into the module-level ``DataDic``.

    The first row of each file is skipped as a header. For every remaining
    non-empty row, column 0 is split on ``'_'`` and its second segment is
    used as the grouping key; column 1 is appended to ``DataDic[key]`` in
    the order the rows are read.

    Raises:
        OSError: if a listed file cannot be opened.
        IndexError: if a non-empty row has fewer than two columns, or its
            first column contains no ``'_'``.
    """
    for path in trainDataPath:
        # newline='' is what the csv module asks for so quoted fields that
        # contain line breaks are parsed correctly; the ``with`` block makes
        # sure the handle is closed once the file has been consumed.
        # NOTE(review): the input is decoded with the platform default
        # encoding while Data2csv writes UTF-8 -- confirm the encoding of
        # the training files and pass it explicitly if it is known.
        with open(path, newline='') as f:
            reader = csv.reader(f)
            next(reader, None)  # skip the header row (no-op on an empty file)
            for row in reader:
                if not row:
                    # csv.reader yields [] for blank lines; nothing to record.
                    continue
                idx = row[0].split('_')[1]
                # The last '_' segment of column 0 (a speaker tag, judging by
                # the earlier variable name) is not stored, so it is not
                # extracted here.
                DataDic.setdefault(idx, []).append(row[1])
|
||||
|
||||
def Data2csv(path):
    """Write the grouped contents of ``DataDic`` to a CSV file at ``path``.

    The file is opened for writing as UTF-8, replacing any existing file.
    A header row ``id,text`` is written first, followed by one row per key
    of ``DataDic`` with three fields: the key, that key's sentences joined
    with newlines, and the ``Snt2Int.Snt2Int`` result for each sentence
    joined with newlines.

    Args:
        path: destination file path, passed straight to ``open``.
    """
    with open(path, 'w', newline='', encoding='utf-8') as f:
        # A single writer serves the whole file; building a new csv.writer
        # for every key was redundant work.
        writer = csv.writer(f)
        # NOTE(review): the header names two columns but every data row
        # below carries three -- confirm whether a third header is wanted.
        writer.writerow(["id", "text"])
        for key, sentences in DataDic.items():
            text = "\n".join(sentences)
            # str.join needs strings, so this presumes Snt2Int.Snt2Int
            # returns str -- TODO confirm against the Snt2Int module.
            converted = "\n".join([Snt2Int.Snt2Int(snt) for snt in sentences])
            writer.writerow([key, text, converted])
|
||||
# No __main__ guard: this runs on import as well as when executed as a script,
# filling DataDic from the files listed in trainDataPath.
ReadFile()
|
||||
# Also runs on import: dumps the grouped data to ./test_Snt2Int.csv.
Data2csv('./test_Snt2Int.csv')
|
Loading…
Reference in new issue