"""Split an annotation table into one CSV file per series ID.

The input table is expected to have exactly eight columns, in this order:
user phone number, study ID, series ID, start time, submit time, imaging
result, nodule type, and nodule type mapping.  Every row that shares a
series ID (third column) is written to ``<filepath><series ID>.csv``.
"""
import os

import numpy as np
import pandas as pd

filename = "原始数据/人工标注.xlsx"
filepath = '人工标注/'

# Alternative dataset (AI-only results); swap these in to split it instead.
# filename = "原始数据/纯AI.csv"
# filepath='纯AI/'

# Column titles written to every output file (runtime strings, kept verbatim).
OUTPUT_HEADER = ["手机号码", "检查编号", "序列编号", "开始时间", "提交时间",
                 "影像结果", "肺结节类型", "肺结节类型 - Mapping"]

# Zero-based position of the series ID column used as the grouping key.
SERIES_COLUMN = 2

# Encoding used for the CSV files this script writes.
CSV_ENCODING = 'gbk'


def load_table(path: str) -> pd.DataFrame:
    """Read the input table at *path*, treating the first row as the header.

    ``.csv`` inputs are read with ``read_csv``; anything else goes through
    ``read_excel``.  ``read_excel`` takes no ``encoding`` argument in current
    pandas (workbooks carry their own encoding), so none is passed.
    """
    if path.lower().endswith('.csv'):
        # NOTE(review): GBK is assumed for CSV input because the outputs of
        # this script are GBK -- confirm against the actual source file.
        return pd.read_csv(path, encoding=CSV_ENCODING, header=0)
    return pd.read_excel(path, header=0)


def split_by_series(df: pd.DataFrame, out_dir: str) -> list:
    """Write one CSV per distinct series ID found in *df*.

    Rows are grouped by the string form of their series ID, which is also the
    output file name, so rows for the same series end up in the same file even
    when they are not adjacent in the input.  Row order within a group and the
    order in which groups first appear are preserved.  Each file gets a fresh
    0-based index column followed by the ``OUTPUT_HEADER`` columns.

    Args:
        df: Table with exactly ``len(OUTPUT_HEADER)`` columns.
        out_dir: Directory for the output files; created if missing.

    Returns:
        Paths of the files written, in order of first appearance.

    Raises:
        ValueError: If *df* does not have the expected number of columns.
    """
    if df.shape[1] != len(OUTPUT_HEADER):
        raise ValueError(
            "expected %d columns, got %d" % (len(OUTPUT_HEADER), df.shape[1])
        )
    if df.empty:
        return []

    if out_dir:
        os.makedirs(out_dir, exist_ok=True)

    # Group on the file name itself: whatever would be written to the same
    # file must be collected together, otherwise later writes clobber earlier
    # ones.
    file_keys = df.iloc[:, SERIES_COLUMN].map(str).values

    written = []
    for series_id, rows in df.groupby(file_keys, sort=False):
        target = os.path.join(out_dir, series_id + ".csv")
        rows.reset_index(drop=True).to_csv(
            target, encoding=CSV_ENCODING, header=OUTPUT_HEADER
        )
        written.append(target)
    return written


def main() -> None:
    """Split the configured input file into per-series CSV files."""
    split_by_series(load_table(filename), filepath)


if __name__ == "__main__":
    main()