-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathdata.py
More file actions
49 lines (43 loc) · 1.29 KB
/
data.py
File metadata and controls
49 lines (43 loc) · 1.29 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
import pandas as pd
import numpy as np
# Stage 1: load the source Excel workbook, keep only its first 60 rows, and
# save that subset as the working dataset for the later steps.
# NOTE(review): the input path is absolute and machine-specific; it has to be
# adjusted before running this script anywhere else.
oridata = pd.read_excel(
    r'C:\Users\86159\Desktop\我的\科研与竞赛\大创\2021-2022\九月\20210831_医案数据.xlsx'
)
oridata = oridata.iloc[:60, :]
# Raw string: the un-prefixed literal only worked because '\d' is not a
# recognised escape, which Python reports as an invalid escape sequence.
# The resulting path value is exactly the same as before.
# to_excel is called with its defaults, so (per the pandas docs) the row
# index is written as an extra leading column of the sheet.
oridata.to_excel(r'multi_code\datasets\data_all.xlsx')
# Disabled second stage, kept as an unexecuted string literal. When enabled it
# reads data_all.xlsx back, gathers the ';'-separated tokens found in columns
# 2 and 3 into two sorted vocabularies, and saves one 0/1 matrix per column
# (rows = records, columns = vocabulary entries) to symmat.txt / medmat.txt.
#
# The literal is raw (r''') because the Windows-style paths inside contain
# '\d', '\s' and '\m', which are invalid escape sequences in a normal string
# and make Python emit a warning even though this code never runs. The path
# literals inside are raw as well, so the snippet stays warning-free if the
# surrounding quotes are removed; the path values themselves are unchanged.
# NOTE(review): the snippet rebinds the builtin name `str`; rename that
# variable if this code is ever re-enabled.
r'''
data=pd.read_excel (r'multi_code\datasets\data_all.xlsx')
data=data.iloc[:100,:]
sym=data.iloc[:,2]
med=data.iloc[:,3]
str=sym.iloc[-1]
str1=med.iloc[-1]
for i in range(len(sym)-1):
    str1=str1+';'+med.iloc[i]
    str=str+';'+sym.iloc[i]
symlis=str.split(';')
medlis=str1.split(';')
print('------symlis------')
#print(symlis)
print('------medlis------')
#print(medlis)
symlis=sorted(set(symlis))
medlis=sorted(set(medlis))
symdic=dict(zip(symlis,range(len(symlis))))
print('------symdic------')
print(symdic)
meddic=dict(zip(medlis,range(len(medlis))))
print('------meddic-----')
print(meddic)
print(len(data),len(symdic ))
symmat=np.zeros((len(data),len(symdic )))
for i in range(len(sym)):
    symf1=sym[i].split(';')
    for j in symf1:
        symmat[i][symdic[j]]=1
np.savetxt(r'multi_code\datasets\symmat.txt',symmat)
medmat=np.zeros((len(data),len(meddic )))
for i in range(len(med)):
    symf1=med[i].split(';')
    for j in symf1:
        medmat[i][meddic[j]]=1
np.savetxt(r'multi_code\datasets\medmat.txt',medmat)
print('----------done!!!!!-----------')'''