forked from zhangj111/astnn
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathopen_data.py
More file actions
42 lines (34 loc) · 1.19 KB
/
open_data.py
File metadata and controls
42 lines (34 loc) · 1.19 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
import os
import pickle
import pandas as pd
# Input files handled by convert_all(), in processing order.
file_paths = [
    './data/ast.pkl',
    # per-split "blocks" pickles
    './data/split_data/dev/blocks.pkl',
    './data/split_data/test/blocks.pkl',
    './data/split_data/train/blocks.pkl',
    # per-split pickles named after the split itself
    './data/split_data/dev/dev.pkl',
    './data/split_data/test/test.pkl',
    './data/split_data/train/train.pkl',
]
def load_pickle_to_dataframe(file_path):
    """Unpickle the file at *file_path* with pandas and return the result.

    The file is opened here in binary mode and the open handle (not the
    path) is given to ``pd.read_pickle``; the handle is closed before
    returning.

    Args:
        file_path: Location of the pickle file to read.

    Returns:
        Whatever object ``pd.read_pickle`` reconstructs from the file
        (callers in this file treat it as a DataFrame).
    """
    # NOTE: unpickling can run arbitrary code -- only point this at
    # trusted files.
    with open(file_path, mode='rb') as handle:
        frame = pd.read_pickle(handle)
    return frame
def pkl_to_csv(path):
    """Convert the pickle at *path* to a CSV file written next to it.

    The pickle is loaded via ``load_pickle_to_dataframe`` and written with
    ``to_csv(index=False)``, so the loaded object is expected to be a
    DataFrame (or at least to provide a compatible ``to_csv``). A
    confirmation line is printed once the CSV has been written.

    Args:
        path: Path of the source pickle, normally ending in ``.pkl``.

    Returns:
        None.
    """
    df = load_pickle_to_dataframe(path)
    # Swap only the trailing extension. A plain str.replace('.pkl', '.csv')
    # would also rewrite '.pkl' inside directory names, and would leave the
    # path unchanged when '.pkl' is absent -- making to_csv overwrite the
    # source file itself.
    csv_file = os.path.splitext(path)[0] + '.csv'
    df.to_csv(csv_file, index=False)
    print(f'Successfully converted {path} to {csv_file}')
def tsv_to_csv(path):
    """Convert the tab-separated file at *path* to a CSV written next to it.

    The file is parsed with ``pd.read_csv(sep='\\t')`` and written back out
    with ``to_csv(index=False)``. A confirmation line is printed once the
    CSV has been written.

    Args:
        path: Path of the source file, normally ending in ``.tsv``.

    Returns:
        None.
    """
    df = pd.read_csv(path, sep='\t')
    # Swap only the trailing extension. A plain str.replace('.tsv', '.csv')
    # would also rewrite '.tsv' inside directory names, and would leave the
    # path unchanged when '.tsv' is absent -- making to_csv overwrite the
    # source file itself.
    csv_file = os.path.splitext(path)[0] + '.csv'
    df.to_csv(csv_file, index=False)
    print(f'Successfully converted {path} to {csv_file}')
def convert_all():
    """Convert every path listed in ``file_paths`` to CSV.

    The converter is picked from the file extension: ``.pkl`` paths go to
    ``pkl_to_csv`` (followed by an extra 'Saved csv' line), ``.tsv`` paths
    go to ``tsv_to_csv``, and any other path only gets an "unsupported"
    message printed. Paths are processed in list order.
    """
    for path in file_paths:
        if path.endswith('.pkl'):
            pkl_to_csv(path)
            print('Saved csv')
            continue

        if path.endswith('.tsv'):
            tsv_to_csv(path)
            continue

        # Neither known extension matched: report and move on.
        print(f'Unsupported file format for {path}')
# Kick off the conversion of everything in file_paths.
# NOTE(review): this call appears to sit at module top level with no
# `if __name__ == "__main__":` guard, so it would also run on import --
# confirm that is intended.
convert_all()