-
Notifications
You must be signed in to change notification settings - Fork 15
/
extract.py
executable file
·57 lines (40 loc) · 1.21 KB
/
extract.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
#!/usr/bin/env python
"""
Create an HDF5 file containing a subset of the datasets from an original HDF5 file.
"""
import sys
import hdf5
from parser import get_args_extract as parser
import msg
import check
def _warn_missing(missing):
    """Emit one warning per requested dataset name that was not found."""
    for key in missing:
        msg.warning("%s requested, but not found." % key)


def update_data(data, keys, skip=None):
    """Remove not requested datasets (modifies data in place).

    Keyword arguments:
    data -- dictionary with data
    keys -- user-requested keys
    skip -- the key not to delete (kept even when it is not in keys)

    Every requested key that is absent from data is reported with a warning.
    If no dataset is left after pruning, an error is reported and the
    program exits with status 1; otherwise check.get_size is called on the
    remaining data.
    """
    # Iterate over a snapshot of the keys: entries are deleted in the loop.
    for key in list(data.keys()):
        if key != skip and key not in keys:
            del data[key]

    # Pruning only removes keys that are not in `keys`, so the requested
    # names missing now are exactly the ones missing from the input.
    missing = [key for key in keys if key not in data]

    # len() rather than truthiness on purpose: only the mapping interface
    # of `data` is relied on here.
    if len(data) == 0:
        # Report the unmatched names before bailing out, so the user can
        # see why nothing was selected (e.g. a misspelled dataset name).
        _warn_missing(missing)
        msg.error("No datasets to process.")
        sys.exit(1)

    check.get_size(data)

    _warn_missing(missing)
if __name__ == '__main__':
    # Script entry point: load the input file, keep only the requested
    # datasets and write what is left to the output file.
    msg.box("HDF5 MANIPULATOR: EXTRACT")

    args = parser()
    data = hdf5.load(args.input)

    # Show what the input file contains before anything is removed.
    found_header = "The following datasets were found in %s:\n" % args.input
    print(found_header)
    msg.list_dataset(data)

    # The keys argument is a comma-separated list; surrounding whitespace
    # around each name is dropped.
    requested = []
    for name in args.keys.split(','):
        requested.append(name.strip())

    # update_data deletes the non-requested entries from `data` in place.
    update_data(data, requested)

    saved_header = "\nThe following dataset will be saved in %s:\n" % args.output
    print(saved_header)
    msg.list_dataset(data)

    hdf5.save(args.output, data)
    msg.info("Done")