annotate transform_json_to_pkl.py @ 0:d133a3433309 draft default tip

Uploaded
author bebatut
date Mon, 27 Feb 2017 06:13:29 -0500
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
d133a3433309 Uploaded
bebatut
parents:
diff changeset
1 #!/usr/bin/env python
d133a3433309 Uploaded
bebatut
parents:
diff changeset
2 # -*- coding: utf-8 -*-
d133a3433309 Uploaded
bebatut
parents:
diff changeset
3
d133a3433309 Uploaded
bebatut
parents:
diff changeset
4 import argparse
d133a3433309 Uploaded
bebatut
parents:
diff changeset
5 import bz2
d133a3433309 Uploaded
bebatut
parents:
diff changeset
6 import cPickle as pickle
d133a3433309 Uploaded
bebatut
parents:
diff changeset
7 import json
d133a3433309 Uploaded
bebatut
parents:
diff changeset
8
d133a3433309 Uploaded
bebatut
parents:
diff changeset
9
d133a3433309 Uploaded
bebatut
parents:
diff changeset
def transform_json_to_pkl(args):
    """Convert a JSON metadata file into a bz2-compressed pickle.

    The JSON document read from ``args.json_input`` must hold a top-level
    ``"markers"`` mapping whose values each carry an ``"ext"`` entry. Every
    ``"ext"`` entry is converted to a ``set`` (JSON has no set type, so it
    is parsed as a list), then the whole structure is pickled with the
    highest available protocol into a bz2 archive at ``args.pkl_output``.

    Args:
        args: object exposing ``json_input`` (path of the JSON file to
            read) and ``pkl_output`` (path of the archive to write), e.g.
            an ``argparse.Namespace``.

    Raises:
        IOError / OSError: if either file cannot be opened.
        ValueError: if the input is not valid JSON.
        KeyError: if ``"markers"`` or a marker's ``"ext"`` entry is missing.
    """
    with open(args.json_input, 'r') as json_file:
        metadata = json.load(json_file)

    # Replace each marker's "ext" value by a set; duplicates collapse.
    for marker_info in metadata["markers"].values():
        marker_info["ext"] = set(marker_info["ext"])

    # The context manager closes (and thereby flushes) the archive even if
    # pickling fails, so the file handle is never leaked.
    with bz2.BZ2File(args.pkl_output, 'w') as pkl_output:
        pickle.dump(metadata, pkl_output, pickle.HIGHEST_PROTOCOL)
d133a3433309 Uploaded
bebatut
parents:
diff changeset
22
d133a3433309 Uploaded
bebatut
parents:
diff changeset
23
d133a3433309 Uploaded
bebatut
parents:
diff changeset
if __name__ == '__main__':
    # Command-line entry point: both options are mandatory and are handed
    # to transform_json_to_pkl as attributes of the parsed namespace.
    cli = argparse.ArgumentParser()
    for option in ('--json_input', '--pkl_output'):
        cli.add_argument(option, required=True)

    transform_json_to_pkl(cli.parse_args())