-
Notifications
You must be signed in to change notification settings - Fork 0
/
reducer.py
117 lines (81 loc) · 3.35 KB
/
reducer.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
#!/bin/python3
"""
About this Script
* Run at the command line with the following arguments (in order):
** Desired key
** Relative path to JSON file (or files - no hard limit)
Ian Richard Ferguson | Stanford University
"""
# ---------- Imports
import os
import json
import sys
from tqdm import tqdm
# ---------- Setup
def checkCommandLine():
    """
    Confirms End User has entered valid arguments

    Expects sys.argv to hold, in order: the script name, the desired key,
    and one or more JSON file paths. Prints a message and exits with
    status 1 when the key or the JSON file is missing, or when any file
    argument does not end in ".json". Returns None when the input is valid.
    """

    ux = sys.argv

    # User didn't include key and JSON
    # (script name + key + at least one file = 3 entries minimum)
    if len(ux) < 3:
        print("\nHeck! Invalid user input\n\nYour input:\t{}\n".format(ux))
        sys.exit(1)

    # Incorrect order of arguments (JSON files come last)
    for userEntry in ux[2:]:
        # Test the extension itself - a substring test would let names
        # such as "data.json.bak" slip through
        if not userEntry.endswith(".json"):
            print("\nInvalid user entry - run python3 main.py [ KEY VALUE ] [ JSON FILE ]\n")
            sys.exit(1)
def parseUserInput():
    """
    Splits the command line into the desired key and the JSON file paths

    Validation of the arguments is expected to have happened beforehand.
    Returns a tuple of (key, files): key is the first argument after the
    script name, files is a list of every argument that follows the key
    (one or more JSON paths).
    """

    arguments = sys.argv[1:]                    # Everything after the script name
    return arguments[0], arguments[1:]          # Key comes first, JSON file(s) after
def directoryTree(KEY):
    """
    Standardized output flow for reduced JSON files
    Makes output directory AND returns string value of relative path

    KEY is used as the name of the sub-directory created under ./OUTPUT/.
    Calling this again for a directory that already exists is a no-op.
    """

    path = "./OUTPUT/{}/".format(KEY)           # Relative output path

    # Creates ./OUTPUT/ and the sub-directory in one step; exist_ok avoids
    # the check-then-create race of separate isdir()/mkdir() calls
    os.makedirs(path, exist_ok=True)

    return path
def outputName(KEYVALUE, JSON):
    """
    Returns name of output JSON file

    KEYVALUE is the key the file is being reduced to; JSON is the path of
    the incoming file. The result is the incoming file's base name without
    its extension, followed by "_<KEYVALUE>-only.json".
    """

    # basename/splitext instead of a fixed [:-5] slice and split('/'), so the
    # result does not depend on the extension length or the path separator
    filename = os.path.basename(str(JSON))      # Strip leading directory path
    stem, _ = os.path.splitext(filename)        # Isolate filename without extension

    return "{}_{}-only.json".format(stem, KEYVALUE)
def isoUSER(KEYVALUE, JSON, PATH):
    """
    Reduces JSON file down to desired key tree

    Loads the file at JSON, keeps only the value stored under KEYVALUE and
    writes it (indented by 4 spaces) to a new file inside PATH. The output
    filename comes from outputName().

    Raises KeyError when KEYVALUE is not present in the loaded JSON; no
    output file is written in that case.
    """

    newName = outputName(KEYVALUE, JSON)        # Generate output filename

    # Explicit UTF-8 so parsing does not depend on the machine's locale
    with open(JSON, encoding="utf-8") as incoming:
        contents = json.load(incoming)          # Read JSON as dictionary

    try:
        reduced = contents[KEYVALUE]            # Reduce JSON to desired key
    except KeyError:
        # Same exception type, but say which key and which file failed
        raise KeyError("Key {!r} not found in {}".format(KEYVALUE, JSON)) from None

    with open(os.path.join(PATH, newName), "w", encoding="utf-8") as outgoing:
        json.dump(reduced, outgoing, indent=4)  # Write JSON to Output dir
def main():
    """
    Script entry point

    Validates the command line, prepares the output directory for the
    requested key, then reduces each supplied JSON file in turn.
    """

    checkCommandLine()                                  # Exits early on bad input

    wanted_key, incoming_files = parseUserInput()       # Key + list of JSON paths
    out_dir = directoryTree(wanted_key)                 # Output path, created if needed

    # One pass per JSON file supplied, wrapped in a progress bar
    for json_file in tqdm(incoming_files):
        isoUSER(wanted_key, json_file, out_dir)

    print("All JSON values parsed - see {} for output\n".format(out_dir))


if __name__ == "__main__":
    main()