-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathgenerate_data_json.py
63 lines (50 loc) · 1.34 KB
/
generate_data_json.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
#!/usr/bin/python3
import os
import sys
import json
DATA_FILE_PATH = "storage/data.json"
def find_all_files_by_ext(path, ext=".py", limit=0):
    """Recursively collect files under *path* whose names end with *ext*.

    Args:
        path: Root directory handed to ``os.walk``.
        ext: Filename suffix to match (default ``".py"``).
        limit: Maximum number of paths to return. ``0`` (the default) or a
            negative value means "no limit".

    Returns:
        A list of matching paths, each built as ``os.path.join(root, name)``,
        in the order ``os.walk`` yields them.
    """
    res = []
    for root, _dirs, files in os.walk(path):
        for name in files:
            if limit > 0 and len(res) >= limit:
                # Limit reached: return right away so os.walk does not keep
                # traversing the rest of the tree for nothing.
                return res
            if name.endswith(ext):
                res.append(os.path.join(root, name))
    return res
if __name__ == "__main__":
    # Usage: <script> PATH [EXT] [LIMIT] [LANGUAGE] [CONTEXT] [QUESTION]
    #
    # Scans PATH for files ending in EXT and writes one JSON record per file
    # (language / context / question / path) to DATA_FILE_PATH.
    args = sys.argv[1:7]  # positional arguments beyond the sixth are ignored
    if not args:
        # Without a path os.walk(None) would fail with an opaque TypeError.
        sys.exit(
            "usage: %s PATH [EXT] [LIMIT] [LANGUAGE] [CONTEXT] [QUESTION]"
            % sys.argv[0]
        )

    # Pad so that every optional positional argument has a slot.
    args += [None] * (6 - len(args))
    path, ext, limit, language, context, question = args

    if ext is None:
        # Same default as find_all_files_by_ext; passing None through would
        # make str.endswith raise TypeError.
        ext = ".py"
    try:
        limit = int(limit) if limit is not None else 0
    except ValueError:
        sys.exit("LIMIT must be an integer, got %r" % limit)

    all_files = find_all_files_by_ext(path, ext, limit)

    # Make sure the output directory exists, then drop any stale output.
    # On a first run there is nothing to delete, which is not an error.
    out_dir = os.path.dirname(DATA_FILE_PATH)
    if out_dir:
        os.makedirs(out_dir, exist_ok=True)
    try:
        os.unlink(DATA_FILE_PATH)
    except FileNotFoundError:
        pass

    data_list = [
        {
            "language": language,
            "context": context,
            "question": question,
            "path": "/%s" % (file_path),
        }
        for file_path in all_files
    ]

    # "w" rather than "a": the file is always rewritten from scratch.
    with open(DATA_FILE_PATH, "w") as outfile:
        json.dump(data_list, outfile)

    print("data.json done. Found %s files" % (len(all_files)))