-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathrun_all.py
114 lines (97 loc) · 3.93 KB
/
run_all.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
# !/usr/bin/env python
# -*- coding: utf-8
#########################################################################################
#
# Break down multiprocessing jobs across sub-datasets
# example: python run_all.py -config config_sct_run_batch.yml
#
#########################################################################################
import os
import argparse
import yaml
def get_parser(mandatory=None):
"""parser function"""
parser = argparse.ArgumentParser(
description="Break down multiprocessing jobs across sub-datasets",
formatter_class=argparse.RawTextHelpFormatter,
prog=os.path.basename(__file__).strip(".py")
)
parser.add_argument(
'-config',
required=True,
help='Path to config file, which contains parameters for the command sct_run_batch.',
)
parser.add_argument(
'-job-template',
help="""Path to sbatch config file containing sbatch options preceded of #SBATCH. Example:
#SBATCH --account=def-jcohen
#SBATCH --time=0-08:00 # time (DD-HH:MM)
#SBATCH --nodes=1
#SBATCH --cpus-per-task=32 # number of OpenMP processes
#SBATCH --mem=128G
cd $SCRATCH""",
)
parser.add_argument(
'-n',
help="Break down multiprocessing jobs across sub-datasets of n subjects. Adjust 'n' based on the number of CPU cores "
"available",
type=int,
default=32
)
return parser
def yaml_parser(config_file):
"""parse config_script.yml file containing pipeline's parameters"""
with open(config_file, 'r') as config_var:
config_param = yaml.safe_load(config_var)
return config_param
# text for shell script
def bash_text(config_file, sublist, log_filename, job_template):
bash_job = """#!/bin/sh
{}
sct_run_batch -config {} -include-list {} -batch-log {}
""".format(job_template, config_file, str(sublist).replace("[", "").replace("]", "").replace("'", "").replace(",", ""), log_filename)
return bash_job
def main():
# Get parser arguments
parser = get_parser()
arguments = parser.parse_args()
config_file = os.path.abspath(os.path.expanduser(arguments.config))
# Check if sbatch config file was given with given with flag -job-template
if arguments.job_template is not None:
path_job_template = os.path.abspath(os.path.expanduser(arguments.job_template))
job_template = open(path_job_template, 'r').read()
else:
job_template = """#SBATCH --account=def-pabaua
#SBATCH --time=0-08:00 # time (DD-HH:MM)
#SBATCH --nodes=1
#SBATCH --cpus-per-task=32 # number of OpenMP processes
#SBATCH --mem=128G
"""
config_param = yaml_parser(config_file)
# get path for log file
dir_output = config_param['path_output']
path_output = os.path.abspath(os.path.expanduser(dir_output))
# Get list of subjects in path data
dir_data = config_param['path_data']
path_data = os.path.abspath(os.path.expanduser(dir_data))
list = os.listdir(path_data)
list_subjects = [subject for subject in list if "sub" in subject]
# Create X sublists of n subjects each
n = arguments.n
sublists = [list_subjects[i:i + n] for i in range(0, len(list_subjects), n)]
i = 0
# Loop across the sublists
for sublist in sublists:
i = i + 1
# Create temporary job shell script, default: job_csa_sublist_i.sh
filename = os.path.abspath(os.path.expanduser('tmp.job_csa_sublist_')) + str(i) + ".sh"
log_filename = os.path.join(path_output, "log", "log_" + os.path.basename(filename).split(".")[1] + ".txt")
# create shell script for sbatch
with open(filename, 'w+') as temp_file:
# bash content
temp_file.write(bash_text(config_file, sublist, log_filename, job_template))
temp_file.close()
# Run it
os.system('sbatch {}'.format(filename))
if __name__ == "__main__":
main()