generated from Lightning-AI/deep-learning-project-template
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathrun.sh
43 lines (41 loc) · 1.28 KB
/
run.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
#!/bin/sh
### LSF batch job script. The "#BSUB" comment lines in this header are the
### scheduler options for the job; the shell commands after the
### "end of LSF options" marker are the job itself.
### General options
### -- specify queue --
#BSUB -q gpuv100
### -- set the job Name --
#BSUB -J test_stl10
### -- ask for number of cores (default: 1) --
#BSUB -n 4
### -- keep all requested cores on a single host --
#BSUB -R "span[hosts=1]"
### -- Select the resources: 1 gpu in exclusive process mode --
#BSUB -gpu "num=1:mode=exclusive_process"
### -- set walltime limit: hh:mm -- maximum 24 hours for GPU-queues right now
#BSUB -W 24:00
### -- request 6GB of system memory (must match the rusage value below) --
### NOTE(review): whether this amount is per core or per job depends on the
### cluster's LSF configuration -- confirm.
#BSUB -R "rusage[mem=6GB]"
### -- set the email address --
### NOTE(review): the address below looks like a redacted placeholder --
### replace it with a real address before submitting.
#BSUB -u [email protected]
### -- send notification at start --
#BSUB -B
### -- send notification at completion --
#BSUB -N
### -- Specify the output and error file. %J is the job-id --
### -- -o and -e mean append, -oo and -eo mean overwrite --
### NOTE(review): presumably sggm/job_logs/ has to exist before the job is
### submitted -- confirm.
#BSUB -o sggm/job_logs/gpu-%J.out
#BSUB -e sggm/job_logs/gpu-%J.err
### -- end of LSF options --
# Record the GPU state in the job log; purely diagnostic, so its exit status
# is deliberately not checked.
nvidia-smi

# Toolchain: drop the python 2 module, then load python 3, CUDA and cuDNN.
module unload python/2.7.13_ucs4
module load python3/3.7.7
module load cuda/10.2
module load cudnn/v7.6.5.32-prod-cuda-10.2

# ENV: create (or reuse) the virtualenv in ./env and install the project
# requirements into it. Each step aborts the job on failure so the training
# run never starts with the wrong interpreter or with missing dependencies.
python3 -m venv env || {
  echo "run.sh: could not create virtualenv 'env'" >&2
  exit 1
}
# `.` is the POSIX spelling of `source`; the script runs under #!/bin/sh,
# where `source` is not guaranteed to exist.
. env/bin/activate || {
  echo "run.sh: could not activate virtualenv 'env'" >&2
  exit 1
}
python3 -m pip install -r requirements.txt || {
  echo "run.sh: pip install of requirements.txt failed" >&2
  exit 1
}
export PYTHONIOENCODING=utf8

# Our model run. This is the last command, so its exit status becomes the
# exit status of the job.
cd sggm/ && python experiment.py --experiments_config configs/debug_local.yml --gpus -1

# Baselines run (alternative to the model run above; enable only one of them,
# since both start with `cd sggm/`).
# cd sggm/ && python baselines/run.py --experiment_name uci_carbon --n_trials 20