-
Notifications
You must be signed in to change notification settings - Fork 2
/
train-hpc.sh
41 lines (38 loc) · 1.18 KB
/
train-hpc.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
#!/bin/sh
### General options
### --- specify queue --
#BSUB -q gpuv100
### -- set the job Name --
#BSUB -J train
### -- ask for number of cores (default: 1) --
#BSUB -n 1
### -- Select the resources: 1 gpu in exclusive process mode --
#BSUB -gpu "num=1:mode=exclusive_process"
### -- set walltime limit: hh:mm -- maximum 24 hours for GPU-queues right now
#BSUB -W 24:00
# request 30GB of system-memory
#BSUB -R "rusage[mem=30GB]"
### -- set the email address --
# please uncomment the following line and put in your e-mail address,
# if you want to receive e-mail notifications on a non-default address
##BSUB -u your_email_address
### -- send notification at start --
#BSUB -B
### -- send notification at completion--
#BSUB -N
### -- Specify the output and error file. %J is the job-id --
### -- -o and -e mean append, -oo and -eo mean overwrite --
#BSUB -o training-%J.out
#BSUB -e training_%J.err
# -- end of LSF options --
# ---------------------------------------------------------------------------
# Job body: report the GPU, load the toolchain, build a virtualenv in the
# current working directory, install requirements.txt and start training.
# Every setup step aborts the job on failure so that training never starts
# against a missing module or a half-installed environment.
# ---------------------------------------------------------------------------

# Print a message on stderr and terminate the job with a non-zero status.
# Arguments: $* - text of the error message
die() {
  printf 'train-hpc: %s\n' "$*" >&2
  exit 1
}

# Log which GPU the job sees. Purely informational, so a failure here is
# deliberately not fatal.
nvidia-smi

# Load the cuda module
module load cuda/9.1 || die "could not load module cuda/9.1"

# setup python3 env
module load python3/3.6.2 || die "could not load module python3/3.6.2"

# Run pip and virtualenv through the interpreter that was just loaded
# (`python3 -m ...`). A `--user` install puts the `virtualenv` launcher in
# the per-user script directory, which is not guaranteed to be on PATH inside
# a batch job, and a bare `pip3` may belong to a different Python.
python3 -m pip install --user virtualenv || die "could not install virtualenv"
python3 -m virtualenv env || die "could not create virtualenv in ./env"
. env/bin/activate || die "could not activate ./env"
python3 -m pip install --no-cache-dir -r requirements.txt \
  || die "could not install requirements.txt"

# running script
# Last command: its exit status becomes the exit status of the job script.
python3 main.py --do-train=True