-
Notifications
You must be signed in to change notification settings - Fork 5
/
Copy pathbrunner.sh
executable file
·46 lines (34 loc) · 1.37 KB
/
brunner.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
#!/bin/bash
#SBATCH --gres=gpu:a40:1
# Slurm batch script: runs `python "$1" --config "$2"` (followed by any further
# command-line arguments) as a job step via srun.
#
# Usage: sbatch brunner.sh <python_script> <config> [extra args...]
#
# The --gres line above requests one GPU of type 'a40' for the job.
# Keep every '#SBATCH' line above the first executable command of the script.
#
# You can control the resources and scheduling with '#SBATCH' settings
# (see 'man sbatch' for more information on setting these parameters)
# The default partition is the 'general' partition
#SBATCH --partition=general
# The default Quality of Service is the 'short' QoS (maximum run time: 4 hours)
# Requested here: the 'medium' QoS
#SBATCH --qos=medium
# The default run (wall-clock) time is 1 minute
# Requested here: 7 hours (format: days-hours:minutes:seconds)
#SBATCH --time=00-07:00:00
# The default number of parallel tasks per job is 1
#SBATCH --ntasks=1
# Request 1 CPU per active thread of your program (assume 1 unless you specifically set this)
# The default number of CPUs per task is 1 (note: CPUs are always allocated per 2)
# Requested here: 8 CPUs for the single task
#SBATCH --cpus-per-task=8
# The default memory per node is 1024 megabytes (1GB) (for multiple tasks, specify --mem-per-cpu instead)
# Requested here: 12000 megabytes
#SBATCH --mem=12000
# Set mail type to 'END' to receive a mail when the job finishes
# Do not enable mails when submitting large numbers (>20) of jobs at once
#SBATCH --mail-type=END
# Ask Slurm to send SIGUSR1 90 seconds before the job's time limit is reached,
# to help create a checkpoint and requeue the job.
# NOTE(review): nothing in this script traps SIGUSR1; the checkpoint/requeue
# logic is presumably implemented by the launched Python program - confirm.
#SBATCH --signal=SIGUSR1@90
# ---------------------------------------------------------------------------
# Job body: load the toolchain, activate the conda environment and launch the
# requested Python program as a job step.
#
# Arguments:
#   $1   Python script ("algo") to run
#   $2   config value passed to the script as `--config`
#   $3+  additional arguments, forwarded to the script verbatim
# Environment:
#   CONDA_ENV_PATH  optional; conda environment (path or name) to activate.
#                   Takes precedence over the placeholder default below.
# Exit status:
#   2 on a usage error, 1 on a setup failure, otherwise the status of srun.
# ---------------------------------------------------------------------------

# Print an error message to stderr and abort the job.
die() {
  printf 'error: %s\n' "$*" >&2
  exit 1
}

# Refuse to run without the two mandatory arguments instead of launching
# `python "" --config ""` on an allocated GPU node.
if (( $# < 2 )); then
  printf 'usage: sbatch brunner.sh ALGO_SCRIPT CONFIG [ARGS...]\n' >&2
  exit 2
fi

algo=$1
config=$2
extra_args=("${@:3}")

# Conda environment to activate. Either replace the placeholder default on the
# next line with a real path/name, or export CONDA_ENV_PATH before submitting.
# The placeholder is quoted on purpose: left bare, bash parses the angle
# brackets as redirections and aborts with a syntax error.
conda_env="${CONDA_ENV_PATH:-<env_path_here>}"
if [[ "$conda_env" == '<'*'>' ]]; then
  die 'conda environment not configured: set CONDA_ENV_PATH or edit the placeholder in this script'
fi

# Toolchain. Stop at the first failure rather than continuing with the wrong
# CUDA/Python on PATH.
module use /opt/insy/modulefiles || die 'cannot add /opt/insy/modulefiles to the module path'
module load cuda/11.3 || die 'cannot load module cuda/11.3'
module load miniconda/3.9 || die 'cannot load module miniconda/3.9'

# Log what is about to run (printf keeps values such as "-n" intact, which
# echo would swallow as an option).
printf '%s\n' "Running Algo:" "$algo"
printf '%s\n' "With config:" "$config"
printf '%s\n' "Additional args:" "${extra_args[*]}"

source activate "$conda_env" || die "cannot activate conda environment: $conda_env"

# send all remaining arguments
srun python "$algo" --config "$config" "${extra_args[@]}"