forked from Erosinho13/LADD
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathrun.sh
executable file
·56 lines (45 loc) · 1.6 KB
/
run.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
#!/usr/bin/env bash
########################################################################################################################
#######################################
# Assign -1 to the four launch-setting globals.
# Globals:
#   device_ids, batch_size, framework, fw_task (all written)
# Arguments:
#   None
# NOTE(review): no call to this function is visible in this file.
#######################################
init() {
  fw_task=-1
  framework=-1
  batch_size=-1
  device_ids=-1
}
#######################################
# Run the assembled command from inside "${path}/src/".
# Globals:
#   path    (read) directory that contains src/
#   command (read) complete command line held as one whitespace-separated string
# Outputs:
#   Whatever the launched command prints; a diagnostic on stderr when src/
#   cannot be entered.
# Returns:
#   Exit status of the launched command. Exits the shell with status 1 when
#   the directory change fails.
#######################################
run() {
  cd "${path}"/src/ || {
    printf 'run: cannot change directory to %s/src/\n' "${path}" >&2
    exit 1
  }

  # The command is stored as a flat string, so it has to be word-split here.
  # Pathname expansion is switched off while splitting: otherwise an argument
  # containing ?, * or [ would be replaced by matching file names in src/.
  local -a argv
  local glob_was_on=1
  [[ $- == *f* ]] && glob_was_on=0
  set -f
  # shellcheck disable=SC2206  # splitting is intentional
  argv=(${command})
  if (( glob_was_on )); then
    set +f
  fi

  "${argv[@]}"
}
########################################################################################################################
# Entry point: build the torch.distributed.launch command line from the config
# file given as $1 and hand it to run().
#
# Usage: run.sh <config_path>
#
# Config format (one entry per line): `key=value` becomes `--key value`, a bare
# `key` becomes the flag `--key`. Two keys get special treatment:
#   device_ids  the first and last character of the value are dropped and the
#               rest is split on spaces; the element count is the number of
#               processes to launch (--nproc_per_node).
#   batch_size  integer-divided by the number of devices before being passed on.
# framework and fw_task are additionally remembered for the status message.
# No other config key is turned into a shell variable, so a key such as `path`
# or `command` cannot overwrite the script's own state.
path=$(pwd)
config_path="${1:-}"
if [[ -z "${config_path}" || ! -r "${config_path}" ]]; then
  printf 'Usage: %s <config_path>\n' "${0##*/}" >&2
  exit 2
fi

port=$(python get_free_port.py) || port=""
if [[ -z "${port}" ]]; then
  printf '%s: could not obtain a free port from get_free_port.py\n' "${0##*/}" >&2
  exit 1
fi

device_ids=""
device_ids_array=()
num_devices=0
batch_size=""
batch_size_index=-1
run_args=()

# `|| [[ -n "${arg}" ]]` keeps a final line that lacks a trailing newline.
while IFS="=" read -r arg value || [[ -n "${arg}" ]]; do
  # Tolerate CRLF line endings.
  arg=${arg%$'\r'}
  value=${value%$'\r'}
  [[ -n "${arg}" ]] || continue

  if [[ -z "${value}" ]]; then
    run_args+=("--${arg}")
    continue
  fi

  case "${arg}" in
    device_ids)
      if (( ${#value} < 2 )); then
        printf '%s: malformed device_ids value: %s\n' "${0##*/}" "${value}" >&2
        exit 1
      fi
      # Drop the enclosing delimiter characters, then split on spaces.
      device_ids="${value:1:${#value}-2}"
      IFS=' ' read -r -a device_ids_array <<< "${device_ids}"
      num_devices=${#device_ids_array[@]}
      run_args+=("--device_ids ${device_ids}")
      ;;
    batch_size)
      # The per-device value depends on num_devices, which may only be known
      # once the whole file is read; reserve the slot and fill it in later.
      batch_size="${value}"
      if (( batch_size_index < 0 )); then
        batch_size_index=${#run_args[@]}
        run_args+=("--batch_size")
      fi
      ;;
    *)
      case "${arg}" in
        framework) framework="${value}" ;;
        fw_task) fw_task="${value}" ;;
      esac
      run_args+=("--${arg} ${value}")
      ;;
  esac
done < "${config_path}"

if (( num_devices < 1 )); then
  printf '%s: config must define a non-empty device_ids list\n' "${0##*/}" >&2
  exit 1
fi

if (( batch_size_index >= 0 )); then
  if [[ ! "${batch_size}" =~ ^[0-9]+$ ]]; then
    printf '%s: batch_size must be a non-negative integer, got: %s\n' \
      "${0##*/}" "${batch_size}" >&2
    exit 1
  fi
  # 10# forces base 10 so a value with leading zeros is not read as octal.
  run_args[batch_size_index]="--batch_size $(( 10#${batch_size} / num_devices ))"
fi

command="python3 -W ignore -m torch.distributed.launch --nproc_per_node ${num_devices} --master_port=${port} run.py"
if (( ${#run_args[@]} > 0 )); then
  command+=" ${run_args[*]}"
fi
########################################################################################################################
echo "GPUs in usage:" "${device_ids_array[@]}"
echo "Running ${framework} ${fw_task} experiment..."
run
status=$?
echo "Done."
# Report the launched job's result to the caller instead of always returning 0.
exit "${status}"