-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathrun_scifar_all copy.sh
31 lines (27 loc) · 1.16 KB
/
run_scifar_all copy.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
# Queue the scifar quantization runs through sbatch.
#
# Every job is handed to run_scifar.sh with the same activation flags
# (--non_ssm_act_bits=8 --ssm_act_bits=8) and the same trailing switches
# (--qgelu_approx --hard_sigmoid --batchnorm=False). Only the a/b/c/d and
# non-SSM bit widths and the run name differ between jobs.

# submit_scifar LABEL A_BITS B_BITS C_BITS D_BITS NON_SSM_BITS RUN_NAME
#   Prints LABEL on stdout, then submits one run_scifar.sh job via sbatch.
#   LABEL and RUN_NAME are passed separately because they are not always the
#   same string: several run names carry a "-lnrm" suffix the label lacks.
#   NOTE(review): the W8A8 run name has no "-lnrm" suffix although it uses the
#   same --batchnorm=False switch as the others -- confirm this is intended.
#   The function's status is the exit status of sbatch.
submit_scifar() {
  printf '%s\n' "$1"
  sbatch run_scifar.sh --non_ssm_act_bits=8 --ssm_act_bits=8 \
    --a_bits="$2" --b_bits="$3" --c_bits="$4" --d_bits="$5" \
    --non_ssm_bits="$6" \
    --qgelu_approx --hard_sigmoid --batchnorm=False \
    --run_name="$7"
}

# W8A8: every bit-width flag set to 8.
submit_scifar "scifar-W8A8" 8 8 8 8 8 "scifar-W8A8"

### Towards 4-bit weights

# W8A8 for SSM, W4A8 for non-SSM: a/b/c/d stay at 8, non-SSM drops to 4.
submit_scifar "scifar-W4A8Wssm8" 8 8 8 8 4 "scifar-W4A8Wssm8-lnrm"

# W8A8 for A, W4A8 for everything else: only a_bits stays at 8.
submit_scifar "scifar-W4A8Wa8" 8 4 4 4 4 "scifar-W4A8Wa8-lnrm"

### Towards 2-bit weights

# W8A8 for SSM, W2A8 for non-SSM: a/b/c/d stay at 8, non-SSM drops to 2.
# Open question from the original author: is this run needed at all? The
# comparison of interest is mainly recurrent vs. feedforward.
submit_scifar "scifar-W2A8Wssm8" 8 8 8 8 2 "scifar-W2A8Wssm8-lnrm"