-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathrun_ptq_smnist_eval_lnnb.sh
109 lines (97 loc) · 5.2 KB
/
run_ptq_smnist_eval_lnnb.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
# "FP" baseline: submit eval_smnist.sh through sbatch for the
# smnist-full-ln_nb run. No *_bits / *_act_bits flags are passed here.
run_name='eval-ptq--smnist-full-ln_nb--fp'
printf '%s\n' "FP: ${run_name}"
sbatch eval_smnist.sh \
  --load_run_name=smnist-full-ln_nb \
  --batchnorm=False \
  --use_layernorm_bias=False \
  --run_name="${run_name}"
# W8A8 section header, followed by the first W8A8 submission: every *_bits and
# *_act_bits flag is set to 8, --use_qlayernorm_if_quantized is False, and
# neither --qgelu_approx nor --hard_sigmoid is passed.
run_name='eval-ptq--smnist-full-ln_nb--W8A8-gelu-sigmoid-ln'
printf '%s\n' "W8A8"
printf '%s\n' "W8A8 gelu, sigmoid, LayerNorm: ${run_name}"
sbatch eval_smnist.sh \
  --load_run_name=smnist-full-ln_nb \
  --batchnorm=False \
  --non_ssm_act_bits=8 \
  --ssm_act_bits=8 \
  --a_bits=8 \
  --b_bits=8 \
  --c_bits=8 \
  --d_bits=8 \
  --non_ssm_bits=8 \
  --use_qlayernorm_if_quantized=False \
  --use_layernorm_bias=False \
  --run_name="${run_name}"
# W8A8 with the --qgelu_approx switch added: all *_bits and *_act_bits flags
# stay at 8 and --use_qlayernorm_if_quantized stays False.
run_name='eval-ptq--smnist-full-ln_nb--W8A8-qgelu-sigmoid-ln'
printf '%s\n' "W8A8 + qgelu"
printf '%s\n' "W8A8 qgelu, sigmoid, LayerNorm: ${run_name}"
sbatch eval_smnist.sh \
  --load_run_name=smnist-full-ln_nb \
  --batchnorm=False \
  --non_ssm_act_bits=8 \
  --ssm_act_bits=8 \
  --a_bits=8 \
  --b_bits=8 \
  --c_bits=8 \
  --d_bits=8 \
  --non_ssm_bits=8 \
  --use_qlayernorm_if_quantized=False \
  --use_layernorm_bias=False \
  --qgelu_approx \
  --run_name="${run_name}"
# W8A8 with the --hard_sigmoid switch added: all *_bits and *_act_bits flags
# stay at 8 and --use_qlayernorm_if_quantized stays False.
run_name='eval-ptq--smnist-full-ln_nb--W8A8-gelu-hsigmoid-ln'
printf '%s\n' "W8A8 + hard sigmoid"
printf '%s\n' "W8A8 gelu, hard sigmoid, LayerNorm: ${run_name}"
sbatch eval_smnist.sh \
  --load_run_name=smnist-full-ln_nb \
  --batchnorm=False \
  --non_ssm_act_bits=8 \
  --ssm_act_bits=8 \
  --a_bits=8 \
  --b_bits=8 \
  --c_bits=8 \
  --d_bits=8 \
  --non_ssm_bits=8 \
  --use_qlayernorm_if_quantized=False \
  --use_layernorm_bias=False \
  --hard_sigmoid \
  --run_name="${run_name}"
# W8A8 with --use_qlayernorm_if_quantized=True: all *_bits and *_act_bits flags
# stay at 8; neither --qgelu_approx nor --hard_sigmoid is passed.
# NOTE(review): this run passes --use_layernorm_bias=True, whereas the runs
# with --use_qlayernorm_if_quantized=False pass False for the same
# smnist-full-ln_nb checkpoint — confirm this is intended.
run_name='eval-ptq--smnist-full-ln_nb--W8A8-gelu-sigmoid-qln'
printf '%s\n' "W8A8 + qlayernorm"
printf '%s\n' "W8A8 Gelu, Sigmoid, qLayerNorm: ${run_name}"
sbatch eval_smnist.sh \
  --load_run_name=smnist-full-ln_nb \
  --batchnorm=False \
  --non_ssm_act_bits=8 \
  --ssm_act_bits=8 \
  --a_bits=8 \
  --b_bits=8 \
  --c_bits=8 \
  --d_bits=8 \
  --non_ssm_bits=8 \
  --use_qlayernorm_if_quantized=True \
  --use_layernorm_bias=True \
  --run_name="${run_name}"
# W8A8 with all three switches combined: --qgelu_approx, --hard_sigmoid and
# --use_qlayernorm_if_quantized=True. All *_bits and *_act_bits flags are 8.
# The detailed label previously read "Gelu, Sigmoid, qLayerNorm", which did not
# match the flags or the run name; it now reflects what is actually submitted.
# NOTE(review): --use_layernorm_bias=True differs from the False used by the
# non-qLayerNorm runs on the same checkpoint — confirm this is intended.
run_name='eval-ptq--smnist-full-ln_nb--W8A8-qgelu-hsigmoid-qln'
printf '%s\n' "W8A8 + qgelu + hard sigmoid + qlayernorm"
printf '%s\n' "W8A8 qgelu, hard sigmoid, qLayerNorm: ${run_name}"
sbatch eval_smnist.sh \
  --load_run_name=smnist-full-ln_nb \
  --batchnorm=False \
  --non_ssm_act_bits=8 \
  --ssm_act_bits=8 \
  --a_bits=8 \
  --b_bits=8 \
  --c_bits=8 \
  --d_bits=8 \
  --non_ssm_bits=8 \
  --use_qlayernorm_if_quantized=True \
  --use_layernorm_bias=True \
  --hard_sigmoid \
  --qgelu_approx \
  --run_name="${run_name}"
#### Lower quantizations
# W4A8Wssm8: --non_ssm_bits=4 while --a_bits/--b_bits/--c_bits/--d_bits and both
# *_act_bits flags stay at 8. Runs with --hard_sigmoid, --qgelu_approx and
# --use_qlayernorm_if_quantized=True.
# The label previously read "Gelu, Sigmoid, qLayerNorm", which did not match
# the flags or the run name; it now reflects what is actually submitted.
# NOTE(review): --use_layernorm_bias=True differs from the False used by the
# non-qLayerNorm runs on the same checkpoint — confirm this is intended.
run_name='eval-ptq--smnist-full-ln_nb--W4A8Wssm8-qgelu-hsigmoid-qln'
printf '%s\n' "W4A8Wssm8 qgelu, hard sigmoid, qLayerNorm: ${run_name}"
sbatch eval_smnist.sh \
  --load_run_name=smnist-full-ln_nb \
  --batchnorm=False \
  --non_ssm_act_bits=8 \
  --ssm_act_bits=8 \
  --a_bits=8 \
  --b_bits=8 \
  --c_bits=8 \
  --d_bits=8 \
  --non_ssm_bits=4 \
  --use_qlayernorm_if_quantized=True \
  --use_layernorm_bias=True \
  --hard_sigmoid \
  --qgelu_approx \
  --run_name="${run_name}"
# W4A8Wa8: --a_bits=8 while --b_bits/--c_bits/--d_bits/--non_ssm_bits are 4;
# both *_act_bits flags stay at 8. Runs with --hard_sigmoid, --qgelu_approx and
# --use_qlayernorm_if_quantized=True.
# The label previously read "Gelu, Sigmoid, qLayerNorm", which did not match
# the flags or the run name; it now reflects what is actually submitted.
# NOTE(review): --use_layernorm_bias=True differs from the False used by the
# non-qLayerNorm runs on the same checkpoint — confirm this is intended.
run_name='eval-ptq--smnist-full-ln_nb--W4A8Wa8-qgelu-hsigmoid-qln'
printf '%s\n' "W4A8Wa8 qgelu, hard sigmoid, qLayerNorm: ${run_name}"
sbatch eval_smnist.sh \
  --load_run_name=smnist-full-ln_nb \
  --batchnorm=False \
  --non_ssm_act_bits=8 \
  --ssm_act_bits=8 \
  --a_bits=8 \
  --b_bits=4 \
  --c_bits=4 \
  --d_bits=4 \
  --non_ssm_bits=4 \
  --use_qlayernorm_if_quantized=True \
  --use_layernorm_bias=True \
  --hard_sigmoid \
  --qgelu_approx \
  --run_name="${run_name}"
# W4A8: --a_bits/--b_bits/--c_bits/--d_bits/--non_ssm_bits are all 4; both
# *_act_bits flags stay at 8. Runs with --hard_sigmoid, --qgelu_approx and
# --use_qlayernorm_if_quantized=True.
# The label previously read "Gelu, Sigmoid, qLayerNorm", which did not match
# the flags or the run name; it now reflects what is actually submitted.
# NOTE(review): --use_layernorm_bias=True differs from the False used by the
# non-qLayerNorm runs on the same checkpoint — confirm this is intended.
run_name='eval-ptq--smnist-full-ln_nb--W4A8-qgelu-hsigmoid-qln'
printf '%s\n' "W4A8 qgelu, hard sigmoid, qLayerNorm: ${run_name}"
sbatch eval_smnist.sh \
  --load_run_name=smnist-full-ln_nb \
  --batchnorm=False \
  --non_ssm_act_bits=8 \
  --ssm_act_bits=8 \
  --a_bits=4 \
  --b_bits=4 \
  --c_bits=4 \
  --d_bits=4 \
  --non_ssm_bits=4 \
  --use_qlayernorm_if_quantized=True \
  --use_layernorm_bias=True \
  --hard_sigmoid \
  --qgelu_approx \
  --run_name="${run_name}"
# W2A8Wssm8: --non_ssm_bits=2 while --a_bits/--b_bits/--c_bits/--d_bits and both
# *_act_bits flags stay at 8. Runs with --hard_sigmoid, --qgelu_approx and
# --use_qlayernorm_if_quantized=True.
# The label previously read "Gelu, Sigmoid, qLayerNorm", which did not match
# the flags or the run name; it now reflects what is actually submitted.
# NOTE(review): --use_layernorm_bias=True differs from the False used by the
# non-qLayerNorm runs on the same checkpoint — confirm this is intended.
run_name='eval-ptq--smnist-full-ln_nb--W2A8Wssm8-qgelu-hsigmoid-qln'
printf '%s\n' "W2A8Wssm8 qgelu, hard sigmoid, qLayerNorm: ${run_name}"
sbatch eval_smnist.sh \
  --load_run_name=smnist-full-ln_nb \
  --batchnorm=False \
  --non_ssm_act_bits=8 \
  --ssm_act_bits=8 \
  --a_bits=8 \
  --b_bits=8 \
  --c_bits=8 \
  --d_bits=8 \
  --non_ssm_bits=2 \
  --use_qlayernorm_if_quantized=True \
  --use_layernorm_bias=True \
  --hard_sigmoid \
  --qgelu_approx \
  --run_name="${run_name}"
# W2A8Wa8: --a_bits=8 while --b_bits/--c_bits/--d_bits/--non_ssm_bits are 2;
# both *_act_bits flags stay at 8. Runs with --hard_sigmoid, --qgelu_approx and
# --use_qlayernorm_if_quantized=True.
# The label previously read "Gelu, Sigmoid, qLayerNorm", which did not match
# the flags or the run name; it now reflects what is actually submitted.
# NOTE(review): --use_layernorm_bias=True differs from the False used by the
# non-qLayerNorm runs on the same checkpoint — confirm this is intended.
run_name='eval-ptq--smnist-full-ln_nb--W2A8Wa8-qgelu-hsigmoid-qln'
printf '%s\n' "W2A8Wa8 qgelu, hard sigmoid, qLayerNorm: ${run_name}"
sbatch eval_smnist.sh \
  --load_run_name=smnist-full-ln_nb \
  --batchnorm=False \
  --non_ssm_act_bits=8 \
  --ssm_act_bits=8 \
  --a_bits=8 \
  --b_bits=2 \
  --c_bits=2 \
  --d_bits=2 \
  --non_ssm_bits=2 \
  --use_qlayernorm_if_quantized=True \
  --use_layernorm_bias=True \
  --hard_sigmoid \
  --qgelu_approx \
  --run_name="${run_name}"
# W2A8: --a_bits/--b_bits/--c_bits/--d_bits/--non_ssm_bits are all 2; both
# *_act_bits flags stay at 8. Runs with --hard_sigmoid, --qgelu_approx and
# --use_qlayernorm_if_quantized=True.
# The label previously read "Gelu, Sigmoid, qLayerNorm", which did not match
# the flags or the run name; it now reflects what is actually submitted.
# NOTE(review): --use_layernorm_bias=True differs from the False used by the
# non-qLayerNorm runs on the same checkpoint — confirm this is intended.
run_name='eval-ptq--smnist-full-ln_nb--W2A8-qgelu-hsigmoid-qln'
printf '%s\n' "W2A8 qgelu, hard sigmoid, qLayerNorm: ${run_name}"
sbatch eval_smnist.sh \
  --load_run_name=smnist-full-ln_nb \
  --batchnorm=False \
  --non_ssm_act_bits=8 \
  --ssm_act_bits=8 \
  --a_bits=2 \
  --b_bits=2 \
  --c_bits=2 \
  --d_bits=2 \
  --non_ssm_bits=2 \
  --use_qlayernorm_if_quantized=True \
  --use_layernorm_bias=True \
  --hard_sigmoid \
  --qgelu_approx \
  --run_name="${run_name}"