@@ -58,44 +58,44 @@ jobs:
58
58
echo "******************************************"
59
59
echo "******* Emb : channel-wise quantized ******"
60
60
echo "******************************************"
61
- python generate.py --dtype ${DTYPE} --quant '{"embedding" : {"bitwidth": 8, "group_size ": 0}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_eager
61
+ python generate.py --dtype ${DTYPE} --quant '{"embedding" : {"bitwidth": 8, "groupsize ": 0}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_eager
62
62
cat ./output_eager
63
- python generate.py --dtype ${DTYPE} --compile --quant '{"embedding" : {"bitwidth": 8, "group_size ": 0}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_compiled
63
+ python generate.py --dtype ${DTYPE} --compile --quant '{"embedding" : {"bitwidth": 8, "groupsize ": 0}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_compiled
64
64
cat ./output_compiled
65
- python export.py --dtype ${DTYPE} --quant '{"embedding" : {"bitwidth": 8, "group_size ": 0}}' --checkpoint-path ${MODEL_PATH} --output-dso-path ${MODEL_DIR}/${MODEL_NAME}.so
65
+ python export.py --dtype ${DTYPE} --quant '{"embedding" : {"bitwidth": 8, "groupsize ": 0}}' --checkpoint-path ${MODEL_PATH} --output-dso-path ${MODEL_DIR}/${MODEL_NAME}.so
66
66
python generate.py --dtype ${DTYPE} --checkpoint-path ${MODEL_PATH} --temperature 0 --dso-path ${MODEL_DIR}/${MODEL_NAME}.so > ./output_aoti
67
67
cat ./output_aoti
68
68
69
69
echo "******************************************"
70
70
echo "******** Emb : group-wise quantized *******"
71
71
echo "******************************************"
72
- python generate.py --dtype ${DTYPE} --quant '{"embedding" : {"bitwidth": 8, "group_size ": 8}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_eager
72
+ python generate.py --dtype ${DTYPE} --quant '{"embedding" : {"bitwidth": 8, "groupsize ": 8}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_eager
73
73
cat ./output_eager
74
- python generate.py --dtype ${DTYPE} --compile --quant '{"embedding" : {"bitwidth": 8, "group_size ": 8}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_compiled
74
+ python generate.py --dtype ${DTYPE} --compile --quant '{"embedding" : {"bitwidth": 8, "groupsize ": 8}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_compiled
75
75
cat ./output_compiled
76
- python export.py --dtype ${DTYPE} --quant '{"embedding" : {"bitwidth": 8, "group_size ": 8}}' --checkpoint-path ${MODEL_PATH} --output-dso-path ${MODEL_DIR}/${MODEL_NAME}.so
76
+ python export.py --dtype ${DTYPE} --quant '{"embedding" : {"bitwidth": 8, "groupsize ": 8}}' --checkpoint-path ${MODEL_PATH} --output-dso-path ${MODEL_DIR}/${MODEL_NAME}.so
77
77
python generate.py --dtype ${DTYPE} --checkpoint-path ${MODEL_PATH} --temperature 0 --dso-path ${MODEL_DIR}/${MODEL_NAME}.so > ./output_aoti
78
78
cat ./output_aoti
79
79
80
80
echo "******************************************"
81
81
echo "******* INT8 channel-wise quantized ******"
82
82
echo "******************************************"
83
- python generate.py --dtype ${DTYPE} --quant '{"linear:int8" : {"bitwidth": 8, "group_size ": 0}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_eager
83
+ python generate.py --dtype ${DTYPE} --quant '{"linear:int8" : {"bitwidth": 8, "groupsize ": 0}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_eager
84
84
cat ./output_eager
85
- python generate.py --dtype ${DTYPE} --compile --quant '{"linear:int8" : {"bitwidth": 8, "group_size ": 0}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_compiled
85
+ python generate.py --dtype ${DTYPE} --compile --quant '{"linear:int8" : {"bitwidth": 8, "groupsize ": 0}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_compiled
86
86
cat ./output_compiled
87
- python export.py --dtype ${DTYPE} --quant '{"linear:int8" : {"bitwidth": 8, "group_size ": 0}}' --checkpoint-path ${MODEL_PATH} --output-dso-path ${MODEL_DIR}/${MODEL_NAME}.so
87
+ python export.py --dtype ${DTYPE} --quant '{"linear:int8" : {"bitwidth": 8, "groupsize ": 0}}' --checkpoint-path ${MODEL_PATH} --output-dso-path ${MODEL_DIR}/${MODEL_NAME}.so
88
88
python generate.py --dtype ${DTYPE} --checkpoint-path ${MODEL_PATH} --temperature 0 --dso-path ${MODEL_DIR}/${MODEL_NAME}.so > ./output_aoti
89
89
cat ./output_aoti
90
90
91
91
echo "******************************************"
92
92
echo "******** INT8 group-wise quantized *******"
93
93
echo "******************************************"
94
- python generate.py --dtype ${DTYPE} --quant '{"linear:int8" : {"bitwidth": 8, "group_size ": 8}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_eager
94
+ python generate.py --dtype ${DTYPE} --quant '{"linear:int8" : {"bitwidth": 8, "groupsize ": 8}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_eager
95
95
cat ./output_eager
96
- python generate.py --dtype ${DTYPE} --compile --quant '{"linear:int8" : {"bitwidth": 8, "group_size ": 8}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_compiled
96
+ python generate.py --dtype ${DTYPE} --compile --quant '{"linear:int8" : {"bitwidth": 8, "groupsize ": 8}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_compiled
97
97
cat ./output_compiled
98
- python export.py --dtype ${DTYPE} --quant '{"linear:int8" : {"bitwidth": 8, "group_size ": 8}}' --checkpoint-path ${MODEL_PATH} --output-dso-path ${MODEL_DIR}/${MODEL_NAME}.so
98
+ python export.py --dtype ${DTYPE} --quant '{"linear:int8" : {"bitwidth": 8, "groupsize ": 8}}' --checkpoint-path ${MODEL_PATH} --output-dso-path ${MODEL_DIR}/${MODEL_NAME}.so
99
99
python generate.py --dtype ${DTYPE} --checkpoint-path ${MODEL_PATH} --temperature 0 --dso-path ${MODEL_DIR}/${MODEL_NAME}.so > ./output_aoti
100
100
cat ./output_aoti
101
101
@@ -106,11 +106,11 @@ jobs:
106
106
DTYPE=bfloat16
107
107
fi
108
108
109
- python generate.py --dtype ${DTYPE} --quant '{"linear:int4" : {"group_size ": 32}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_eager
109
+ python generate.py --dtype ${DTYPE} --quant '{"linear:int4" : {"groupsize ": 32}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_eager
110
110
cat ./output_eager
111
- python generate.py --dtype ${DTYPE} --compile --quant '{"linear:int4" : {"group_size ": 32}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_compiled
111
+ python generate.py --dtype ${DTYPE} --compile --quant '{"linear:int4" : {"groupsize ": 32}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_compiled
112
112
cat ./output_compiled
113
- python export.py --dtype ${DTYPE} --quant '{"linear:int4" : {"group_size ": 32}}' --checkpoint-path ${MODEL_PATH} --output-dso-path ${MODEL_DIR}/${MODEL_NAME}.so
113
+ python export.py --dtype ${DTYPE} --quant '{"linear:int4" : {"groupsize ": 32}}' --checkpoint-path ${MODEL_PATH} --output-dso-path ${MODEL_DIR}/${MODEL_NAME}.so
114
114
python generate.py --dtype ${DTYPE} --checkpoint-path ${MODEL_PATH} --temperature 0 --dso-path ${MODEL_DIR}/${MODEL_NAME}.so > ./output_aoti
115
115
cat ./output_aoti
116
116
0 commit comments