@@ -58,44 +58,44 @@ jobs:
5858 echo "******************************************"
5959 echo "******* Emb : channel-wise quantized ******"
6060 echo "******************************************"
61- python generate.py --dtype ${DTYPE} --quant '{"embedding" : {"bitwidth": 8, "group_size ": 0}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_eager
61+ python generate.py --dtype ${DTYPE} --quant '{"embedding" : {"bitwidth": 8, "groupsize ": 0}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_eager
6262 cat ./output_eager
63- python generate.py --dtype ${DTYPE} --compile --quant '{"embedding" : {"bitwidth": 8, "group_size ": 0}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_compiled
63+ python generate.py --dtype ${DTYPE} --compile --quant '{"embedding" : {"bitwidth": 8, "groupsize ": 0}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_compiled
6464 cat ./output_compiled
65- python export.py --dtype ${DTYPE} --quant '{"embedding" : {"bitwidth": 8, "group_size ": 0}}' --checkpoint-path ${MODEL_PATH} --output-dso-path ${MODEL_DIR}/${MODEL_NAME}.so
65+ python export.py --dtype ${DTYPE} --quant '{"embedding" : {"bitwidth": 8, "groupsize ": 0}}' --checkpoint-path ${MODEL_PATH} --output-dso-path ${MODEL_DIR}/${MODEL_NAME}.so
6666 python generate.py --dtype ${DTYPE} --checkpoint-path ${MODEL_PATH} --temperature 0 --dso-path ${MODEL_DIR}/${MODEL_NAME}.so > ./output_aoti
6767 cat ./output_aoti
6868
6969 echo "******************************************"
7070 echo "******** Emb : group-wise quantized *******"
7171 echo "******************************************"
72- python generate.py --dtype ${DTYPE} --quant '{"embedding" : {"bitwidth": 8, "group_size ": 8}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_eager
72+ python generate.py --dtype ${DTYPE} --quant '{"embedding" : {"bitwidth": 8, "groupsize ": 8}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_eager
7373 cat ./output_eager
74- python generate.py --dtype ${DTYPE} --compile --quant '{"embedding" : {"bitwidth": 8, "group_size ": 8}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_compiled
74+ python generate.py --dtype ${DTYPE} --compile --quant '{"embedding" : {"bitwidth": 8, "groupsize ": 8}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_compiled
7575 cat ./output_compiled
76- python export.py --dtype ${DTYPE} --quant '{"embedding" : {"bitwidth": 8, "group_size ": 8}}' --checkpoint-path ${MODEL_PATH} --output-dso-path ${MODEL_DIR}/${MODEL_NAME}.so
76+ python export.py --dtype ${DTYPE} --quant '{"embedding" : {"bitwidth": 8, "groupsize ": 8}}' --checkpoint-path ${MODEL_PATH} --output-dso-path ${MODEL_DIR}/${MODEL_NAME}.so
7777 python generate.py --dtype ${DTYPE} --checkpoint-path ${MODEL_PATH} --temperature 0 --dso-path ${MODEL_DIR}/${MODEL_NAME}.so > ./output_aoti
7878 cat ./output_aoti
7979
8080 echo "******************************************"
8181 echo "******* INT8 channel-wise quantized ******"
8282 echo "******************************************"
83- python generate.py --dtype ${DTYPE} --quant '{"linear:int8" : {"bitwidth": 8, "group_size ": 0}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_eager
83+ python generate.py --dtype ${DTYPE} --quant '{"linear:int8" : {"bitwidth": 8, "groupsize ": 0}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_eager
8484 cat ./output_eager
85- python generate.py --dtype ${DTYPE} --compile --quant '{"linear:int8" : {"bitwidth": 8, "group_size ": 0}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_compiled
85+ python generate.py --dtype ${DTYPE} --compile --quant '{"linear:int8" : {"bitwidth": 8, "groupsize ": 0}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_compiled
8686 cat ./output_compiled
87- python export.py --dtype ${DTYPE} --quant '{"linear:int8" : {"bitwidth": 8, "group_size ": 0}}' --checkpoint-path ${MODEL_PATH} --output-dso-path ${MODEL_DIR}/${MODEL_NAME}.so
87+ python export.py --dtype ${DTYPE} --quant '{"linear:int8" : {"bitwidth": 8, "groupsize ": 0}}' --checkpoint-path ${MODEL_PATH} --output-dso-path ${MODEL_DIR}/${MODEL_NAME}.so
8888 python generate.py --dtype ${DTYPE} --checkpoint-path ${MODEL_PATH} --temperature 0 --dso-path ${MODEL_DIR}/${MODEL_NAME}.so > ./output_aoti
8989 cat ./output_aoti
9090
9191 echo "******************************************"
9292 echo "******** INT8 group-wise quantized *******"
9393 echo "******************************************"
94- python generate.py --dtype ${DTYPE} --quant '{"linear:int8" : {"bitwidth": 8, "group_size ": 8}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_eager
94+ python generate.py --dtype ${DTYPE} --quant '{"linear:int8" : {"bitwidth": 8, "groupsize ": 8}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_eager
9595 cat ./output_eager
96- python generate.py --dtype ${DTYPE} --compile --quant '{"linear:int8" : {"bitwidth": 8, "group_size ": 8}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_compiled
96+ python generate.py --dtype ${DTYPE} --compile --quant '{"linear:int8" : {"bitwidth": 8, "groupsize ": 8}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_compiled
9797 cat ./output_compiled
98- python export.py --dtype ${DTYPE} --quant '{"linear:int8" : {"bitwidth": 8, "group_size ": 8}}' --checkpoint-path ${MODEL_PATH} --output-dso-path ${MODEL_DIR}/${MODEL_NAME}.so
98+ python export.py --dtype ${DTYPE} --quant '{"linear:int8" : {"bitwidth": 8, "groupsize ": 8}}' --checkpoint-path ${MODEL_PATH} --output-dso-path ${MODEL_DIR}/${MODEL_NAME}.so
9999 python generate.py --dtype ${DTYPE} --checkpoint-path ${MODEL_PATH} --temperature 0 --dso-path ${MODEL_DIR}/${MODEL_NAME}.so > ./output_aoti
100100 cat ./output_aoti
101101
@@ -106,11 +106,11 @@ jobs:
106106 DTYPE=bfloat16
107107 fi
108108
109- python generate.py --dtype ${DTYPE} --quant '{"linear:int4" : {"group_size ": 32}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_eager
109+ python generate.py --dtype ${DTYPE} --quant '{"linear:int4" : {"groupsize ": 32}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_eager
110110 cat ./output_eager
111- python generate.py --dtype ${DTYPE} --compile --quant '{"linear:int4" : {"group_size ": 32}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_compiled
111+ python generate.py --dtype ${DTYPE} --compile --quant '{"linear:int4" : {"groupsize ": 32}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_compiled
112112 cat ./output_compiled
113- python export.py --dtype ${DTYPE} --quant '{"linear:int4" : {"group_size ": 32}}' --checkpoint-path ${MODEL_PATH} --output-dso-path ${MODEL_DIR}/${MODEL_NAME}.so
113+ python export.py --dtype ${DTYPE} --quant '{"linear:int4" : {"groupsize ": 32}}' --checkpoint-path ${MODEL_PATH} --output-dso-path ${MODEL_DIR}/${MODEL_NAME}.so
114114 python generate.py --dtype ${DTYPE} --checkpoint-path ${MODEL_PATH} --temperature 0 --dso-path ${MODEL_DIR}/${MODEL_NAME}.so > ./output_aoti
115115 cat ./output_aoti
116116
0 commit comments