diff --git a/.github/workflows/compile.yml b/.github/workflows/compile.yml index 815dc3575..2e3d6ab1c 100644 --- a/.github/workflows/compile.yml +++ b/.github/workflows/compile.yml @@ -95,6 +95,28 @@ jobs: python generate.py --checkpoint-path ${MODEL_PATH} --temperature 0 --dso-path ${MODEL_DIR}/${MODEL_NAME}.so > ./output_aoti cat ./output_aoti + echo "******************************************" + echo "******* INT4 channel-wise quantized ******" + echo "******************************************" + python generate.py --quant '{"linear:int4" : {"bitwidth": 8, "group_size": 0}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_eager + cat ./output_eager + python generate.py --compile --quant '{"linear:int4" : {"bitwidth": 8, "group_size": 0}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_compiled + cat ./output_compiled + python export.py --quant '{"linear:int4" : {"bitwidth": 8, "group_size": 0}}' --checkpoint-path ${MODEL_PATH} --output-dso-path ${MODEL_DIR}/${MODEL_NAME}.so + python generate.py --checkpoint-path ${MODEL_PATH} --temperature 0 --dso-path ${MODEL_DIR}/${MODEL_NAME}.so > ./output_aoti + cat ./output_aoti + + echo "******************************************" + echo "******** INT4 group-wise quantized *******" + echo "******************************************" + python generate.py --quant '{"linear:int4" : {"bitwidth": 8, "group_size": 8}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_eager + cat ./output_eager + python generate.py --compile --quant '{"linear:int4" : {"bitwidth": 8, "group_size": 8}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_compiled + cat ./output_compiled + python export.py --quant '{"linear:int4" : {"bitwidth": 8, "group_size": 8}}' --checkpoint-path ${MODEL_PATH} --output-dso-path ${MODEL_DIR}/${MODEL_NAME}.so + python generate.py --checkpoint-path ${MODEL_PATH} --temperature 0 --dso-path ${MODEL_DIR}/${MODEL_NAME}.so > ./output_aoti + cat ./output_aoti + echo "tests complete" echo "******************************************" # echo "********* EAGER vs TORCH.COMPILE *********"