51
51
python generate.py --checkpoint-path ${MODEL_PATH} --temperature 0 --dso-path ${MODEL_DIR}/${MODEL_NAME}.so > ./output_aoti
52
52
cat ./output_aoti
53
53
54
- # echo "******************************************"
55
- # echo "******* Emb: channel-wise quantized ******"
56
- # echo "******************************************"
54
+ echo "******************************************"
55
+ echo "******* Emb: channel-wise quantized ******"
56
+ echo "******************************************"
57
57
python generate.py --quant '{"embedding" : {"bitwidth": 8, "group_size": 0}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_eager
58
58
cat ./output_eager
59
59
python generate.py --compile --quant '{"embedding" : {"bitwidth": 8, "group_size": 0}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_compiled
@@ -62,20 +62,20 @@ jobs:
62
62
python generate.py --checkpoint-path ${MODEL_PATH} --temperature 0 --dso-path ${MODEL_DIR}/${MODEL_NAME}.so > ./output_aoti
63
63
cat ./output_aoti
64
64
65
- # echo "******************************************"
66
- # echo "******** Emb: group-wise quantized *******"
67
- # echo "******************************************"
65
+ echo "******************************************"
66
+ echo "******** Emb: group-wise quantized *******"
67
+ echo "******************************************"
68
68
python generate.py --quant '{"embedding" : {"bitwidth": 8, "group_size": 8}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_eager
69
69
cat ./output_eager
70
70
python generate.py --compile --quant '{"embedding" : {"bitwidth": 8, "group_size": 8}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_compiled
71
71
cat ./output_compiled
72
- python export.py --quant "embedding" : {"bitwidth": 8, "group_size": 8}}' --checkpoint-path ${MODEL_PATH} --output-dso-path ${MODEL_DIR}/${MODEL_NAME}.so
72
+ python export.py --quant '{ "embedding" : {"bitwidth": 8, "group_size": 8}}' --checkpoint-path ${MODEL_PATH} --output-dso-path ${MODEL_DIR}/${MODEL_NAME}.so
73
73
python generate.py --checkpoint-path ${MODEL_PATH} --temperature 0 --dso-path ${MODEL_DIR}/${MODEL_NAME}.so > ./output_aoti
74
74
cat ./output_aoti
75
75
76
- # echo "******************************************"
77
- # echo "******* INT8 channel-wise quantized ******"
78
- # echo "******************************************"
76
+ echo "******************************************"
77
+ echo "******* INT8 channel-wise quantized ******"
78
+ echo "******************************************"
79
79
python generate.py --quant '{"linear:int8" : {"bitwidth": 8, "group_size": 0}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_eager
80
80
cat ./output_eager
81
81
python generate.py --compile --quant '{"linear:int8" : {"bitwidth": 8, "group_size": 0}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_compiled
84
84
python generate.py --checkpoint-path ${MODEL_PATH} --temperature 0 --dso-path ${MODEL_DIR}/${MODEL_NAME}.so > ./output_aoti
85
85
cat ./output_aoti
86
86
87
- # echo "******************************************"
88
- # echo "******** INT8 group-wise quantized *******"
89
- # echo "******************************************"
87
+ echo "******************************************"
88
+ echo "******** INT8 group-wise quantized *******"
89
+ echo "******************************************"
90
90
python generate.py --quant '{"linear:int8" : {"bitwidth": 8, "group_size": 8}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_eager
91
91
cat ./output_eager
92
92
python generate.py --compile --quant '{"linear:int8" : {"bitwidth": 8, "group_size": 8}}' --checkpoint-path ${MODEL_PATH} --temperature 0 > ./output_compiled
95
95
python generate.py --checkpoint-path ${MODEL_PATH} --temperature 0 --dso-path ${MODEL_DIR}/${MODEL_NAME}.so > ./output_aoti
96
96
cat ./output_aoti
97
97
98
- echo "tests complete"
99
-
100
- # echo "******************************************"
98
+ echo "tests complete"
99
+ echo "******************************************"
101
100
# echo "********* EAGER vs TORCH.COMPILE *********"
102
101
# echo "******************************************"
103
102
# diff output_eager output_compiled
0 commit comments