@@ -515,12 +515,11 @@ jobs:
515
515
python3 torchchat.py generate --checkpoint-path ${MODEL_PATH} --temperature 0 --pte-path ${MODEL_DIR}/${MODEL_NAME}.pte
516
516
517
517
echo "******************************************"
518
- echo "*** can't test --quantize torchchat/quant_config/mobile.json ***"
519
- echo "*** testing --quantize torchchat/quant_config/mobile-32.json ***"
518
+ echo "*** [TEST DISABLED] Can't test --quantize torchchat/quant_config/mobile.json ***"
519
+ echo "*** Testing --quantize torchchat/quant_config/mobile-32.json instead ***"
520
520
echo "******************************************"
521
- python torchchat.py export --quantize torchchat/quant_config/mobile-32.json --checkpoint-path ${MODEL_PATH} --output-pte-path ${MODEL_DIR}/${MODEL_NAME}.pte
522
- python3 torchchat.py generate --checkpoint-path ${MODEL_PATH} --temperature 0 --pte-path ${MODEL_DIR}/${MODEL_NAME}.pte
523
-
521
+ # python torchchat.py export --quantize torchchat/quant_config/mobile-32.json --checkpoint-path ${MODEL_PATH} --output-pte-path ${MODEL_DIR}/${MODEL_NAME}.pte
522
+ # python3 torchchat.py generate --checkpoint-path ${MODEL_PATH} --temperature 0 --pte-path ${MODEL_DIR}/${MODEL_NAME}.pte
524
523
525
524
echo "******************************************"
526
525
echo "******* Emb: channel-wise quantized ******"
@@ -535,16 +534,16 @@ jobs:
535
534
python3 torchchat.py generate --checkpoint-path ${MODEL_PATH} --temperature 0 --pte-path ${MODEL_DIR}/${MODEL_NAME}.pte
536
535
537
536
echo "******************************************"
538
- echo "**** Emb 4bit: channel-wise quantized ****"
537
+ echo "**** [TEST DISABLED] Emb 4bit: channel-wise quantized ****"
539
538
echo "******************************************"
540
- python torchchat.py export --quant '{"embedding" : {"bitwidth": 8 , "groupsize": 0}}' --checkpoint-path ${MODEL_PATH} --output-pte-path ${MODEL_DIR}/${MODEL_NAME}.pte
541
- python3 torchchat.py generate --checkpoint-path ${MODEL_PATH} --temperature 0 --pte-path ${MODEL_DIR}/${MODEL_NAME}.pte
539
+ # python torchchat.py export --quant '{"embedding" : {"bitwidth": 4 , "groupsize": 0}}' --checkpoint-path ${MODEL_PATH} --output-pte-path ${MODEL_DIR}/${MODEL_NAME}.pte
540
+ # python3 torchchat.py generate --checkpoint-path ${MODEL_PATH} --temperature 0 --pte-path ${MODEL_DIR}/${MODEL_NAME}.pte
542
541
543
542
echo "******************************************"
544
- echo "****** Emb 4bit: group-wise quantized ****"
543
+ echo "****** [TEST DISABLED] Emb 4bit: group-wise quantized ****"
545
544
echo "******************************************"
546
- python torchchat.py export --quant '{"embedding" : {"bitwidth": 8 , "groupsize": 8}}' --checkpoint-path ${MODEL_PATH} --output-pte-path ${MODEL_DIR}/${MODEL_NAME}.pte
547
- python3 torchchat.py generate --checkpoint-path ${MODEL_PATH} --temperature 0 --pte-path ${MODEL_DIR}/${MODEL_NAME}.pte
545
+ # python torchchat.py export --quant '{"embedding" : {"bitwidth": 4 , "groupsize": 8}}' --checkpoint-path ${MODEL_PATH} --output-pte-path ${MODEL_DIR}/${MODEL_NAME}.pte
546
+ # python3 torchchat.py generate --checkpoint-path ${MODEL_PATH} --temperature 0 --pte-path ${MODEL_DIR}/${MODEL_NAME}.pte
548
547
549
548
echo "******************************************"
550
549
echo "******* INT8 channel-wise quantized ******"
0 commit comments