From 3258c995c0c1bbdadd5a84455ebea944f9b3094b Mon Sep 17 00:00:00 2001 From: Jack-Khuu Date: Thu, 20 Feb 2025 17:38:36 -0800 Subject: [PATCH 1/2] Update test-tinystories-executorch: Disable config mobile-32, fix typo --- .github/workflows/pull.yml | 13 ++++++------- 1 file changed, 6 insertions(+), 7 deletions(-) diff --git a/.github/workflows/pull.yml b/.github/workflows/pull.yml index ef98e2eda..08aef5f65 100644 --- a/.github/workflows/pull.yml +++ b/.github/workflows/pull.yml @@ -515,12 +515,11 @@ jobs: python3 torchchat.py generate --checkpoint-path ${MODEL_PATH} --temperature 0 --pte-path ${MODEL_DIR}/${MODEL_NAME}.pte echo "******************************************" - echo "*** can't test --quantize torchchat/quant_config/mobile.json ***" - echo "*** testing --quantize torchchat/quant_config/mobile-32.json ***" + echo "*** [TEST DISABLED] Can't test --quantize torchchat/quant_config/mobile.json ***" + echo "*** Testing --quantize torchchat/quant_config/mobile-32.json instead ***" echo "******************************************" - python torchchat.py export --quantize torchchat/quant_config/mobile-32.json --checkpoint-path ${MODEL_PATH} --output-pte-path ${MODEL_DIR}/${MODEL_NAME}.pte - python3 torchchat.py generate --checkpoint-path ${MODEL_PATH} --temperature 0 --pte-path ${MODEL_DIR}/${MODEL_NAME}.pte - + # python torchchat.py export --quantize torchchat/quant_config/mobile-32.json --checkpoint-path ${MODEL_PATH} --output-pte-path ${MODEL_DIR}/${MODEL_NAME}.pte + # python3 torchchat.py generate --checkpoint-path ${MODEL_PATH} --temperature 0 --pte-path ${MODEL_DIR}/${MODEL_NAME}.pte echo "******************************************" echo "******* Emb: channel-wise quantized ******" @@ -537,13 +536,13 @@ jobs: echo "******************************************" echo "**** Emb 4bit: channel-wise quantized ****" echo "******************************************" - python torchchat.py export --quant '{"embedding" : {"bitwidth": 8, "groupsize": 0}}' --checkpoint-path ${MODEL_PATH} --output-pte-path ${MODEL_DIR}/${MODEL_NAME}.pte + python torchchat.py export --quant '{"embedding" : {"bitwidth": 4, "groupsize": 0}}' --checkpoint-path ${MODEL_PATH} --output-pte-path ${MODEL_DIR}/${MODEL_NAME}.pte python3 torchchat.py generate --checkpoint-path ${MODEL_PATH} --temperature 0 --pte-path ${MODEL_DIR}/${MODEL_NAME}.pte echo "******************************************" echo "****** Emb 4bit: group-wise quantized ****" echo "******************************************" - python torchchat.py export --quant '{"embedding" : {"bitwidth": 8, "groupsize": 8}}' --checkpoint-path ${MODEL_PATH} --output-pte-path ${MODEL_DIR}/${MODEL_NAME}.pte + python torchchat.py export --quant '{"embedding" : {"bitwidth": 4, "groupsize": 8}}' --checkpoint-path ${MODEL_PATH} --output-pte-path ${MODEL_DIR}/${MODEL_NAME}.pte python3 torchchat.py generate --checkpoint-path ${MODEL_PATH} --temperature 0 --pte-path ${MODEL_DIR}/${MODEL_NAME}.pte echo "******************************************" From 56c749a7e135224cdc43efc5375c7a86c4faf9af Mon Sep 17 00:00:00 2001 From: Jack-Khuu Date: Thu, 20 Feb 2025 18:07:39 -0800 Subject: [PATCH 2/2] Disable bitwidth 4 test --- .github/workflows/pull.yml | 12 ++++++------ 1 file changed, 6 insertions(+), 6 deletions(-) diff --git a/.github/workflows/pull.yml b/.github/workflows/pull.yml index 08aef5f65..556d9e99f 100644 --- a/.github/workflows/pull.yml +++ b/.github/workflows/pull.yml @@ -534,16 +534,16 @@ jobs: python3 torchchat.py generate --checkpoint-path ${MODEL_PATH} --temperature 0 --pte-path ${MODEL_DIR}/${MODEL_NAME}.pte echo "******************************************" - echo "**** Emb 4bit: channel-wise quantized ****" + echo "**** [TEST DISABLED] Emb 4bit: channel-wise quantized ****" echo "******************************************" - python torchchat.py export --quant '{"embedding" : {"bitwidth": 4, "groupsize": 0}}' --checkpoint-path ${MODEL_PATH} --output-pte-path ${MODEL_DIR}/${MODEL_NAME}.pte - python3 torchchat.py generate --checkpoint-path ${MODEL_PATH} --temperature 0 --pte-path ${MODEL_DIR}/${MODEL_NAME}.pte + # python torchchat.py export --quant '{"embedding" : {"bitwidth": 4, "groupsize": 0}}' --checkpoint-path ${MODEL_PATH} --output-pte-path ${MODEL_DIR}/${MODEL_NAME}.pte + # python3 torchchat.py generate --checkpoint-path ${MODEL_PATH} --temperature 0 --pte-path ${MODEL_DIR}/${MODEL_NAME}.pte echo "******************************************" - echo "****** Emb 4bit: group-wise quantized ****" + echo "****** [TEST DISABLED] Emb 4bit: group-wise quantized ****" echo "******************************************" - python torchchat.py export --quant '{"embedding" : {"bitwidth": 4, "groupsize": 8}}' --checkpoint-path ${MODEL_PATH} --output-pte-path ${MODEL_DIR}/${MODEL_NAME}.pte - python3 torchchat.py generate --checkpoint-path ${MODEL_PATH} --temperature 0 --pte-path ${MODEL_DIR}/${MODEL_NAME}.pte + # python torchchat.py export --quant '{"embedding" : {"bitwidth": 4, "groupsize": 8}}' --checkpoint-path ${MODEL_PATH} --output-pte-path ${MODEL_DIR}/${MODEL_NAME}.pte + # python3 torchchat.py generate --checkpoint-path ${MODEL_PATH} --temperature 0 --pte-path ${MODEL_DIR}/${MODEL_NAME}.pte echo "******************************************" echo "******* INT8 channel-wise quantized ******"