Skip to content

Commit 012cba9

Browse files
Guang Yang, facebook-github-bot
authored and committed
Fix reporting backends and dtype to benchmark results (#6023)
Summary: A couple of minor fixes for reporting the benchmarking results: - qnn models are not reporting "backend" and "dtype" info in the benchmark_results.json (Android) - tinyllama model is not reporting "backend" and "dtype" info in the benchmark_results.json (Android) - include compute precision in the exported coreml model name - rename "llama2" to "tinyllama" to eliminate confusion (many people thought it was llama2-7b) Pull Request resolved: #6023 Reviewed By: huydhn Differential Revision: D64074262 Pulled By: guangy10 fbshipit-source-id: c6c53d004c4fb3ad410a792639af2c22a6978b67
1 parent 866b40c commit 012cba9

File tree

9 files changed

+22
-16
lines changed

9 files changed

+22
-16
lines changed

.ci/scripts/test_llama.sh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -171,7 +171,7 @@ else
171171
fi
172172

173173
# Check dtype.
174-
EXPORTED_MODEL_NAME="llama2"
174+
EXPORTED_MODEL_NAME="tinyllama_${MODE}_${DTYPE}"
175175
if [[ "${DTYPE}" == "fp16" ]]; then
176176
EXPORTED_MODEL_NAME="${EXPORTED_MODEL_NAME}_h"
177177
elif [[ "${DTYPE}" == "bf16" ]]; then

.ci/scripts/test_model.sh

Lines changed: 14 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -155,30 +155,24 @@ test_model_with_qnn() {
155155

156156
if [[ "${MODEL_NAME}" == "dl3" ]]; then
157157
EXPORT_SCRIPT=deeplab_v3
158-
EXPORTED_MODEL_NAME=dlv3_qnn.pte
159158
elif [[ "${MODEL_NAME}" == "mv3" ]]; then
160159
EXPORT_SCRIPT=mobilenet_v3
161-
EXPORTED_MODEL_NAME=mv3_qnn.pte
162160
elif [[ "${MODEL_NAME}" == "mv2" ]]; then
163161
EXPORT_SCRIPT=mobilenet_v2
164-
EXPORTED_MODEL_NAME=mv2_qnn.pte
165162
elif [[ "${MODEL_NAME}" == "ic4" ]]; then
166163
EXPORT_SCRIPT=inception_v4
167-
EXPORTED_MODEL_NAME=ic4_qnn.pte
168164
elif [[ "${MODEL_NAME}" == "ic3" ]]; then
169165
EXPORT_SCRIPT=inception_v3
170-
EXPORTED_MODEL_NAME=ic3_qnn.pte
171166
elif [[ "${MODEL_NAME}" == "vit" ]]; then
172167
EXPORT_SCRIPT=torchvision_vit
173-
EXPORTED_MODEL_NAME=vit_qnn.pte
174168
fi
175169

176170
# Use SM8450 for S22, SM8550 for S23, and SM8560 for S24
177171
# TODO(guangyang): Make QNN chipset matches the target device
178172
QNN_CHIPSET=SM8450
179173

180174
"${PYTHON_EXECUTABLE}" -m examples.qualcomm.scripts.${EXPORT_SCRIPT} -b ${CMAKE_OUTPUT_DIR} -m ${QNN_CHIPSET} --compile_only
181-
EXPORTED_MODEL=./${EXPORT_SCRIPT}/${EXPORTED_MODEL_NAME}
175+
EXPORTED_MODEL=$(find "./${EXPORT_SCRIPT}" -type f -name "${MODEL_NAME}*.pte" -print -quit)
182176
}
183177

184178
test_model_with_coreml() {
@@ -187,8 +181,20 @@ test_model_with_coreml() {
187181
exit 1
188182
fi
189183

190-
"${PYTHON_EXECUTABLE}" -m examples.apple.coreml.scripts.export --model_name="${MODEL_NAME}"
184+
DTYPE=float16
185+
186+
"${PYTHON_EXECUTABLE}" -m examples.apple.coreml.scripts.export --model_name="${MODEL_NAME}" --compute_precision "${DTYPE}"
191187
EXPORTED_MODEL=$(find "." -type f -name "${MODEL_NAME}*.pte" -print -quit)
188+
# TODO:
189+
if [ -n "$EXPORTED_MODEL" ]; then
190+
EXPORTED_MODEL_WITH_DTYPE="${EXPORTED_MODEL%.pte}_${DTYPE}.pte"
191+
mv "$EXPORTED_MODEL" "$EXPORTED_MODEL_WITH_DTYPE"
192+
EXPORTED_MODEL="$EXPORTED_MODEL_WITH_DTYPE"
193+
echo "Renamed file path: $EXPORTED_MODEL"
194+
else
195+
echo "No .pte file found"
196+
exit 1
197+
fi
192198
}
193199

194200
if [[ "${BACKEND}" == "portable" ]]; then

examples/qualcomm/scripts/deeplab_v3.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -81,7 +81,7 @@ def main(args):
8181
data_size=data_num, dataset_dir=args.artifact, download=args.download
8282
)
8383

84-
pte_filename = "dlv3_qnn"
84+
pte_filename = "dl3_qnn_q8"
8585
instance = DeepLabV3ResNet101Model()
8686

8787
build_executorch_binary(

examples/qualcomm/scripts/edsr.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -107,7 +107,7 @@ def main(args):
107107
)
108108

109109
inputs, targets, input_list = dataset.lr, dataset.hr, dataset.get_input_list()
110-
pte_filename = "edsr_qnn"
110+
pte_filename = "edsr_qnn_q8"
111111
instance = EdsrModel()
112112

113113
build_executorch_binary(

examples/qualcomm/scripts/inception_v3.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -46,7 +46,7 @@ def main(args):
4646
image_shape=(256, 256),
4747
crop_size=224,
4848
)
49-
pte_filename = "ic3_qnn"
49+
pte_filename = "ic3_qnn_q8"
5050
instance = InceptionV3Model()
5151
build_executorch_binary(
5252
instance.get_eager_model().eval(),

examples/qualcomm/scripts/inception_v4.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -45,7 +45,7 @@ def main(args):
4545
data_size=data_num,
4646
image_shape=(299, 299),
4747
)
48-
pte_filename = "ic4_qnn"
48+
pte_filename = "ic4_qnn_q8"
4949
instance = InceptionV4Model()
5050
build_executorch_binary(
5151
instance.get_eager_model().eval(),

examples/qualcomm/scripts/mobilenet_v2.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -46,7 +46,7 @@ def main(args):
4646
image_shape=(256, 256),
4747
crop_size=224,
4848
)
49-
pte_filename = "mv2_qnn"
49+
pte_filename = "mv2_qnn_q8"
5050
instance = MV2Model()
5151
build_executorch_binary(
5252
instance.get_eager_model().eval(),

examples/qualcomm/scripts/mobilenet_v3.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -45,7 +45,7 @@ def main(args):
4545
image_shape=(256, 256),
4646
crop_size=224,
4747
)
48-
pte_filename = "mv3_qnn"
48+
pte_filename = "mv3_qnn_float16"
4949
instance = MV3Model()
5050
build_executorch_binary(
5151
instance.get_eager_model().eval(),

examples/qualcomm/scripts/torchvision_vit.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -38,7 +38,7 @@ def main(args):
3838
crop_size=224,
3939
)
4040

41-
pte_filename = "vit_qnn"
41+
pte_filename = "vit_qnn_q8"
4242
instance = TorchVisionViTModel()
4343
build_executorch_binary(
4444
instance.get_eager_model().eval(),

0 commit comments

Comments
 (0)