Commit f812d59

[ExecuTorch] Allow setting dtype to bf16 in export_llama
Pull Request resolved: #4985

Support creating bf16 PTEs.

ghstack-source-id: 240577203
@exported-using-ghexport

Differential Revision: [D61981363](https://our.internmc.facebook.com/intern/diff/D61981363/)
Parent: 248e33c

File tree: 2 files changed (+3 lines, -2 lines)

examples/models/llama2/export_llama_lib.py

Lines changed: 2 additions & 2 deletions
```diff
@@ -256,9 +256,9 @@ def build_args_parser() -> argparse.ArgumentParser:
         "--dtype-override",
         default="fp32",
         type=str,
-        choices=["fp32", "fp16"],
+        choices=["fp32", "fp16", "bf16"],
         help="Override the dtype of the model (default is the checkpoint dtype)."
-        "Options: fp32, fp16. Please be aware that only some backends support fp16.",
+        "Options: fp32, fp16, bf16. Please be aware that only some backends support fp16 and bf16.",
     )
 
     parser.add_argument(
```
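To illustrate the effect of the new choice, here is a minimal, self-contained argparse sketch that mirrors only the changed lines; the rest of `build_args_parser` is not reproduced, and the parse call at the bottom is purely illustrative:

```python
import argparse

parser = argparse.ArgumentParser()
parser.add_argument(
    "--dtype-override",
    default="fp32",
    type=str,
    choices=["fp32", "fp16", "bf16"],
    help="Override the dtype of the model (default is the checkpoint dtype)."
    "Options: fp32, fp16, bf16. Please be aware that only some backends support fp16 and bf16.",
)

# "bf16" now parses cleanly; any value outside `choices` makes argparse
# exit with a usage error.
args = parser.parse_args(["--dtype-override", "bf16"])
print(args.dtype_override)  # -> bf16
```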

extension/llm/export/builder.py

Lines changed: 1 addition & 0 deletions
```diff
@@ -46,6 +46,7 @@ def to_torch_dtype(self) -> torch.dtype:
         mapping = {
             DType.fp32: torch.float32,
             DType.fp16: torch.float16,
+            DType.bf16: torch.bfloat16,
         }
         if self not in mapping:
             raise ValueError(f"Unsupported dtype {self}")
```
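For context, a minimal sketch of how the `DType` mapping behaves after this change. Only the `to_torch_dtype` mapping lines appear in the diff; the enum definition and its member values here are assumptions for illustration, and the real `DType` in builder.py may have additional members (which is why the `ValueError` branch exists):

```python
from enum import Enum

import torch


class DType(Enum):
    # Member values are hypothetical; only the three names below are
    # confirmed by the diff.
    fp32 = "fp32"
    fp16 = "fp16"
    bf16 = "bf16"

    def to_torch_dtype(self) -> torch.dtype:
        mapping = {
            DType.fp32: torch.float32,
            DType.fp16: torch.float16,
            DType.bf16: torch.bfloat16,  # added by this commit
        }
        if self not in mapping:
            raise ValueError(f"Unsupported dtype {self}")
        return mapping[self]


assert DType.bf16.to_torch_dtype() == torch.bfloat16
```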
