Refactor the transform passes into a standalone function

cccclai · facebook-github-bot · commit 3f637ccc61f6 · 2024-03-22T09:40:43.000-07:00
Summary: Move the transform passes out of `capture_program` into a standalone `_transform` function so they are easy to reuse.

Reviewed By: mergennachin

Differential Revision: D55230973
diff --git a/backends/qualcomm/utils/utils.py b/backends/qualcomm/utils/utils.py
@@ -85,27 +85,10 @@ def canonicalize_program(prog: ExportedProgram):
                 QNN_COMPILE_SPEC, convert_to_flatbuffer(options)
             )
 
-
-def capture_program(
-    module: torch.nn.Module,
-    inputs: Tuple[torch.Tensor],
-) -> exir.ExirExportedProgram:
-    # TODO: should switch to torch.export.export & custom deomposition
-    #       to reduce maintaining effort.
-    exir_exported_program = exir.capture(
-        module,
-        inputs,
-        qnn_capture_config(),
-    )
-    # We choose call_operator by target in ConvertBinaryOpsWithScalar
-    # because it is the same source_fn_stack for MultiheadAttention
-    exir_exported_program.transform(ConvertBinaryOpsWithScalar())
-    ex_prog = exir_exported_program.to_edge(qnn_edge_config())
-
+def _transform(edge_program: ExportedProgram) -> None:
     # currently ExirExportedProgram.transform does not accept
     # changes of input number which was caused by FoldQDQ
     # apply passes one by one here to avoid IR capture failure
-    edge_program = ex_prog.exported_program
     graph_module = edge_program.graph_module
     RemoveClone()(graph_module)
     RecomposePixelShuffle()(graph_module)
@@ -121,6 +104,23 @@ def capture_program(
     FoldQDQ()(graph_module)
     InsertRequantize(edge_program)(graph_module)
     LayoutTransform(edge_program)(graph_module)
+
+def capture_program(
+    module: torch.nn.Module,
+    inputs: Tuple[torch.Tensor],
+) -> exir.ExirExportedProgram:
+    # TODO: should switch to torch.export.export & custom decomposition
+    #       to reduce maintaining effort.
+    exir_exported_program = exir.capture(
+        module,
+        inputs,
+        qnn_capture_config(),
+    )
+    # We choose call_operator by target in ConvertBinaryOpsWithScalar
+    # because it is the same source_fn_stack for MultiheadAttention
+    exir_exported_program.transform(ConvertBinaryOpsWithScalar())
+    ex_prog = exir_exported_program.to_edge(qnn_edge_config())
+    _transform(ex_prog.exported_program)
     return ex_prog