Introduce executorch_ops_check

larryliu0820 · facebook-github-bot · commit 2c592e65b51d · 2024-12-02T10:45:49.000-08:00
Summary: Introduce `executorch_ops_check`. For any given target, it finds all the `executorch_generated_lib` targets in the transitive closure of that target's dependencies and makes sure the operators registered by those `executorch_generated_lib` targets do not overlap.

Differential Revision: D66560425
diff --git a/codegen/tools/gen_all_oplist.py b/codegen/tools/gen_all_oplist.py
@@ -1,31 +1,65 @@
-#!/usr/bin/env fbpython
+#!/usr/bin/env python3
 # Copyright (c) Meta Platforms, Inc. and affiliates.
 # All rights reserved.
 #
 # This source code is licensed under the BSD-style license found in the
 # LICENSE file in the root directory of this source tree.
 
 import argparse
+import re
 import os
 import sys
-from typing import Any, List
+from functools import reduce
+from typing import Any, List, Tuple
 
-from tools_copy.code_analyzer import gen_oplist_copy_from_core
+import yaml
+from torchgen.selective_build.selector import (
+    combine_selective_builders,
+    SelectiveBuilder,
+)
+from pathlib import Path
 
 
+def throw_if_any_op_includes_overloads(selective_builder: SelectiveBuilder) -> None:
+    ops = []
+    for op_name, op in selective_builder.operators.items():
+        if op.include_all_overloads:
+            ops.append(op_name)
+    if ops:
+        raise Exception(  # noqa: TRY002
+            (
+                "Operators that include all overloads are "
+                + "not allowed since --allow-include-all-overloads "
+                + "was not specified: {}"
+            ).format(", ".join(ops))
+        )
+
+def resolve_model_file_path_to_buck_target(model_file_path: str) -> str:
+    real_path = str(Path(model_file_path).resolve(strict=True))
+    # try my best to convert to buck target
+    prog = re.compile(r"/.*/buck-out/.*/(fbsource|fbcode)/[0-9a-f]*/(.*)/__(.*)_et_oplist__/out/selected_operators.yaml")
+    match = prog.match(real_path)
+    if match:
+        return f"{match.group(1)}//{match.group(2)}:{match.group(3)}"
+    else:
+        return real_path
+
 def main(argv: List[Any]) -> None:
-    """This binary is a wrapper for //executorch/codegen/tools/gen_oplist_copy_from_core.py.
-    This is needed because we intend to error out for the case where `model_file_list_path`
-    is empty or invalid, so that the ExecuTorch build will fail when no selective build target
-    is provided as a dependency to ExecuTorch build.
+    """This binary generates 3 files:
+
+    1. selected_mobile_ops.h: Primary operators used by templated selective build and Kernel Function
+       dtypes captured by tracing
+    2. selected_operators.yaml: Selected root and non-root operators (either via tracing or static analysis)
     """
     parser = argparse.ArgumentParser(description="Generate operator lists")
     parser.add_argument(
+        "--output-dir",
         "--output_dir",
         help=("The directory to store the output yaml file (selected_operators.yaml)"),
         required=True,
     )
     parser.add_argument(
+        "--model-file-list-path",
         "--model_file_list_path",
         help=(
             "Path to a file that contains the locations of individual "
@@ -36,6 +70,7 @@ def main(argv: List[Any]) -> None:
         required=True,
     )
     parser.add_argument(
+        "--allow-include-all-overloads",
         "--allow_include_all_overloads",
         help=(
             "Flag to allow operators that include all overloads. "
@@ -46,26 +81,99 @@ def main(argv: List[Any]) -> None:
         default=False,
         required=False,
     )
+    parser.add_argument(
+        "--check-ops-not-overlapping",
+        "--check_ops_not_overlapping",
+        help=(
+            "Flag to check if the operators in the model file list are overlapping. "
+            + "If not set, the script will not error out for overlapping operators."
+        ),
+        action="store_true",
+        default=False,
+        required=False,
+    )
+    options = parser.parse_args(argv)
+
 
-    # check if the build has any dependency on any selective build target. If we have a target, BUCK shold give us either:
+    # Check if the build has any dependency on any selective build target. If we have a target, BUCK should give us either:
     # 1. a yaml file containing selected ops (could be empty), or
-    # 2. a non-empty list of yaml files in the `model_file_list_path`.
-    # If none of the two things happened, the build target  has no dependency on any selective build and we should error out.
-    options = parser.parse_args(argv)
+    # 2. a non-empty list of yaml files in the `model_file_list_path`, or
+    # 3. a non-empty list of directories in the `model_file_list_path`, with each directory containing a `selected_operators.yaml` file.
+    # If none of these 3 things happened, the build target has no dependency on any selective build and we should error out.
     if os.path.isfile(options.model_file_list_path):
-        pass
+        print("Processing model file: ", options.model_file_list_path)
+        model_dicts = []
+        model_dict = yaml.safe_load(open(options.model_file_list_path))
+        model_dicts.append(model_dict)
     else:
-        assert (
-            options.model_file_list_path[0] == "@"
-        ), "model_file_list_path is not a valid file path, or it doesn't start with '@'. This is likely a BUCK issue."
+        print("Processing model directory: ", options.model_file_list_path)
+        assert options.model_file_list_path[0] == "@" , "model_file_list_path is not a valid file path, or it doesn't start with '@'. This is likely a BUCK issue."
+        
         model_file_list_path = options.model_file_list_path[1:]
+
+        model_dicts = []
         with open(model_file_list_path) as model_list_file:
             model_file_names = model_list_file.read().split()
             assert (
                 len(model_file_names) > 0
             ), "BUCK was not able to find any `et_operator_library` in the dependency graph of the current ExecuTorch "
             "build. Please refer to Selective Build wiki page to add at least one."
-    gen_oplist_copy_from_core.main(argv)
+            for model_file_name in model_file_names:
+                if not os.path.isfile(model_file_name):
+                    model_file_name = os.path.join(model_file_name, "selected_operators.yaml")
+                print("Processing model file: ", model_file_name)
+                assert os.path.isfile(model_file_name), f"{model_file_name} is not a valid file path. This is likely a BUCK issue."
+                with open(model_file_name, "rb") as model_file:
+                    model_dict = yaml.safe_load(model_file)
+                    resolved = resolve_model_file_path_to_buck_target(model_file_name)
+                    for op in model_dict["operators"]:
+                        model_dict["operators"][op]["debug_info"] = [resolved]
+                    model_dicts.append(model_dict)
+
+    selective_builders = [SelectiveBuilder.from_yaml_dict(m) for m in model_dicts]
+
+    # Optionally check if the operators in the model file list are overlapping.
+    if options.check_ops_not_overlapping:
+        ops = {}
+        for model_dict in model_dicts:
+            for op_name in model_dict["operators"]:
+                if op_name in ops:
+                    debug_info_1 = ','.join(ops[op_name]["debug_info"])
+                    debug_info_2 = ','.join(model_dict["operators"][op_name]["debug_info"])
+                    error = f"Operator {op_name} is used in 2 models: {debug_info_1} and {debug_info_2}"
+                    if "//" not in debug_info_1 and "//" not in debug_info_2:
+                        error += "\nWe can't determine what BUCK targets these model files belong to."
+                        tail = "."
+                    else:
+                        error += "\nPlease run the following commands to find out where is the BUCK target being added as a dependency to your target:\n"
+                        error += f"\n   buck2 cquery <mode> \"allpaths(<target>, {debug_info_1})\""
+                        error += f"\n   buck2 cquery <mode> \"allpaths(<target>, {debug_info_2})\""
+                        tail = "as well as results from BUCK commands listed above."
+
+                    error += "\n\nIf issue is not resolved, please post in PyTorch Edge Q&A with this error message" + tail
+                    raise Exception(error)  # noqa: TRY002
+                ops[op_name] = model_dict["operators"][op_name]
+    # We may have 0 selective builders since there may not be any viable
+    # pt_operator_library rule marked as a dep for the pt_operator_registry rule.
+    # This is potentially an error, and we should probably raise an assertion
+    # failure here. However, this needs to be investigated further.
+    selective_builder = SelectiveBuilder.from_yaml_dict({})
+    if len(selective_builders) > 0:
+        selective_builder = reduce(
+            combine_selective_builders,
+            selective_builders,
+        )
+
+    if not options.allow_include_all_overloads:
+        throw_if_any_op_includes_overloads(selective_builder)
+    with open(
+        os.path.join(options.output_dir, "selected_operators.yaml"), "wb"
+    ) as out_file:
+        out_file.write(
+            yaml.safe_dump(
+                selective_builder.to_dict(), default_flow_style=False
+            ).encode("utf-8"),
+        )
 
 
 if __name__ == "__main__":
diff --git a/codegen/tools/gen_oplist.py b/codegen/tools/gen_oplist.py
@@ -249,7 +249,7 @@ def gen_oplist(
     _dump_yaml(
         sorted(op_set),
         output_path,
-        os.path.basename(source_name) if source_name else None,
+        source_name,
         et_kernel_metadata,
         include_all_operators,
     )
diff --git a/codegen/tools/gen_oplist_copy_from_core.py b/codegen/tools/gen_oplist_copy_from_core.py
diff --git a/codegen/tools/targets.bzl b/codegen/tools/targets.bzl
@@ -78,23 +78,14 @@ def define_common_targets(is_fbcode = False):
         ],
     )
 
-    runtime.python_library(
-        name = "gen_oplist_copy_from_core",
-        srcs = [
-            "gen_oplist_copy_from_core.py",
-        ],
-        base_module = "tools_copy.code_analyzer",
-        external_deps = ["torchgen"],
-    )
-
     runtime.python_library(
         name = "gen_all_oplist_lib",
         srcs = ["gen_all_oplist.py"],
         base_module = "executorch.codegen.tools",
         visibility = [
             "//executorch/...",
         ],
-        deps = [":gen_oplist_copy_from_core"],
+        external_deps = ["torchgen"],
     )
 
     runtime.python_binary(
@@ -130,7 +121,7 @@ def define_common_targets(is_fbcode = False):
         srcs = ["gen_selected_op_variants.py"],
         base_module = "executorch.codegen.tools",
         visibility = ["//executorch/..."],
-        deps = [":gen_oplist_copy_from_core"],
+        deps = [":gen_all_oplist_lib"],
     )
 
     runtime.python_binary(
diff --git a/shim/xplat/executorch/codegen/codegen.bzl b/shim/xplat/executorch/codegen/codegen.bzl
@@ -531,7 +531,7 @@ def executorch_generated_lib(
     )
 
     # genrule for selective build from static operator list
-    oplist_dir_name = name + "_pt_oplist"
+    oplist_dir_name = name + "_et_oplist"
     runtime.genrule(
         name = oplist_dir_name,
         macros_only = False,
@@ -665,3 +665,27 @@ def executorch_generated_lib(
             define_static_target = define_static_targets,
             platforms = platforms,
         )
+
+# Util macro that takes in a binary or a shared library, finds targets ending with `_et_oplist` in the transitive closure of deps,
+# gets the `selected_operators.yaml` from those targets, and tries to merge them into a single yaml. This target will fail to build if
+# the `selected_operators.yaml` files that `target` depends on have any operators in common.
+#
+# An example failure case: a binary `bin` depends on 2 `executorch_generated_lib`s and they both register `aten::add.out`
+# with either the same or different kernels associated with it.
+#
+# If the build succeeds, all of the `selected_operators.yaml` files are merged into 1 `selected_operators.yaml` for debugging purposes.
+def executorch_ops_check(
+    name,
+    target,
+):
+    runtime.genrule(
+        name = name,
+        macros_only = False,
+        cmd = ("$(exe fbsource//xplat/executorch/codegen/tools:gen_all_oplist) " +
+               "--model_file_list_path $(@query_outputs \"filter('.*_et_oplist', deps({target}))\") " +
+               "--allow_include_all_overloads " +
+               "--check_ops_not_overlapping " +
+               "--output_dir $OUT ").format(target=target),
+        outs = {"selected_operators.yaml": ["selected_operators.yaml"]},
+        default_outs = ["."],
+    )

Original file line number	Diff line number	Diff line change
`@@ -249,7 +249,7 @@ def gen_oplist(`
`249`	`249`	`_dump_yaml(`
`250`	`250`	`sorted(op_set),`
`251`	`251`	`output_path,`
`252`		`- os.path.basename(source_name) if source_name else None,`
	`252`	`+ source_name,`
`253`	`253`	`et_kernel_metadata,`
`254`	`254`	`include_all_operators,`
`255`	`255`	`)`