|
5 | 5 | import json
|
6 | 6 | import shutil
|
7 | 7 | import uuid
|
| 8 | +from dataclasses import asdict, dataclass |
| 9 | +from enum import Enum |
8 | 10 |
|
9 | 11 | from pathlib import Path
|
10 | 12 |
|
11 |
| -from typing import final, List |
| 13 | +from typing import Dict, final, List |
12 | 14 |
|
13 | 15 | import coremltools as ct
|
14 | 16 | import executorchcoreml
|
|
21 | 23 | from executorch.exir.backend.compile_spec_schema import CompileSpec
|
22 | 24 |
|
23 | 25 |
|
class COMPILE_SPEC_KEYS(Enum):
    """Keys under which ``CoreMLBackend`` compile specs are stored.

    Each member's value is the string key used when building a
    ``CompileSpec`` and when parsing a list of compile specs back.
    """

    # Compute units (CPU/GPU/ANE) the lowered model may run on.
    COMPUTE_UNITS = "compute_units"
    # Whether the payload is an mlpackage or a compiled mlmodelc.
    MODEL_TYPE = "model_type"
    # Minimum OS deployment target for the lowered model.
    MIN_DEPLOYMENT_TARGET = "min_deployment_target"
    # Compute precision (e.g. fp16/fp32) used during conversion.
    MODEL_COMPUTE_PRECISION = "model_compute_precision"
| 32 | + |
@dataclass
class ModelMetadata:
    """Metadata serialized alongside the lowered Core ML model.

    Written to ``metadata.json`` (via ``dataclasses.asdict``) so the
    runtime can map program inputs/outputs to the Core ML model's
    named features and identify the model.
    """

    # Names of the model's input features.
    inputNames: List[str]
    # Names of the model's output features.
    outputNames: List[str]
    # Unique identifier (a UUID string) for this lowered model.
    identifier: str
| 42 | + |
24 | 43 | @final
|
25 | 44 | class CoreMLBackend(BackendDetails):
|
| 45 | + class MODEL_TYPE(Enum): |
| 46 | + MODEL = "model" |
| 47 | + COMPILED_MODEL = "compiled_model" |
| 48 | + |
| 49 | + @staticmethod |
| 50 | + def generate_model_type_compile_spec(model_type: MODEL_TYPE) -> CompileSpec: |
| 51 | + """ |
| 52 | + Returns the compile spec representing the given model type. |
| 53 | +
|
| 54 | + If the model type is ``MODEL_TYPE.Model`` then the ``CoreMLBackend`` returns |
| 55 | + the in-memory representation of the ``mlpackage`` contents. |
| 56 | +
|
| 57 | + If the model type is ``MODEL_TYPE.COMPILED_MODEL`` then the ``CoreMLBackend`` compiles the model |
| 58 | + and returns the in-memory representation of ``mlmodelc`` (compiled model) contents. |
| 59 | + """ |
| 60 | + return CompileSpec( |
| 61 | + COMPILE_SPEC_KEYS.MODEL_TYPE.value, model_type.value.encode("utf-8") |
| 62 | + ) |
| 63 | + |
| 64 | + @staticmethod |
| 65 | + def model_type_from_compile_specs(compile_specs: List[CompileSpec]) -> MODEL_TYPE: |
| 66 | + """ |
| 67 | + Returns the model type by parsing the list of compile specs. |
| 68 | + """ |
| 69 | + for compile_spec in compile_specs: |
| 70 | + if compile_spec.key == COMPILE_SPEC_KEYS.MODEL_TYPE.value: |
| 71 | + return CoreMLBackend.MODEL_TYPE(compile_spec.value.decode("utf-8")) |
| 72 | + |
| 73 | + return CoreMLBackend.MODEL_TYPE.MODEL |
| 74 | + |
| 75 | + @staticmethod |
| 76 | + def generate_compute_precision_compile_spec( |
| 77 | + compute_precision: ct.precision, |
| 78 | + ) -> CompileSpec: |
| 79 | + """ |
| 80 | + Returns the compile spec representing the model compute precision, for additional details |
| 81 | + please refer to the documentation for ``coremltools.precision``. |
| 82 | + """ |
| 83 | + return CompileSpec( |
| 84 | + COMPILE_SPEC_KEYS.MODEL_COMPUTE_PRECISION.value, |
| 85 | + compute_precision.value.encode("utf-8"), |
| 86 | + ) |
| 87 | + |
| 88 | + @staticmethod |
| 89 | + def model_compute_precision_from_compile_specs( |
| 90 | + compile_specs: List[CompileSpec], |
| 91 | + ) -> ct.precision: |
| 92 | + """ |
| 93 | + Returns the model's compute precision by parsing the list of compile specs. |
| 94 | + """ |
| 95 | + for compile_spec in compile_specs: |
| 96 | + if compile_spec.key == COMPILE_SPEC_KEYS.MODEL_COMPUTE_PRECISION.value: |
| 97 | + return ct.precision(compile_spec.value.decode("utf-8")) |
| 98 | + |
| 99 | + return ct.precision.FLOAT16 |
| 100 | + |
| 101 | + @staticmethod |
| 102 | + def generate_minimum_deployment_target_compile_spec( |
| 103 | + min_deployment_target: ct.target, |
| 104 | + ) -> CompileSpec: |
| 105 | + """ |
| 106 | + Returns the compile spec representing the minimum deployment target on which the model can run, |
| 107 | + for additional details please refer to the documentation for ``coremltools.target``. |
| 108 | + """ |
| 109 | + return CompileSpec( |
| 110 | + COMPILE_SPEC_KEYS.MIN_DEPLOYMENT_TARGET.value, |
| 111 | + str(min_deployment_target.value).encode("utf-8"), |
| 112 | + ) |
| 113 | + |
| 114 | + @staticmethod |
| 115 | + def min_deployment_target_from_compile_specs( |
| 116 | + compile_specs: List[CompileSpec], |
| 117 | + ) -> ct.target: |
| 118 | + """ |
| 119 | + Returns the minimum deployment target by parsing the list of compile specs. |
| 120 | + """ |
| 121 | + for compile_spec in compile_specs: |
| 122 | + if compile_spec.key == COMPILE_SPEC_KEYS.MIN_DEPLOYMENT_TARGET.value: |
| 123 | + compile_spec_value: int = int(compile_spec.value.decode("utf-8")) |
| 124 | + return ct.target(compile_spec_value) |
| 125 | + |
| 126 | + return ct.target.iOS15 |
| 127 | + |
26 | 128 | @staticmethod
|
27 |
| - def to_bytes(mlmodel): |
28 |
| - dir_path = Path("tmp") |
29 |
| - model_dir_path = dir_path / "lowered_module" |
30 |
| - Path(model_dir_path).mkdir(parents=True, exist_ok=True) |
31 |
| - model_path = model_dir_path / "model.mlpackage" |
32 |
| - mlmodel.save(model_path) |
33 |
| - |
34 |
| - # save model metdata |
35 |
| - spec = mlmodel.get_spec() |
36 |
| - input_names = [input.name for input in spec.description.input] |
37 |
| - output_names = [output.name for output in spec.description.output] |
| 129 | + def generate_compute_unit_compile_spec( |
| 130 | + compute_unit: ct.ComputeUnit, |
| 131 | + ) -> CompileSpec: |
| 132 | + """ |
| 133 | + Returns the compile spec representing the compute units on which the model can run, for additional details |
| 134 | + please refer to the documentation for ``coremltools.ComputeUnit`. |
| 135 | + """ |
| 136 | + return CompileSpec( |
| 137 | + COMPILE_SPEC_KEYS.COMPUTE_UNITS.value, |
| 138 | + compute_unit.name.lower().encode("utf-8"), |
| 139 | + ) |
| 140 | + |
| 141 | + @staticmethod |
| 142 | + def generate_compile_specs( |
| 143 | + compute_unit: ct.ComputeUnit = ct.ComputeUnit.ALL, |
| 144 | + minimum_deployment_target: ct.target = ct.target.iOS15, |
| 145 | + compute_precision: ct.precision = ct.precision.FLOAT16, |
| 146 | + model_type: MODEL_TYPE = MODEL_TYPE.MODEL, |
| 147 | + ) -> List[CompileSpec]: |
| 148 | + """ |
| 149 | + Returns the list of compile specs that's used by CoreMLBackend to lower the module. |
| 150 | + """ |
| 151 | + compile_specs: List[CompileSpec] = [] |
| 152 | + compile_specs.append( |
| 153 | + CoreMLBackend.generate_compute_unit_compile_spec(compute_unit) |
| 154 | + ) |
| 155 | + compile_specs.append( |
| 156 | + CoreMLBackend.generate_minimum_deployment_target_compile_spec( |
| 157 | + minimum_deployment_target |
| 158 | + ) |
| 159 | + ) |
| 160 | + compile_specs.append( |
| 161 | + CoreMLBackend.generate_compute_precision_compile_spec(compute_precision) |
| 162 | + ) |
| 163 | + compile_specs.append(CoreMLBackend.generate_model_type_compile_spec(model_type)) |
| 164 | + |
| 165 | + return compile_specs |
| 166 | + |
| 167 | + @staticmethod |
| 168 | + def model_metadata_from_spec(model_spec: ct.proto.Model_pb2) -> Dict[str, str]: |
| 169 | + input_names: List[str] = [input.name for input in model_spec.description.input] |
| 170 | + output_names = [output.name for output in model_spec.description.output] |
38 | 171 | identifier = uuid.uuid4()
|
39 | 172 |
|
40 |
| - model_metadata = { |
41 |
| - "inputNames": input_names, |
42 |
| - "outputNames": output_names, |
43 |
| - "identifier": str(identifier), |
44 |
| - } |
| 173 | + return ModelMetadata( |
| 174 | + inputNames=input_names, outputNames=output_names, identifier=str(identifier) |
| 175 | + ) |
| 176 | + |
| 177 | + @staticmethod |
| 178 | + def to_bytes(mlmodel: ct.models.MLModel, model_type: MODEL_TYPE) -> bytes: |
| 179 | + dir_path: Path = Path("tmp") |
| 180 | + model_dir_path: Path = dir_path / "lowered_module" |
| 181 | + model_spec: ct.proto.Model_pb2 = mlmodel.get_spec() |
| 182 | + model_metadata: ModelMetadata = CoreMLBackend.model_metadata_from_spec( |
| 183 | + model_spec |
| 184 | + ) |
| 185 | + match model_type: |
| 186 | + case CoreMLBackend.MODEL_TYPE.MODEL: |
| 187 | + # Store model. |
| 188 | + model_path = model_dir_path / "model.mlpackage" |
| 189 | + mlmodel.save(model_path) |
45 | 190 |
|
46 |
| - # store metadata |
| 191 | + case CoreMLBackend.MODEL_TYPE.COMPILED_MODEL: |
| 192 | + # Store compiled model |
| 193 | + model_path = model_dir_path / "model.mlmodelc" |
| 194 | + compiled_model_path = mlmodel.get_compiled_model_path() |
| 195 | + |
| 196 | + shutil.copytree( |
| 197 | + compiled_model_path, |
| 198 | + str(model_path.resolve()), |
| 199 | + dirs_exist_ok=True, |
| 200 | + ) |
| 201 | + |
| 202 | + # Store model metadata. |
47 | 203 | model_metadata_path = Path(model_dir_path) / "metadata.json"
|
48 |
| - json_object = json.dumps(model_metadata) |
| 204 | + model_metadata_json = json.dumps(asdict(model_metadata)) |
49 | 205 | with open(model_metadata_path, "w") as outfile:
|
50 |
| - outfile.write(json_object) |
| 206 | + outfile.write(model_metadata_json) |
51 | 207 |
|
52 | 208 | # flatten directory contents and convert it to bytes
|
53 | 209 | flattened_bytes = executorchcoreml.flatten_directory_contents(
|
54 | 210 | str(model_dir_path.resolve())
|
55 | 211 | )
|
| 212 | + |
56 | 213 | shutil.rmtree(str(model_dir_path.resolve()))
|
57 | 214 | return flattened_bytes
|
58 | 215 |
|
59 | 216 | @classmethod
|
60 |
| - # pyre-ignore |
61 | 217 | def preprocess(
|
62 | 218 | cls,
|
63 | 219 | edge_program: ExportedProgram,
|
64 |
| - module_compile_spec: List[CompileSpec], |
| 220 | + module_compile_specs: List[CompileSpec], |
65 | 221 | ) -> PreprocessResult:
|
| 222 | + model_type: CoreMLBackend.MODEL_TYPE = ( |
| 223 | + CoreMLBackend.model_type_from_compile_specs( |
| 224 | + module_compile_specs, |
| 225 | + ) |
| 226 | + ) |
| 227 | + |
| 228 | + model_compute_precision: ct.precision = ( |
| 229 | + CoreMLBackend.model_compute_precision_from_compile_specs( |
| 230 | + module_compile_specs |
| 231 | + ) |
| 232 | + ) |
| 233 | + |
| 234 | + minimum_deployment_target: ct.target = ( |
| 235 | + CoreMLBackend.min_deployment_target_from_compile_specs(module_compile_specs) |
| 236 | + ) |
| 237 | + |
| 238 | + skip_model_load: bool = False |
| 239 | + match model_type: |
| 240 | + case CoreMLBackend.MODEL_TYPE.MODEL: |
| 241 | + skip_model_load = True |
| 242 | + |
| 243 | + case CoreMLBackend.MODEL_TYPE.COMPILED_MODEL: |
| 244 | + skip_model_load = False |
| 245 | + |
66 | 246 | mlmodel = ct.convert(
|
67 | 247 | model=edge_program,
|
68 | 248 | source="pytorch",
|
69 | 249 | convert_to="mlprogram",
|
70 | 250 | pass_pipeline=ct.PassPipeline.DEFAULT,
|
71 |
| - skip_model_load=True, |
| 251 | + skip_model_load=skip_model_load, |
| 252 | + compute_precision=model_compute_precision, |
| 253 | + minimum_deployment_target=minimum_deployment_target, |
72 | 254 | )
|
73 |
| - flattened_bytes = CoreMLBackend.to_bytes(mlmodel) |
| 255 | + |
| 256 | + processed_bytes = CoreMLBackend.to_bytes(mlmodel, model_type=model_type) |
74 | 257 | return PreprocessResult(
|
75 |
| - processed_bytes=flattened_bytes, |
| 258 | + processed_bytes=processed_bytes, |
76 | 259 | )
|
0 commit comments