Move module-level accelerate import to function level

samruds · samruds · commit cb387bc5bdaa · 2024-03-29T12:39:10.000-07:00
diff --git a/src/sagemaker/serve/detector/dependency_manager.py b/src/sagemaker/serve/detector/dependency_manager.py
@@ -54,9 +54,9 @@ def capture_dependencies(dependencies: dict, work_dir: Path, capture_all: bool =
 
         with open(path, "r") as f:
             autodetect_depedencies = f.read().splitlines()
-        autodetect_depedencies.append("sagemaker>=2.199")
+        autodetect_depedencies.append("sagemaker[huggingface]>=2.199")
     else:
-        autodetect_depedencies = ["sagemaker>=2.199"]
+        autodetect_depedencies = ["sagemaker[huggingface]>=2.199"]
 
     module_version_dict = _parse_dependency_list(autodetect_depedencies)
 
diff --git a/src/sagemaker/serve/utils/hardware_detector.py b/src/sagemaker/serve/utils/hardware_detector.py
@@ -18,9 +18,7 @@
 
 from botocore.exceptions import ClientError
 
-from accelerate.commands.estimate import estimate_command_parser, gather_data
 from sagemaker import Session
-from sagemaker.model import Model
 from sagemaker import instance_types_gpu_info
 
 logger = logging.getLogger(__name__)
@@ -116,18 +114,23 @@ def _format_instance_type(instance_type: str) -> str:
     return ec2_instance
 
 
-def _total_inference_model_size_mib(model: Model, dtype: str) -> int:
+def _total_inference_model_size_mib(model: str, dtype: str) -> int:
     """Calculates the model size from HF accelerate
 
     This function gets the model size from accelerate. It also adds a
     padding and converts to size MiB. When performing inference, expect
      to add up to an additional 20% to the given model size as found by EleutherAI.
     """
-    args = estimate_command_parser().parse_args([model, "--dtypes", dtype])
-
-    output = gather_data(
-        args
-    )  # "dtype", "Largest Layer", "Total Size Bytes", "Training using Adam"
+    try:
+        from accelerate.commands.estimate import estimate_command_parser, gather_data
+        args = estimate_command_parser().parse_args([model, "--dtypes", dtype])
+
+        output = gather_data(
+            args
+        )  # "dtype", "Largest Layer", "Total Size Bytes", "Training using Adam"
+    except ImportError:
+        logger.error("Install HuggingFace extras dependencies using pip install 'sagemaker["
+                     "huggingface]>=2.212.0'")
 
     if output is None:
         raise ValueError(f"Could not get Model size for {model}")