|
43 | 43 | from sagemaker.serve.utils import task
|
44 | 44 | from sagemaker.serve.utils.exceptions import TaskNotFoundException
|
45 | 45 | from sagemaker.serve.utils.predictors import _get_local_mode_predictor
|
46 |
| -from sagemaker.serve.utils.hardware_detector import _get_gpu_info, _get_gpu_info_fallback,\ |
47 |
| - _total_inference_model_size_mib |
| 46 | +from sagemaker.serve.utils.hardware_detector import ( |
| 47 | + _get_gpu_info, |
| 48 | + _get_gpu_info_fallback, |
| 49 | + _total_inference_model_size_mib, |
| 50 | +) |
48 | 51 | from sagemaker.serve.detector.image_detector import (
|
49 | 52 | auto_detect_container,
|
50 | 53 | _detect_framework_and_version,
|
@@ -724,12 +727,15 @@ def _can_fit_on_single_gpu(self) -> Type[bool]:
|
724 | 727 | """
|
725 | 728 | try:
|
726 | 729 | single_gpu_size_mib = self._try_fetch_gpu_info()
|
727 |
| - if _total_inference_model_size_mib(self.model, self.env_vars.get("dtypes", "float32")) \ |
728 |
| - <= single_gpu_size_mib: |
| 730 | + if ( |
| 731 | + _total_inference_model_size_mib(self.model, self.env_vars.get("dtypes", "float32")) |
| 732 | + <= single_gpu_size_mib |
| 733 | + ): |
729 | 734 | logger.info(
|
730 | 735 | "Total inference model size MIB %s, single GPU size for instance MIB %s",
|
731 |
| - _total_inference_model_size_mib(self.model, self.env_vars.get("dtypes", |
732 |
| - "float32")), |
| 736 | + _total_inference_model_size_mib( |
| 737 | + self.model, self.env_vars.get("dtypes", "float32") |
| 738 | + ), |
733 | 739 | single_gpu_size_mib,
|
734 | 740 | )
|
735 | 741 | return True
|
|
0 commit comments