Skip to content

Commit cc9b286

Browse files
jinpengqi (Jinpeng Qi) and a co-author authored
fix: advanced inference recommendation jobs parameters check (#3644)
Co-authored-by: Jinpeng Qi <[email protected]>
1 parent b731021 commit cc9b286

File tree

2 files changed

+18
-8
lines changed

2 files changed

+18
-8
lines changed

src/sagemaker/inference_recommender/__init__.py

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -12,3 +12,7 @@
1212
# language governing permissions and limitations under the License.
1313
"""Classes for using Inference Recommender with Amazon SageMaker."""
1414
from __future__ import absolute_import
15+
from sagemaker.inference_recommender.inference_recommender_mixin import ( # noqa: F401
16+
Phase,
17+
ModelLatencyThreshold,
18+
)

src/sagemaker/inference_recommender/inference_recommender_mixin.py

Lines changed: 14 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -464,18 +464,24 @@ def _convert_to_resource_limit_json(self, max_tests: int, max_parallel_tests: in
464464
"""Bundle right_size() parameters into a resource limit for Advanced job"""
465465
if not max_tests and not max_parallel_tests:
466466
return None
467-
return {
468-
"MaxNumberOfTests": max_tests,
469-
"MaxParallelOfTests": max_parallel_tests,
470-
}
467+
resource_limit = {}
468+
if max_tests:
469+
resource_limit["MaxNumberOfTests"] = max_tests
470+
if max_parallel_tests:
471+
resource_limit["MaxParallelOfTests"] = max_parallel_tests
472+
return resource_limit
471473

472474
def _convert_to_stopping_conditions_json(
    self, max_invocations: int, model_latency_thresholds: List[ModelLatencyThreshold]
):
    """Bundle right_size() parameters into stopping conditions for an Advanced job.

    Returns ``None`` when neither parameter was supplied; otherwise returns a
    dict containing only the keys whose corresponding argument is truthy, so
    absent parameters are omitted rather than sent as null/empty values.
    """
    # Nothing to bundle at all -> no StoppingConditions payload.
    if not (max_invocations or model_latency_thresholds):
        return None

    conditions = {}
    if max_invocations:
        conditions["MaxInvocations"] = max_invocations
    if model_latency_thresholds:
        # threshold.to_json is expected to yield the API-shaped dict for each
        # ModelLatencyThreshold entry.
        thresholds_json = [entry.to_json for entry in model_latency_thresholds]
        conditions["ModelLatencyThresholds"] = thresholds_json
    return conditions

0 commit comments

Comments (0)