Skip to content

Commit 9b765b7

Browse files
author
AWS
committed
Amazon SageMaker Service Update: SageMaker Inference Recommender is now decoupled from Model Registry and can accept a Model Name to invoke an inference recommendations job; Inference Recommender now provides CPU/Memory Utilization metrics data in the recommendation output.
1 parent 5809d7b commit 9b765b7

File tree

2 files changed

+49
-1
lines changed

2 files changed

+49
-1
lines changed
Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,6 @@
1+
{
2+
"type": "feature",
3+
"category": "Amazon SageMaker Service",
4+
"contributor": "",
5+
"description": "SageMaker Inference Recommender is now decoupled from Model Registry and can accept a Model Name to invoke an inference recommendations job; Inference Recommender now provides CPU/Memory Utilization metrics data in the recommendation output."
6+
}

services/sagemaker/src/main/resources/codegen-resources/service-2.json

Lines changed: 43 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -2467,6 +2467,9 @@
24672467
},
24682468
"input":{"shape":"ListInferenceRecommendationsJobStepsRequest"},
24692469
"output":{"shape":"ListInferenceRecommendationsJobStepsResponse"},
2470+
"errors":[
2471+
{"shape":"ResourceNotFound"}
2472+
],
24702473
"documentation":"<p>Returns a list of the subtasks for an Inference Recommender job.</p> <p>The supported subtasks are benchmarks, which evaluate the performance of your model on different instance types.</p>"
24712474
},
24722475
"ListInferenceRecommendationsJobs":{
@@ -18127,6 +18130,10 @@
1812718130
"ModelConfiguration":{
1812818131
"shape":"ModelConfiguration",
1812918132
"documentation":"<p>Defines the model configuration.</p>"
18133+
},
18134+
"RecommendationId":{
18135+
"shape":"String",
18136+
"documentation":"<p>The recommendation ID which uniquely identifies each recommendation.</p>"
1813018137
}
1813118138
},
1813218139
"documentation":"<p>A list of recommendations made by Amazon SageMaker Inference Recommender.</p>"
@@ -23444,6 +23451,10 @@
2344423451
"EnvironmentParameters":{
2344523452
"shape":"EnvironmentParameters",
2344623453
"documentation":"<p>Defines the environment parameters, including keys, value types, and values.</p>"
23454+
},
23455+
"CompilationJobName":{
23456+
"shape":"RecommendationJobCompilationJobName",
23457+
"documentation":"<p>The name of the compilation job used to create the recommended model artifacts.</p>"
2344723458
}
2344823459
},
2344923460
"documentation":"<p>Defines the model configuration. Includes the specification name and environment parameters.</p>"
@@ -28002,6 +28013,12 @@
2800228013
"max":256,
2800328014
"pattern":"arn:aws[a-z\\-]*:sagemaker:[a-z0-9\\-]*:[0-9]{12}:inference-recommendations-job/.*"
2800428015
},
28016+
"RecommendationJobCompilationJobName":{
28017+
"type":"string",
28018+
"max":63,
28019+
"min":1,
28020+
"pattern":"^[a-zA-Z0-9](-*[a-zA-Z0-9]){0,62}$"
28021+
},
2800528022
"RecommendationJobCompiledOutputConfig":{
2800628023
"type":"structure",
2800728024
"members":{
@@ -28042,10 +28059,20 @@
2804228059
"SupportedInstanceTypes":{
2804328060
"shape":"RecommendationJobSupportedInstanceTypes",
2804428061
"documentation":"<p>A list of the instance types that are used to generate inferences in real-time.</p>"
28062+
},
28063+
"DataInputConfig":{
28064+
"shape":"RecommendationJobDataInputConfig",
28065+
"documentation":"<p>Specifies the name and shape of the expected data inputs for your trained model with a JSON dictionary form. This field is used for optimizing your model using SageMaker Neo. For more information, see <a href=\"https://docs.aws.amazon.com/sagemaker/latest/APIReference/API_InputConfig.html#sagemaker-Type-InputConfig-DataInputConfig\">DataInputConfig</a>.</p>"
2804528066
}
2804628067
},
2804728068
"documentation":"<p>Specifies mandatory fields for running an Inference Recommender job directly in the <a href=\"https://docs.aws.amazon.com/sagemaker/latest/APIReference/API_CreateInferenceRecommendationsJob.html\">CreateInferenceRecommendationsJob</a> API. The fields specified in <code>ContainerConfig</code> override the corresponding fields in the model package. Use <code>ContainerConfig</code> if you want to specify these fields for the recommendation job but don't want to edit them in your model package.</p>"
2804828069
},
28070+
"RecommendationJobDataInputConfig":{
28071+
"type":"string",
28072+
"max":1024,
28073+
"min":1,
28074+
"pattern":"[\\S\\s]+"
28075+
},
2804928076
"RecommendationJobDescription":{
2805028077
"type":"string",
2805128078
"max":128
@@ -28066,7 +28093,6 @@
2806628093
},
2806728094
"RecommendationJobInputConfig":{
2806828095
"type":"structure",
28069-
"required":["ModelPackageVersionArn"],
2807028096
"members":{
2807128097
"ModelPackageVersionArn":{
2807228098
"shape":"ModelPackageArn",
@@ -28103,6 +28129,10 @@
2810328129
"VpcConfig":{
2810428130
"shape":"RecommendationJobVpcConfig",
2810528131
"documentation":"<p>Inference Recommender provisions SageMaker endpoints with access to VPC in the inference recommendation job.</p>"
28132+
},
28133+
"ModelName":{
28134+
"shape":"ModelName",
28135+
"documentation":"<p>The name of the created model.</p>"
2810628136
}
2810728137
},
2810828138
"documentation":"<p>The input configuration of the recommendation job.</p>"
@@ -28259,6 +28289,14 @@
2825928289
"ModelLatency":{
2826028290
"shape":"Integer",
2826128291
"documentation":"<p>The expected model latency at maximum invocations per minute for the instance.</p>"
28292+
},
28293+
"CpuUtilization":{
28294+
"shape":"UtilizationMetric",
28295+
"documentation":"<p>The expected CPU utilization at maximum invocations per minute for the instance.</p> <p> <code>NaN</code> indicates that the value is not available.</p>"
28296+
},
28297+
"MemoryUtilization":{
28298+
"shape":"UtilizationMetric",
28299+
"documentation":"<p>The expected memory utilization at maximum invocations per minute for the instance.</p> <p> <code>NaN</code> indicates that the value is not available.</p>"
2826228300
}
2826328301
},
2826428302
"documentation":"<p>The metrics of recommendations.</p>"
@@ -32889,6 +32927,10 @@
3288932927
},
3289032928
"documentation":"<p>A collection of settings that apply to users of Amazon SageMaker Studio. These settings are specified when the <code>CreateUserProfile</code> API is called, and as <code>DefaultUserSettings</code> when the <code>CreateDomain</code> API is called.</p> <p> <code>SecurityGroups</code> is aggregated when specified in both calls. For all other settings in <code>UserSettings</code>, the values specified in <code>CreateUserProfile</code> take precedence over those specified in <code>CreateDomain</code>.</p>"
3289132929
},
32930+
"UtilizationMetric":{
32931+
"type":"float",
32932+
"min":0.0
32933+
},
3289232934
"ValidationFraction":{
3289332935
"type":"float",
3289432936
"max":1,

0 commit comments

Comments
 (0)