Skip to content

Commit 9e7c229

Browse files
author
AWS
committed
Amazon SageMaker Service Update: This release adds support for rolling deployment in SageMaker Inference.
1 parent 3cf3501 commit 9e7c229

File tree

2 files changed

+40
-4
lines changed

2 files changed

+40
-4
lines changed
Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,6 @@
1+
{
2+
"type": "feature",
3+
"category": "Amazon SageMaker Service",
4+
"contributor": "",
5+
"description": "This release adds support for rolling deployment in SageMaker Inference."
6+
}

services/sagemaker/src/main/resources/codegen-resources/service-2.json

Lines changed: 34 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -5853,7 +5853,7 @@
58535853
"documentation":"<p>Defines the capacity size, either as a number of instances or a capacity percentage.</p>"
58545854
}
58555855
},
5856-
"documentation":"<p>Specifies the endpoint capacity to activate for production.</p>"
5856+
"documentation":"<p>Specifies the type and size of the endpoint capacity to activate for a blue/green deployment, a rolling deployment, or a rollback strategy. You can specify your batches as either instance count or the overall percentage or your fleet.</p> <p>For a rollback strategy, if you don't specify the fields in this object, or if you set the <code>Value</code> to 100%, then SageMaker uses a blue/green rollback strategy and rolls all traffic back to the blue fleet.</p>"
58575857
},
58585858
"CapacitySizeType":{
58595859
"type":"string",
@@ -10679,7 +10679,6 @@
1067910679
},
1068010680
"DeploymentConfig":{
1068110681
"type":"structure",
10682-
"required":["BlueGreenUpdatePolicy"],
1068310682
"members":{
1068410683
"BlueGreenUpdatePolicy":{
1068510684
"shape":"BlueGreenUpdatePolicy",
@@ -10688,6 +10687,10 @@
1068810687
"AutoRollbackConfiguration":{
1068910688
"shape":"AutoRollbackConfig",
1069010689
"documentation":"<p>Automatic rollback configuration for handling endpoint deployment failures and recovery.</p>"
10690+
},
10691+
"RollingUpdatePolicy":{
10692+
"shape":"RollingUpdatePolicy",
10693+
"documentation":"<p>Specifies a rolling deployment strategy for updating a SageMaker endpoint.</p>"
1069110694
}
1069210695
},
1069310696
"documentation":"<p>The deployment configuration for an endpoint, which contains the desired deployment strategy and rollback configurations.</p>"
@@ -16050,7 +16053,8 @@
1605016053
"RollingBack",
1605116054
"InService",
1605216055
"Deleting",
16053-
"Failed"
16056+
"Failed",
16057+
"UpdateRollbackFailed"
1605416058
]
1605516059
},
1605616060
"EndpointSummary":{
@@ -23567,7 +23571,7 @@
2356723571
},
2356823572
"MaximumExecutionTimeoutInSeconds":{
2356923573
"type":"integer",
23570-
"max":14400,
23574+
"max":28800,
2357123575
"min":600
2357223576
},
2357323577
"MaximumRetryAttempts":{
@@ -29645,6 +29649,32 @@
2964529649
"min":20,
2964629650
"pattern":"^arn:aws[a-z\\-]*:iam::\\d{12}:role/?[a-zA-Z_0-9+=,.@\\-_/]+$"
2964729651
},
29652+
"RollingUpdatePolicy":{
29653+
"type":"structure",
29654+
"required":[
29655+
"MaximumBatchSize",
29656+
"WaitIntervalInSeconds"
29657+
],
29658+
"members":{
29659+
"MaximumBatchSize":{
29660+
"shape":"CapacitySize",
29661+
"documentation":"<p>Batch size for each rolling step to provision capacity and turn on traffic on the new endpoint fleet, and terminate capacity on the old endpoint fleet. Value must be between 5% to 50% of the variant's total instance count.</p>"
29662+
},
29663+
"WaitIntervalInSeconds":{
29664+
"shape":"WaitIntervalInSeconds",
29665+
"documentation":"<p>The length of the baking period, during which SageMaker monitors alarms for each batch on the new fleet.</p>"
29666+
},
29667+
"MaximumExecutionTimeoutInSeconds":{
29668+
"shape":"MaximumExecutionTimeoutInSeconds",
29669+
"documentation":"<p>The time limit for the total deployment. Exceeding this limit causes a timeout.</p>"
29670+
},
29671+
"RollbackMaximumBatchSize":{
29672+
"shape":"CapacitySize",
29673+
"documentation":"<p>Batch size for rollback to the old endpoint fleet. Each rolling step to provision capacity and turn on traffic on the old endpoint fleet, and terminate capacity on the new endpoint fleet. If this field is absent, the default value will be set to 100% of total capacity which means to bring up the whole capacity of the old fleet at once during rollback.</p>"
29674+
}
29675+
},
29676+
"documentation":"<p>Specifies a rolling deployment strategy for updating a SageMaker endpoint.</p>"
29677+
},
2964829678
"RootAccess":{
2964929679
"type":"string",
2965029680
"enum":[

0 commit comments

Comments
 (0)