Skip to content

Commit 7e0febc

Browse files
author
AWS
committed
Amazon SageMaker Service Update: This release includes support for (1) Provisioned Concurrency for Amazon SageMaker Serverless Inference and (2) UpdateEndpointWeightsAndCapacities API for Serverless endpoints.
1 parent 85c6b61 commit 7e0febc

File tree

2 files changed

+36
-3
lines changed

2 files changed

+36
-3
lines changed
Lines changed: 6 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,6 @@
1+
{
2+
"type": "feature",
3+
"category": "Amazon SageMaker Service",
4+
"contributor": "",
5+
"description": "This release includes support for (1) Provisioned Concurrency for Amazon SageMaker Serverless Inference and (2) UpdateEndpointWeightsAndCapacities API for Serverless endpoints."
6+
}

services/sagemaker/src/main/resources/codegen-resources/service-2.json

Lines changed: 30 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -7475,7 +7475,7 @@
7475 7475
},
7476 7476
"AppSecurityGroupManagement":{
7477 7477
"shape":"AppSecurityGroupManagement",
7478-
"documentation":"<p>The entity that creates and manages the required security groups for inter-app communication in <code>VPCOnly</code> mode. Required when <code>CreateDomain.AppNetworkAccessType</code> is <code>VPCOnly</code> and <code>DomainSettings.RStudioServerProDomainSettings.DomainExecutionRoleArn</code> is provided.</p>"
7478+
"documentation":"<p>The entity that creates and manages the required security groups for inter-app communication in <code>VPCOnly</code> mode. Required when <code>CreateDomain.AppNetworkAccessType</code> is <code>VPCOnly</code> and <code>DomainSettings.RStudioServerProDomainSettings.DomainExecutionRoleArn</code> is provided. If setting up the domain for use with RStudio, this value must be set to <code>Service</code>.</p>"
7479 7479
},
7480 7480
"DomainSettings":{
7481 7481
"shape":"DomainSettings",
@@ -14615,6 +14615,10 @@
14615 14615
"DesiredInstanceCount":{
14616 14616
"shape":"TaskCount",
14617 14617
"documentation":"<p>The variant's capacity.</p>"
14618+
},
14619+
"ServerlessUpdateConfig":{
14620+
"shape":"ProductionVariantServerlessUpdateConfig",
14621+
"documentation":"<p>Specifies the serverless update concurrency configuration for an endpoint variant.</p>"
14618 14622
}
14619 14623
},
14620 14624
"documentation":"<p>Specifies weight and capacity values for a production variant.</p>"
@@ -15059,7 +15063,7 @@
15059 15063
"members":{
15060 15064
"RStudioServerProDomainSettingsForUpdate":{
15061 15065
"shape":"RStudioServerProDomainSettingsForUpdate",
15062-
"documentation":"<p>A collection of <code>RStudioServerPro</code> Domain-level app settings to update.</p>"
15066+
"documentation":"<p>A collection of <code>RStudioServerPro</code> Domain-level app settings to update. A single <code>RStudioServerPro</code> application is created for a domain.</p>"
15063 15067
},
15064 15068
"ExecutionRoleIdentityConfig":{
15065 15069
"shape":"ExecutionRoleIdentityConfig",
@@ -27755,10 +27759,28 @@
27755 27759
"MaxConcurrency":{
27756 27760
"shape":"ServerlessMaxConcurrency",
27757 27761
"documentation":"<p>The maximum number of concurrent invocations your serverless endpoint can process.</p>"
27762+
},
27763+
"ProvisionedConcurrency":{
27764+
"shape":"ServerlessProvisionedConcurrency",
27765+
"documentation":"<p>The amount of provisioned concurrency to allocate for the serverless endpoint. Should be less than or equal to <code>MaxConcurrency</code>.</p>"
27758 27766
}
27759 27767
},
27760 27768
"documentation":"<p>Specifies the serverless configuration for an endpoint variant.</p>"
27761 27769
},
27770+
"ProductionVariantServerlessUpdateConfig":{
27771+
"type":"structure",
27772+
"members":{
27773+
"MaxConcurrency":{
27774+
"shape":"ServerlessMaxConcurrency",
27775+
"documentation":"<p>The updated maximum number of concurrent invocations your serverless endpoint can process.</p>"
27776+
},
27777+
"ProvisionedConcurrency":{
27778+
"shape":"ServerlessProvisionedConcurrency",
27779+
"documentation":"<p>The updated amount of provisioned concurrency to allocate for the serverless endpoint. Should be less than or equal to <code>MaxConcurrency</code>.</p>"
27780+
}
27781+
},
27782+
"documentation":"<p>Specifies the serverless update concurrency configuration for an endpoint variant.</p>"
27783+
},
27762 27784
"ProductionVariantStatus":{
27763 27785
"type":"structure",
27764 27786
"required":["Status"],
@@ -29661,6 +29683,11 @@
29661 29683
"max":6144,
29662 29684
"min":1024
29663 29685
},
29686+
"ServerlessProvisionedConcurrency":{
29687+
"type":"integer",
29688+
"max":200,
29689+
"min":1
29690+
},
29664 29691
"ServiceCatalogEntityId":{
29665 29692
"type":"string",
29666 29693
"max":100,
@@ -32450,7 +32477,7 @@
32450 32477
},
32451 32478
"AppSecurityGroupManagement":{
32452 32479
"shape":"AppSecurityGroupManagement",
32453-
"documentation":"<p>The entity that creates and manages the required security groups for inter-app communication in <code>VPCOnly</code> mode. Required when <code>CreateDomain.AppNetworkAccessType</code> is <code>VPCOnly</code> and <code>DomainSettings.RStudioServerProDomainSettings.DomainExecutionRoleArn</code> is provided.</p>"
32480+
"documentation":"<p>The entity that creates and manages the required security groups for inter-app communication in <code>VPCOnly</code> mode. Required when <code>CreateDomain.AppNetworkAccessType</code> is <code>VPCOnly</code> and <code>DomainSettings.RStudioServerProDomainSettings.DomainExecutionRoleArn</code> is provided. If setting up the domain for use with RStudio, this value must be set to <code>Service</code>.</p>"
32454 32481
}
32455 32482
}
32456 32483
},

0 commit comments

Comments
 (0)