feat(client-sagemaker): SageMaker Training Managed Warm Pools let you retain provisioned infrastructure to reduce latency for repetitive training workloads.

awstools · awstools · commit 85fc637e3066 · 2022-09-29T18:26:24.000Z
diff --git a/clients/client-sagemaker/src/SageMaker.ts b/clients/client-sagemaker/src/SageMaker.ts
@@ -10233,7 +10233,7 @@ export class SageMaker extends SageMakerClient {
   }
 
   /**
-   * <p>Update a model training job to request a new Debugger profiling configuration.</p>
+   * <p>Update a model training job to request a new Debugger profiling configuration or to change warm pool retention length.</p>
    */
   public updateTrainingJob(
     args: UpdateTrainingJobCommandInput,
diff --git a/clients/client-sagemaker/src/commands/ListMonitoringSchedulesCommand.ts b/clients/client-sagemaker/src/commands/ListMonitoringSchedulesCommand.ts
@@ -12,12 +12,8 @@ import {
   SerdeContext as __SerdeContext,
 } from "@aws-sdk/types";
 
-import {
-  ListMonitoringSchedulesRequest,
-  ListMonitoringSchedulesRequestFilterSensitiveLog,
-  ListMonitoringSchedulesResponse,
-  ListMonitoringSchedulesResponseFilterSensitiveLog,
-} from "../models/models_2";
+import { ListMonitoringSchedulesRequest, ListMonitoringSchedulesRequestFilterSensitiveLog } from "../models/models_2";
+import { ListMonitoringSchedulesResponse, ListMonitoringSchedulesResponseFilterSensitiveLog } from "../models/models_3";
 import {
   deserializeAws_json1_1ListMonitoringSchedulesCommand,
   serializeAws_json1_1ListMonitoringSchedulesCommand,
diff --git a/clients/client-sagemaker/src/commands/UpdateTrainingJobCommand.ts b/clients/client-sagemaker/src/commands/UpdateTrainingJobCommand.ts
@@ -28,7 +28,7 @@ export interface UpdateTrainingJobCommandInput extends UpdateTrainingJobRequest
 export interface UpdateTrainingJobCommandOutput extends UpdateTrainingJobResponse, __MetadataBearer {}
 
 /**
- * <p>Update a model training job to request a new Debugger profiling configuration.</p>
+ * <p>Update a model training job to request a new Debugger profiling configuration or to change warm pool retention length.</p>
  * @example
  * Use a bare-bones client and the command you need to make an API call.
  * ```javascript
diff --git a/clients/client-sagemaker/src/models/models_0.ts b/clients/client-sagemaker/src/models/models_0.ts
@@ -1215,6 +1215,11 @@ export interface ResourceConfig {
    * <p>The configuration of a heterogeneous cluster in JSON format.</p>
    */
   InstanceGroups?: InstanceGroup[];
+
+  /**
+   * <p>The duration of time in seconds to retain configured resources in a warm pool for subsequent training jobs.</p>
+   */
+  KeepAlivePeriodInSeconds?: number;
 }
 
 /**
diff --git a/clients/client-sagemaker/src/models/models_2.ts b/clients/client-sagemaker/src/models/models_2.ts
@@ -3020,6 +3020,56 @@ export interface SecondaryStatusTransition {
   StatusMessage?: string;
 }
 
+export enum WarmPoolResourceStatus {
+  AVAILABLE = "Available", // pool is available to reuse for a matching training job
+  INUSE = "InUse", // pool is in use for the training job
+  REUSED = "Reused", // pool moved to a matching training job for reuse
+  TERMINATED = "Terminated", // pool is no longer available
+}
+
+/**
+ * <p>Status and billing information about the warm pool, as carried in the optional <code>WarmPoolStatus</code> member of <code>DescribeTrainingJobResponse</code> and <code>TrainingJobSummary</code>.</p>
+ */
+export interface WarmPoolStatus {
+  /**
+   * <p>The status of the warm pool.</p>
+   *         <ul>
+   *             <li>
+   *                 <p>
+   *                   <code>InUse</code>: The warm pool is in use for the training job.</p>
+   *             </li>
+   *             <li>
+   *                 <p>
+   *                   <code>Available</code>: The warm pool is available to reuse for a matching training job.</p>
+   *             </li>
+   *             <li>
+   *                 <p>
+   *                   <code>Reused</code>: The warm pool moved to a matching training job for reuse.</p>
+   *             </li>
+   *             <li>
+   *                 <p>
+   *                   <code>Terminated</code>: The warm pool is no longer available. Warm pools are unavailable if they are terminated by a user, terminated for a patch update, or terminated for exceeding the specified <code>KeepAlivePeriodInSeconds</code>.</p>
+   *             </li>
+   *          </ul>
+   */
+  Status: WarmPoolResourceStatus | string | undefined;
+
+  /**
+   * <p>The billable time in seconds used by the warm pool. Billable time refers to the absolute wall-clock
+   *             time.</p>
+   *         <p>Multiply <code>ResourceRetainedBillableTimeInSeconds</code> by the number of instances
+   *             (<code>InstanceCount</code>) in your training cluster to get the total compute time
+   *             SageMaker bills you if you run warm pool training. The formula is as follows:
+   *             <code>ResourceRetainedBillableTimeInSeconds * InstanceCount</code>.</p>
+   */
+  ResourceRetainedBillableTimeInSeconds?: number;
+
+  /**
+   * <p>The name of the matching training job that reused the warm pool.</p>
+   */
+  ReusedByJob?: string;
+}
+
 export interface DescribeTrainingJobResponse {
   /**
    * <p> Name of the model training job. </p>
@@ -3420,6 +3470,11 @@ export interface DescribeTrainingJobResponse {
    * <p>The environment variables to set in the Docker container.</p>
    */
   Environment?: Record<string, string>;
+
+  /**
+   * <p>The status of the warm pool associated with the training job.</p>
+   */
+  WarmPoolStatus?: WarmPoolStatus;
 }
 
 export interface DescribeTransformJobRequest {
@@ -8911,25 +8966,6 @@ export interface MonitoringScheduleSummary {
   MonitoringType?: MonitoringType | string;
 }
 
-export interface ListMonitoringSchedulesResponse {
-  /**
-   * <p>A JSON array in which each element is a summary for a monitoring schedule.</p>
-   */
-  MonitoringScheduleSummaries: MonitoringScheduleSummary[] | undefined;
-
-  /**
-   * <p>If the response is truncated, Amazon SageMaker returns this token. To retrieve the next set of jobs,
-   *          use it in the subsequent request.</p>
-   */
-  NextToken?: string;
-}
-
-export enum NotebookInstanceLifecycleConfigSortKey {
-  CREATION_TIME = "CreationTime",
-  LAST_MODIFIED_TIME = "LastModifiedTime",
-  NAME = "Name",
-}
-
 /**
  * @internal
  */
@@ -9491,6 +9527,13 @@ export const SecondaryStatusTransitionFilterSensitiveLog = (obj: SecondaryStatus
   ...obj,
 });
 
+/**
+ * @internal Returns a shallow copy of the given WarmPoolStatus with every field passed through unchanged.
+ */
+export const WarmPoolStatusFilterSensitiveLog = (obj: WarmPoolStatus): any => {
+  return { ...obj };
+};
+
 /**
  * @internal
  */
@@ -10680,10 +10723,3 @@ export const ListMonitoringSchedulesRequestFilterSensitiveLog = (obj: ListMonito
 export const MonitoringScheduleSummaryFilterSensitiveLog = (obj: MonitoringScheduleSummary): any => ({
   ...obj,
 });
-
-/**
- * @internal
- */
-export const ListMonitoringSchedulesResponseFilterSensitiveLog = (obj: ListMonitoringSchedulesResponse): any => ({
-  ...obj,
-});
diff --git a/clients/client-sagemaker/src/models/models_3.ts b/clients/client-sagemaker/src/models/models_3.ts
@@ -98,7 +98,7 @@ import {
   MetricData,
   ModelPackageGroupStatus,
   ModelPackageStatusDetails,
-  NotebookInstanceLifecycleConfigSortKey,
+  MonitoringScheduleSummary,
   NotebookInstanceStatus,
   PipelineExecutionStatus,
   PipelineExperimentConfig,
@@ -118,10 +118,31 @@ import {
   TrialComponentSource,
   TrialSource,
   UserProfileStatus,
+  WarmPoolResourceStatus,
+  WarmPoolStatus,
   Workforce,
   Workteam,
 } from "./models_2";
 
+export interface ListMonitoringSchedulesResponse {
+  /**
+   * <p>A JSON array in which each element is a summary for a monitoring schedule.</p>
+   */
+  MonitoringScheduleSummaries: MonitoringScheduleSummary[] | undefined;
+
+  /**
+   * <p>If the response is truncated, Amazon SageMaker returns this token. To retrieve the next set of results,
+   *          use it in the subsequent request.</p>
+   */
+  NextToken?: string;
+}
+
+export enum NotebookInstanceLifecycleConfigSortKey { // string enum; NOTE(review): presumably the sort field for listing lifecycle configs — confirm
+  CREATION_TIME = "CreationTime",
+  LAST_MODIFIED_TIME = "LastModifiedTime",
+  NAME = "Name",
+}
+
 export enum NotebookInstanceLifecycleConfigSortOrder {
   ASCENDING = "Ascending",
   DESCENDING = "Descending",
@@ -1479,6 +1500,11 @@ export interface ListTrainingJobsRequest {
    * <p>The sort order for results. The default is <code>Ascending</code>.</p>
    */
   SortOrder?: SortOrder | string;
+
+  /**
+   * <p>A filter that retrieves only training jobs with a specific warm pool status.</p>
+   */
+  WarmPoolStatusEquals?: WarmPoolResourceStatus | string;
 }
 
 /**
@@ -1516,6 +1542,11 @@ export interface TrainingJobSummary {
    * <p>The status of the training job.</p>
    */
   TrainingJobStatus: TrainingJobStatus | string | undefined;
+
+  /**
+   * <p>The status of the warm pool associated with the training job.</p>
+   */
+  WarmPoolStatus?: WarmPoolStatus;
 }
 
 export interface ListTrainingJobsResponse {
@@ -3066,6 +3097,16 @@ export interface RenderUiTemplateResponse {
   Errors: RenderingError[] | undefined;
 }
 
+/**
+ * <p>The subset of <code>ResourceConfig</code> used to update <code>KeepAlivePeriodInSeconds</code>. Other fields in the <code>ResourceConfig</code> cannot be updated.</p>
+ */
+export interface ResourceConfigForUpdate {
+  /**
+   * <p>The new <code>KeepAlivePeriodInSeconds</code> value for the <code>ResourceConfig</code>: the duration of time in seconds to retain configured resources in a warm pool for subsequent training jobs.</p>
+   */
+  KeepAlivePeriodInSeconds: number | undefined;
+}
+
 export interface RetryPipelineExecutionRequest {
   /**
    * <p>The Amazon Resource Name (ARN) of the pipeline execution.</p>
@@ -4960,6 +5001,11 @@ export interface UpdateTrainingJobRequest {
    *             metrics.</p>
    */
   ProfilerRuleConfigurations?: ProfilerRuleConfiguration[];
+
+  /**
+   * <p>The training job <code>ResourceConfig</code> to update warm pool retention length.</p>
+   */
+  ResourceConfig?: ResourceConfigForUpdate;
 }
 
 export interface UpdateTrainingJobResponse {
@@ -5256,6 +5302,13 @@ export interface SearchRequest {
   MaxResults?: number;
 }
 
+/**
+ * @internal Returns a shallow copy of the given ListMonitoringSchedulesResponse with every field passed through unchanged.
+ */
+export const ListMonitoringSchedulesResponseFilterSensitiveLog = (obj: ListMonitoringSchedulesResponse): any => {
+  return { ...obj };
+};
+
 /**
  * @internal
  */
@@ -5844,6 +5897,13 @@ export const RenderUiTemplateResponseFilterSensitiveLog = (obj: RenderUiTemplate
   ...obj,
 });
 
+/**
+ * @internal Returns a shallow copy of the given ResourceConfigForUpdate with every field passed through unchanged.
+ */
+export const ResourceConfigForUpdateFilterSensitiveLog = (obj: ResourceConfigForUpdate): any => {
+  return { ...obj };
+};
+
 /**
  * @internal
  */
diff --git a/clients/client-sagemaker/src/protocols/Aws_json1_1.ts b/clients/client-sagemaker/src/protocols/Aws_json1_1.ts
@@ -1392,7 +1392,6 @@ import {
   ListMonitoringExecutionsRequest,
   ListMonitoringExecutionsResponse,
   ListMonitoringSchedulesRequest,
-  ListMonitoringSchedulesResponse,
   MetricData,
   ModelConfiguration,
   ModelMetadataFilter,
@@ -1425,11 +1424,13 @@ import {
   TrialComponentSource,
   TrialSource,
   UiTemplateInfo,
+  WarmPoolStatus,
   Workforce,
   WorkforceVpcConfigResponse,
   Workteam,
 } from "../models/models_2";
 import {
+  ListMonitoringSchedulesResponse,
   ListNotebookInstanceLifecycleConfigsInput,
   ListNotebookInstanceLifecycleConfigsOutput,
   ListNotebookInstancesInput,
@@ -1502,6 +1503,7 @@ import {
   RenderingError,
   RenderUiTemplateRequest,
   RenderUiTemplateResponse,
+  ResourceConfigForUpdate,
   RetryPipelineExecutionRequest,
   RetryPipelineExecutionResponse,
   SearchExpression,
@@ -20136,6 +20138,7 @@ const serializeAws_json1_1ListTrainingJobsRequest = (input: ListTrainingJobsRequ
     ...(input.SortBy != null && { SortBy: input.SortBy }),
     ...(input.SortOrder != null && { SortOrder: input.SortOrder }),
     ...(input.StatusEquals != null && { StatusEquals: input.StatusEquals }),
+    ...(input.WarmPoolStatusEquals != null && { WarmPoolStatusEquals: input.WarmPoolStatusEquals }),
   };
 };
 
@@ -21598,11 +21601,18 @@ const serializeAws_json1_1ResourceConfig = (input: ResourceConfig, context: __Se
       InstanceGroups: serializeAws_json1_1InstanceGroups(input.InstanceGroups, context),
     }),
     ...(input.InstanceType != null && { InstanceType: input.InstanceType }),
+    ...(input.KeepAlivePeriodInSeconds != null && { KeepAlivePeriodInSeconds: input.KeepAlivePeriodInSeconds }),
     ...(input.VolumeKmsKeyId != null && { VolumeKmsKeyId: input.VolumeKmsKeyId }),
     ...(input.VolumeSizeInGB != null && { VolumeSizeInGB: input.VolumeSizeInGB }),
   };
 };
 
+// Builds the JSON payload for ResourceConfigForUpdate; KeepAlivePeriodInSeconds is emitted only when it is neither null nor undefined.
+const serializeAws_json1_1ResourceConfigForUpdate = (input: ResourceConfigForUpdate, context: __SerdeContext): any => {
+  const { KeepAlivePeriodInSeconds: keepAlivePeriod } = input;
+  return keepAlivePeriod != null ? { KeepAlivePeriodInSeconds: keepAlivePeriod } : {};
+};
+
 const serializeAws_json1_1ResourceLimits = (input: ResourceLimits, context: __SerdeContext): any => {
   return {
     ...(input.MaxNumberOfTrainingJobs != null && { MaxNumberOfTrainingJobs: input.MaxNumberOfTrainingJobs }),
@@ -22717,6 +22727,9 @@ const serializeAws_json1_1UpdateTrainingJobRequest = (
         context
       ),
     }),
+    ...(input.ResourceConfig != null && {
+      ResourceConfig: serializeAws_json1_1ResourceConfigForUpdate(input.ResourceConfig, context),
+    }),
     ...(input.TrainingJobName != null && { TrainingJobName: input.TrainingJobName }),
   };
 };
@@ -26646,6 +26659,8 @@ const deserializeAws_json1_1DescribeTrainingJobResponse = (
     TrainingTimeInSeconds: __expectInt32(output.TrainingTimeInSeconds),
     TuningJobArn: __expectString(output.TuningJobArn),
     VpcConfig: output.VpcConfig != null ? deserializeAws_json1_1VpcConfig(output.VpcConfig, context) : undefined,
+    WarmPoolStatus:
+      output.WarmPoolStatus != null ? deserializeAws_json1_1WarmPoolStatus(output.WarmPoolStatus, context) : undefined,
   } as any;
 };
 
@@ -32300,6 +32315,7 @@ const deserializeAws_json1_1ResourceConfig = (output: any, context: __SerdeConte
     InstanceGroups:
       output.InstanceGroups != null ? deserializeAws_json1_1InstanceGroups(output.InstanceGroups, context) : undefined,
     InstanceType: __expectString(output.InstanceType),
+    KeepAlivePeriodInSeconds: __expectInt32(output.KeepAlivePeriodInSeconds),
     VolumeKmsKeyId: __expectString(output.VolumeKmsKeyId),
     VolumeSizeInGB: __expectInt32(output.VolumeSizeInGB),
   } as any;
@@ -33009,6 +33025,8 @@ const deserializeAws_json1_1TrainingJobSummary = (output: any, context: __SerdeC
     TrainingJobArn: __expectString(output.TrainingJobArn),
     TrainingJobName: __expectString(output.TrainingJobName),
     TrainingJobStatus: __expectString(output.TrainingJobStatus),
+    WarmPoolStatus:
+      output.WarmPoolStatus != null ? deserializeAws_json1_1WarmPoolStatus(output.WarmPoolStatus, context) : undefined,
   } as any;
 };
 
@@ -33873,6 +33891,14 @@ const deserializeAws_json1_1VpcSecurityGroupIds = (output: any, context: __Serde
   return retVal;
 };
 
+// Maps a raw JSON object onto WarmPoolStatus: the billable time passes through __expectInt32, the other two fields through __expectString.
+const deserializeAws_json1_1WarmPoolStatus = (output: any, context: __SerdeContext): WarmPoolStatus => {
+  const ResourceRetainedBillableTimeInSeconds = __expectInt32(output.ResourceRetainedBillableTimeInSeconds);
+  const ReusedByJob = __expectString(output.ReusedByJob);
+  const Status = __expectString(output.Status);
+  return { ResourceRetainedBillableTimeInSeconds, ReusedByJob, Status } as any;
+};
+
 const deserializeAws_json1_1Workforce = (output: any, context: __SerdeContext): Workforce => {
   return {
     CognitoConfig:
diff --git a/codegen/sdk-codegen/aws-models/sagemaker.json b/codegen/sdk-codegen/aws-models/sagemaker.json

Original file line number	Diff line number	Diff line change
`@@ -10233,7 +10233,7 @@ export class SageMaker extends SageMakerClient {`
`10233`	`10233`	`}`
`10234`	`10234`
`10235`	`10235`	`/**`
`10236`		`- * <p>Update a model training job to request a new Debugger profiling configuration.</p>`
	`10236`	`+ * <p>Update a model training job to request a new Debugger profiling configuration or to change warm pool retention length.</p>`
`10237`	`10237`	`*/`
`10238`	`10238`	`public updateTrainingJob(`
`10239`	`10239`	`args: UpdateTrainingJobCommandInput,`