aws
diff --git a/src/sagemaker/estimator.py b/src/sagemaker/estimator.py
Lines changed: 7 additions & 1 deletion
diff --git a/src/sagemaker/image_uri_config/huggingface.json b/src/sagemaker/image_uri_config/huggingface.json
Lines changed: 68 additions & 1 deletion
diff --git a/tests/unit/sagemaker/model/test_framework_model.py b/tests/unit/sagemaker/model/test_framework_model.py
Lines changed: 2 additions & 2 deletions
diff --git a/tests/unit/sagemaker/tensorflow/test_estimator.py b/tests/unit/sagemaker/tensorflow/test_estimator.py
Lines changed: 2 additions & 2 deletions
diff --git a/tests/unit/sagemaker/tensorflow/test_estimator_init.py b/tests/unit/sagemaker/tensorflow/test_estimator_init.py
Lines changed: 1 addition & 1 deletion
diff --git a/tests/unit/sagemaker/workflow/test_steps.py b/tests/unit/sagemaker/workflow/test_steps.py
Lines changed: 92 additions & 1 deletion
diff --git a/tests/unit/test_amazon_estimator.py b/tests/unit/test_amazon_estimator.py
Lines changed: 6 additions & 6 deletions
diff --git a/tests/unit/test_chainer.py b/tests/unit/test_chainer.py
Lines changed: 2 additions & 2 deletions
diff --git a/tests/unit/test_estimator.py b/tests/unit/test_estimator.py
Lines changed: 3 additions & 3 deletions
diff --git a/tests/unit/test_fm.py b/tests/unit/test_fm.py
Lines changed: 1 addition & 1 deletion
diff --git a/tests/unit/test_image.py b/tests/unit/test_image.py
Lines changed: 3 additions & 3 deletions
@@ -2443,7 +2443,13 @@ def attach(cls, training_job_name, sagemaker_session=None, model_channel_name="m
     @staticmethod
     def _json_encode_hyperparameters(hyperparameters):
         """Placeholder docstring"""
-        return {str(k): json.dumps(v) for (k, v) in hyperparameters.items()}
+        if hyperparameters is None:
+            return None
+        workflow_types = (Parameter, Expression, Properties)  # kept as-is, not JSON-encoded
+        return {
+            str(name): (value if isinstance(value, workflow_types) else json.dumps(value))
+            for name, value in hyperparameters.items()
+        }
 
     @classmethod
     def _update_init_params(cls, hp, tf_arguments):
 
@@ -2,7 +2,8 @@
     "training": {
         "processors": ["gpu"],
         "version_aliases": {
-            "4.4": "4.4.2"
+            "4.4": "4.4.2",
+            "4.5": "4.5.0"
         },
         "versions": {
             "4.4.2": {
@@ -70,6 +71,72 @@
                     },
                     "repository": "huggingface-tensorflow-training"
                 }
+            },
+            "4.5.0": {
+                "version_aliases": {
+                    "pytorch1.6": "pytorch1.6.0",
+                    "tensorflow2.4": "tensorflow2.4.1"
+                },
+                "pytorch1.6.0": {
+                    "py_versions": ["py36"],
+                    "registries": {
+                        "af-south-1": "626614931356",
+                        "ap-east-1": "871362719292",
+                        "ap-northeast-1": "763104351884",
+                        "ap-northeast-2": "763104351884",
+                        "ap-south-1": "763104351884",
+                        "ap-southeast-1": "763104351884",
+                        "ap-southeast-2": "763104351884",
+                        "ca-central-1": "763104351884",
+                        "cn-north-1": "727897471807",
+                        "cn-northwest-1": "727897471807",
+                        "eu-central-1": "763104351884",
+                        "eu-north-1": "763104351884",
+                        "eu-west-1": "763104351884",
+                        "eu-west-2": "763104351884",
+                        "eu-west-3": "763104351884",
+                        "eu-south-1": "692866216735",
+                        "me-south-1": "217643126080",
+                        "sa-east-1": "763104351884",
+                        "us-east-1": "763104351884",
+                        "us-east-2": "763104351884",
+                        "us-gov-west-1": "442386744353",
+                        "us-iso-east-1": "886529160074",
+                        "us-west-1": "763104351884",
+                        "us-west-2": "763104351884"
+                    },
+                    "repository": "huggingface-pytorch-training"
+                },
+                "tensorflow2.4.1": {
+                    "py_versions": ["py37"],
+                    "registries": {
+                        "af-south-1": "626614931356",
+                        "ap-east-1": "871362719292",
+                        "ap-northeast-1": "763104351884",
+                        "ap-northeast-2": "763104351884",
+                        "ap-south-1": "763104351884",
+                        "ap-southeast-1": "763104351884",
+                        "ap-southeast-2": "763104351884",
+                        "ca-central-1": "763104351884",
+                        "cn-north-1": "727897471807",
+                        "cn-northwest-1": "727897471807",
+                        "eu-central-1": "763104351884",
+                        "eu-north-1": "763104351884",
+                        "eu-south-1": "692866216735",
+                        "eu-west-1": "763104351884",
+                        "eu-west-2": "763104351884",
+                        "eu-west-3": "763104351884",
+                        "me-south-1": "217643126080",
+                        "sa-east-1": "763104351884",
+                        "us-east-1": "763104351884",
+                        "us-east-2": "763104351884",
+                        "us-gov-west-1": "442386744353",
+                        "us-iso-east-1": "886529160074",
+                        "us-west-1": "763104351884",
+                        "us-west-2": "763104351884"
+                    },
+                    "repository": "huggingface-tensorflow-training"
+                }
             }
         }
     }
 
@@ -56,7 +56,7 @@ def __init__(self, sagemaker_session, **kwargs):
             ROLE,
             ENTRY_POINT,
             sagemaker_session=sagemaker_session,
-            **kwargs
+            **kwargs,
         )
 
     def create_predictor(self, endpoint_name):
@@ -71,7 +71,7 @@ def __init__(self, sagemaker_session, entry_point, **kwargs):
             ROLE,
             entry_point=entry_point,
             sagemaker_session=sagemaker_session,
-            **kwargs
+            **kwargs,
         )
 
     def create_predictor(self, endpoint_name):
 
@@ -159,7 +159,7 @@ def _build_tf(
     py_version=None,
     instance_type=None,
     base_job_name=None,
-    **kwargs
+    **kwargs,
 ):
     return TensorFlow(
         entry_point=SCRIPT_PATH,
@@ -170,7 +170,7 @@ def _build_tf(
         instance_count=INSTANCE_COUNT,
         instance_type=instance_type if instance_type else INSTANCE_TYPE,
         base_job_name=base_job_name,
-        **kwargs
+        **kwargs,
     )
 
 
 
@@ -35,7 +35,7 @@ def _build_tf(sagemaker_session, **kwargs):
         role="dummy-role",
         instance_count=1,
         instance_type="ml.c4.xlarge",
-        **kwargs
+        **kwargs,
     )
 
 
 
@@ -15,6 +15,7 @@
 
 import pytest
 import sagemaker
+import os
 
 from mock import (
     Mock,
@@ -24,6 +25,7 @@
 
 from sagemaker.debugger import ProfilerConfig
 from sagemaker.estimator import Estimator
+from sagemaker.tensorflow import TensorFlow
 from sagemaker.inputs import TrainingInput, TransformInput, CreateModelInput
 from sagemaker.model import Model
 from sagemaker.processing import (
@@ -45,6 +47,10 @@
     CreateModelStep,
     CacheConfig,
 )
+from tests.unit import DATA_DIR
+
+SCRIPT_FILE = "dummy_script.py"
+SCRIPT_PATH = os.path.join(DATA_DIR, SCRIPT_FILE)
 
 REGION = "us-west-2"
 BUCKET = "my-bucket"
@@ -112,7 +118,7 @@ def test_custom_step():
     assert step.to_request() == {"Name": "MyStep", "Type": "Training", "Arguments": dict()}
 
 
-def test_training_step(sagemaker_session):
+def test_training_step_base_estimator(sagemaker_session):
     instance_type_parameter = ParameterString(name="InstanceType", default_value="c4.4xlarge")
     instance_count_parameter = ParameterInteger(name="InstanceCount", default_value=1)
     data_source_uri_parameter = ParameterString(
@@ -177,6 +183,91 @@ def test_training_step(sagemaker_session):
     assert step.properties.TrainingJobName.expr == {"Get": "Steps.MyTrainingStep.TrainingJobName"}
 
 
+def test_training_step_tensorflow(sagemaker_session):
+    instance_type_parameter = ParameterString(name="InstanceType", default_value="ml.p3.16xlarge")
+    instance_count_parameter = ParameterInteger(name="InstanceCount", default_value=1)
+    data_source_uri_parameter = ParameterString(
+        name="DataSourceS3Uri", default_value=f"s3://{BUCKET}/train_manifest"
+    )
+    training_epochs_parameter = ParameterInteger(name="TrainingEpochs", default_value=5)
+    training_batch_size_parameter = ParameterInteger(name="TrainingBatchSize", default_value=500)
+    estimator = TensorFlow(
+        entry_point=os.path.join(DATA_DIR, SCRIPT_FILE),
+        role=ROLE,
+        model_dir=False,
+        image_uri=IMAGE_URI,
+        source_dir="s3://mybucket/source",
+        framework_version="2.4.1",
+        py_version="py37",
+        instance_count=instance_count_parameter,
+        instance_type=instance_type_parameter,
+        sagemaker_session=sagemaker_session,
+        # subnets=subnets,
+        hyperparameters={
+            "batch-size": training_batch_size_parameter,
+            "epochs": training_epochs_parameter,
+        },
+        # security_group_ids=security_group_ids,
+        debugger_hook_config=False,
+        # Training using SMDataParallel Distributed Training Framework
+        distribution={"smdistributed": {"dataparallel": {"enabled": True}}},
+    )
+
+    inputs = TrainingInput(s3_data=data_source_uri_parameter)
+    cache_config = CacheConfig(enable_caching=True, expire_after="PT1H")
+    step = TrainingStep(
+        name="MyTrainingStep", estimator=estimator, inputs=inputs, cache_config=cache_config
+    )
+    step_request = step.to_request()
+    step_request["Arguments"]["HyperParameters"].pop("sagemaker_job_name", None)
+    step_request["Arguments"]["HyperParameters"].pop("sagemaker_program", None)
+    step_request["Arguments"].pop("ProfilerRuleConfigurations", None)
+    assert step_request == {
+        "Name": "MyTrainingStep",
+        "Type": "Training",
+        "Arguments": {
+            "AlgorithmSpecification": {
+                "TrainingInputMode": "File",
+                "TrainingImage": "fakeimage",
+                "EnableSageMakerMetricsTimeSeries": True,
+            },
+            "OutputDataConfig": {"S3OutputPath": "s3://my-bucket/"},
+            "StoppingCondition": {"MaxRuntimeInSeconds": 86400},
+            "ResourceConfig": {
+                "InstanceCount": instance_count_parameter,
+                "InstanceType": instance_type_parameter,
+                "VolumeSizeInGB": 30,
+            },
+            "RoleArn": "DummyRole",
+            "InputDataConfig": [
+                {
+                    "DataSource": {
+                        "S3DataSource": {
+                            "S3DataType": "S3Prefix",
+                            "S3Uri": data_source_uri_parameter,
+                            "S3DataDistributionType": "FullyReplicated",
+                        }
+                    },
+                    "ChannelName": "training",
+                }
+            ],
+            "HyperParameters": {
+                "batch-size": training_batch_size_parameter,
+                "epochs": training_epochs_parameter,
+                "sagemaker_submit_directory": '"s3://mybucket/source"',
+                "sagemaker_container_log_level": "20",
+                "sagemaker_region": '"us-west-2"',
+                "sagemaker_distributed_dataparallel_enabled": "true",
+                "sagemaker_instance_type": instance_type_parameter,
+                "sagemaker_distributed_dataparallel_custom_mpi_options": '""',
+            },
+            "ProfilerConfig": {"S3OutputPath": "s3://my-bucket/"},
+        },
+        "CacheConfig": {"Enabled": True, "ExpireAfter": "PT1H"},
+    }
+    assert step.properties.TrainingJobName.expr == {"Get": "Steps.MyTrainingStep.TrainingJobName"}
+
+
 def test_processing_step(sagemaker_session):
     processing_input_data_uri_parameter = ParameterString(
         name="ProcessingInputDataUri", default_value=f"s3://{BUCKET}/processing_manifest"
 
@@ -86,7 +86,7 @@ def test_init_enable_network_isolation(sagemaker_session):
         num_components=55,
         sagemaker_session=sagemaker_session,
         enable_network_isolation=True,
-        **COMMON_ARGS
+        **COMMON_ARGS,
     )
     assert pca.num_components == 55
     assert pca.enable_network_isolation() is True
@@ -99,7 +99,7 @@ def test_init_all_pca_hyperparameters(sagemaker_session):
         subtract_mean=True,
         extra_components=33,
         sagemaker_session=sagemaker_session,
-        **COMMON_ARGS
+        **COMMON_ARGS,
     )
     assert pca.num_components == 55
     assert pca.algorithm_mode == "randomized"
@@ -112,7 +112,7 @@ def test_init_estimator_args(sagemaker_session):
         max_run=1234,
         sagemaker_session=sagemaker_session,
         data_location="s3://some-bucket/some-key/",
-        **COMMON_ARGS
+        **COMMON_ARGS,
     )
     assert pca.instance_type == COMMON_ARGS["instance_type"]
     assert pca.instance_count == COMMON_ARGS["instance_count"]
@@ -133,7 +133,7 @@ def test_data_location_does_not_call_default_bucket(sagemaker_session):
         num_components=2,
         sagemaker_session=sagemaker_session,
         data_location=data_location,
-        **COMMON_ARGS
+        **COMMON_ARGS,
     )
     assert pca.data_location == data_location
     assert not sagemaker_session.default_bucket.called
@@ -205,7 +205,7 @@ def test_fit_ndarray(time, sagemaker_session):
         num_components=55,
         sagemaker_session=sagemaker_session,
         data_location="s3://{}/key-prefix/".format(BUCKET_NAME),
-        **kwargs
+        **kwargs,
     )
     train = [[1.0, 2.0, 3.0], [4.0, 5.0, 6.0], [7.0, 8.0, 8.0], [44.0, 55.0, 66.0]]
     labels = [99, 85, 87, 2]
@@ -233,7 +233,7 @@ def test_fit_pass_experiment_config(sagemaker_session):
         num_components=55,
         sagemaker_session=sagemaker_session,
         data_location="s3://{}/key-prefix/".format(BUCKET_NAME),
-        **kwargs
+        **kwargs,
     )
     train = [[1.0, 2.0, 3.0], [4.0, 5.0, 6.0], [7.0, 8.0, 8.0], [44.0, 55.0, 66.0]]
     labels = [99, 85, 87, 2]
 
@@ -88,7 +88,7 @@ def _chainer_estimator(
     num_processes=None,
     process_slots_per_host=None,
     additional_mpi_options=None,
-    **kwargs
+    **kwargs,
 ):
     return Chainer(
         entry_point=SCRIPT_PATH,
@@ -103,7 +103,7 @@ def _chainer_estimator(
         num_processes=num_processes,
         process_slots_per_host=process_slots_per_host,
         additional_mpi_options=additional_mpi_options,
-        **kwargs
+        **kwargs,
     )
 
 
 
@@ -140,7 +140,7 @@ def create_model(
         vpc_config_override=vpc_utils.VPC_CONFIG_DEFAULT,
         enable_network_isolation=None,
         model_dir=None,
-        **kwargs
+        **kwargs,
     ):
         if enable_network_isolation is None:
             enable_network_isolation = self.enable_network_isolation()
@@ -151,7 +151,7 @@ def create_model(
             entry_point=entry_point,
             enable_network_isolation=enable_network_isolation,
             role=role,
-            **kwargs
+            **kwargs,
         )
 
     @classmethod
@@ -171,7 +171,7 @@ def __init__(self, sagemaker_session, entry_point=None, role=ROLE, **kwargs):
             role,
             entry_point or ENTRY_POINT,
             sagemaker_session=sagemaker_session,
-            **kwargs
+            **kwargs,
         )
 
     def create_predictor(self, endpoint_name):
 
@@ -115,7 +115,7 @@ def test_all_hyperparameters(sagemaker_session):
         factors_init_scale=1.101,
         factors_init_sigma=1.202,
         factors_init_value=1.303,
-        **ALL_REQ_ARGS
+        **ALL_REQ_ARGS,
     )
     assert fm.hyperparameters() == dict(
         num_factors=str(ALL_REQ_ARGS["num_factors"]),
 
@@ -751,10 +751,10 @@ def test_ecr_login_needed(check_output):
     token_response = "AWS:%s" % token
     b64_token = base64.b64encode(token_response.encode("utf-8"))
     response = {
-        u"authorizationData": [
+        "authorizationData": [
             {
-                u"authorizationToken": b64_token,
-                u"proxyEndpoint": u"https://520713654638.dkr.ecr.us-east-1.amazonaws.com",
+                "authorizationToken": b64_token,
+                "proxyEndpoint": "https://520713654638.dkr.ecr.us-east-1.amazonaws.com",
             }
         ],
         "ResponseMetadata": {
Original file line number	Diff line number	Diff line change
`@@ -35,7 +35,7 @@ def _build_tf(sagemaker_session, **kwargs):`
`35`	`35`	`role="dummy-role",`
`36`	`36`	`instance_count=1,`
`37`	`37`	`instance_type="ml.c4.xlarge",`
`38`		`- **kwargs`
	`38`	`+ **kwargs,`
`39`	`39`	`)`
`40`	`40`
`41`	`41`
Original file line number	Diff line number	Diff line change
`@@ -115,7 +115,7 @@ def test_all_hyperparameters(sagemaker_session):`
`115`	`115`	`factors_init_scale=1.101,`
`116`	`116`	`factors_init_sigma=1.202,`
`117`	`117`	`factors_init_value=1.303,`
`118`		`- **ALL_REQ_ARGS`
	`118`	`+ **ALL_REQ_ARGS,`
`119`	`119`	`)`
`120`	`120`	`assert fm.hyperparameters() == dict(`
`121`	`121`	`num_factors=str(ALL_REQ_ARGS["num_factors"]),`
Original file line number	Diff line number	Diff line change
`@@ -751,10 +751,10 @@ def test_ecr_login_needed(check_output):`
`751`	`751`	`token_response = "AWS:%s" % token`
`752`	`752`	`b64_token = base64.b64encode(token_response.encode("utf-8"))`
`753`	`753`	`response = {`
`754`		`- u"authorizationData": [`
	`754`	`+ "authorizationData": [`
`755`	`755`	`{`
`756`		`- u"authorizationToken": b64_token,`
`757`		`- u"proxyEndpoint": u"https://520713654638.dkr.ecr.us-east-1.amazonaws.com",`
	`756`	`+ "authorizationToken": b64_token,`
	`757`	`+ "proxyEndpoint": "https://520713654638.dkr.ecr.us-east-1.amazonaws.com",`
`758`	`758`	`}`
`759`	`759`	`],`
`760`	`760`	`"ResponseMetadata": {`