-
Notifications
You must be signed in to change notification settings - Fork 101
Add EI support to TFS container. #10
Changes from 1 commit
78b9479
4257a56
0a11fd3
66bfc3e
cdf51e5
9b7ff35
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -29,18 +29,14 @@ function get_aws_account() { | |
} | ||
|
||
function get_tfs_executable() { | ||
There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. Should this function utilize the parsed args below for the TF version? It also looks like the naming scheme isn't consistent for the zip file for 1.11 and 1.12 already, which might require updating this file often. There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. It only utilizes $version here, because the naming for v1.11 and v1.12 are: Even the v1.12's zip name and unzipped directory name are different. So I believe we will need to update this file in the future. There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. It seems like in S3 it is always going to follow the pattern of: s3://amazonei-tensorflow/Tensorflow\ Serving/{version}/Ubuntu. We can do a discovery on the item for example with: Afterwards, I think we can probably also discover the unzipped name as well. For example: There are probably better commands than the ones I used above in my examples. |
||
# default to v1.12 in accordance with defaults below | ||
s3_object='tfs_ei_v1_12_ubuntu' | ||
unzipped='v1_12_Ubuntu' | ||
zip_file=$(aws s3 ls 's3://amazonei-tensorflow/Tensorflow Serving/v'${version}'/Ubuntu/' | awk '{print $4}') | ||
aws s3 cp 's3://amazonei-tensorflow/Tensorflow Serving/v'${version}'/Ubuntu/'${zip_file} . | ||
|
||
if [ ${version} = '1.11' ]; then | ||
s3_object='Ubuntu' | ||
unzipped='Ubuntu' | ||
fi | ||
mkdir exec_dir | ||
unzip ${zip_file} -d exec_dir | ||
|
||
aws s3 cp 's3://amazonei-tensorflow/Tensorflow Serving/v'${version}'/Ubuntu/'${s3_object}'.zip' . | ||
unzip ${s3_object} && mv ${unzipped}/AmazonEI_Tensorflow_Serving_v${version}_v1 container/ | ||
rm ${s3_object}.zip && rm -rf ${unzipped} | ||
find . -name AmazonEI_TensorFlow_Serving_v${version}_v1* -exec mv {} container/ \; | ||
rm ${zip_file} && rm -rf exec_dir | ||
} | ||
|
||
function parse_std_args() { | ||
|
This file was deleted.
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -28,7 +28,7 @@ | |
|
||
def pytest_addoption(parser): | ||
parser.addoption('--aws-id') | ||
parser.addoption('--docker-base-name', default='sagemaker-tensorflow-serving') | ||
parser.addoption('--docker-base-name', default='functional-tensorflow-serving') | ||
There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. Is 'functional' meant to correspond to test/functional? There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. It's meant to be sagemaker-tensorflow-serving ... I just accidentally changed it to 'functional' for some reason I don't remember. |
||
parser.addoption('--instance-type') | ||
parser.addoption('--accelerator-type', default=None) | ||
parser.addoption('--region', default='us-west-2') | ||
|
@@ -94,7 +94,3 @@ def docker_image_uri(docker_registry, docker_image): | |
uri = '{}/{}'.format(docker_registry, docker_image) | ||
return uri | ||
|
||
|
||
@pytest.fixture(scope='session') | ||
def sagemaker_session(region): | ||
return Session(boto_session=boto3.Session(region_name=region)) |
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,114 @@ | ||
# Copyright 2018 Amazon.com, Inc. or its affiliates. All Rights Reserved. | ||
# | ||
# Licensed under the Apache License, Version 2.0 (the "License"). You | ||
# may not use this file except in compliance with the License. A copy of | ||
# the License is located at | ||
# | ||
# http://aws.amazon.com/apache2.0/ | ||
# | ||
# or in the "license" file accompanying this file. This file is | ||
# distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF | ||
# ANY KIND, either express or implied. See the License for the specific | ||
# language governing permissions and limitations under the License. | ||
import io | ||
import json | ||
import logging | ||
import time | ||
|
||
import boto3 | ||
import numpy as np | ||
|
||
import pytest | ||
|
||
# Regions where Elastic Inference accelerators are available.
EI_SUPPORTED_REGIONS = ['us-east-1', 'us-east-2', 'us-west-2', 'eu-west-1', 'ap-northeast-1', 'ap-northeast-2']

logger = logging.getLogger(__name__)

# Reduce noise from the AWS SDK internals; note some of these logger names
# include '.py' — presumably matching how those modules name their loggers
# (TODO confirm against the library's logging setup).
for _quiet_logger in ('boto3', 'botocore', 'factory.py', 'auth.py', 'connectionpool.py'):
    logging.getLogger(_quiet_logger).setLevel(logging.INFO)

# Keep verbose output from the session machinery and these functional tests.
logging.getLogger('session.py').setLevel(logging.DEBUG)
logging.getLogger('functional').setLevel(logging.DEBUG)
|
||
|
||
@pytest.fixture(autouse=True)
def skip_if_no_accelerator(accelerator_type):
    """Automatically skip every test in this module when no EI accelerator type was given."""
    if accelerator_type is not None:
        return
    pytest.skip('Skipping because accelerator type was not provided')
|
||
|
||
@pytest.fixture(autouse=True)
def skip_if_non_supported_ei_region(region):
    """Automatically skip every test in this module when the region has no EI support."""
    if region in EI_SUPPORTED_REGIONS:
        return
    pytest.skip('EI is not supported in {}'.format(region))
|
||
|
||
@pytest.fixture
def pretrained_model_data(region):
    """Return the S3 URI of the pre-trained ResNet-50 v2 sample model for *region*."""
    model_uri = 's3://sagemaker-sample-data-{}/tensorflow/model/resnet/resnet_50_v2_fp32_NCHW.tar.gz'.format(region)
    return model_uri
|
||
|
||
def _timestamp(): | ||
return time.strftime("%Y-%m-%d-%H-%M-%S") | ||
|
||
|
||
def _execution_role(session):
    """Look up the ARN of the pre-existing 'SageMakerRole' IAM role via *session*."""
    role = session.resource('iam').Role('SageMakerRole')
    return role.arn
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. should we consider adding an argparser for the role? |
||
|
||
|
||
def _production_variants(model_name, instance_type, accelerator_type): | ||
production_variants = [{ | ||
'VariantName': 'AllTraffic', | ||
'ModelName': model_name, | ||
'InitialInstanceCount': 1, | ||
'InstanceType': instance_type, | ||
'AcceleratorType': accelerator_type | ||
}] | ||
return production_variants | ||
|
||
|
||
# NOTE(review): these marks are no-ops — the skip logic already runs via the
# autouse fixtures of the same names; kept for readability/back-compat.
@pytest.mark.skip_if_non_supported_ei_region
@pytest.mark.skip_if_no_accelerator
def test_deploy_elastic_inference_with_pretrained_model(pretrained_model_data,
                                                        docker_image_uri,
                                                        instance_type,
                                                        accelerator_type):
    """Deploy a pre-trained model to an EI-backed SageMaker endpoint and invoke it.

    Creates a model, an endpoint config and an endpoint, waits until the
    endpoint is InService, sends a random NCHW-shaped JSON payload and checks
    that predictions come back. Fixes over the previous version: the endpoint,
    endpoint config AND model are always deleted (the config and model used to
    leak, and everything leaked when the invocation or assertion failed).
    """
    endpoint_name = 'test-tfs-ei-deploy-model-{}'.format(_timestamp())
    endpoint_config_name = 'test-tfs-endpoint-config-{}'.format(_timestamp())
    model_name = 'test-tfs-ei-model-{}'.format(_timestamp())

    session = boto3.Session()
    client = session.client('sagemaker')
    runtime_client = session.client('runtime.sagemaker')

    client.create_model(ModelName=model_name,
                        ExecutionRoleArn=_execution_role(session),
                        PrimaryContainer={
                            'Image': docker_image_uri,
                            'ModelDataUrl': pretrained_model_data
                        })

    logger.info('deploying model to endpoint: {}'.format(endpoint_name))

    client.create_endpoint_config(
        EndpointConfigName=endpoint_config_name,
        ProductionVariants=_production_variants(model_name, instance_type, accelerator_type))

    client.create_endpoint(EndpointName=endpoint_name,
                           EndpointConfigName=endpoint_config_name)

    try:
        try:
            client.get_waiter('endpoint_in_service').wait(EndpointName=endpoint_name)
        finally:
            # Surface a clear failure message when the endpoint never came up;
            # when the waiter raised but the endpoint IS in service, the
            # waiter's own error propagates (same semantics as before).
            status = client.describe_endpoint(EndpointName=endpoint_name)['EndpointStatus']
            if status != 'InService':
                raise Exception('Failed to create endpoint.')

        # Shape chosen to match the model's NCHW input; values are arbitrary.
        input_data = {'instances': np.random.rand(1, 1, 3, 3).tolist()}

        response = runtime_client.invoke_endpoint(EndpointName=endpoint_name,
                                                  ContentType='application/json',
                                                  Body=json.dumps(input_data))
        result = json.loads(response['Body'].read().decode())
        assert result['predictions'] is not None
    finally:
        # Always clean up, in dependency order: endpoint, then its config,
        # then the model (config/model deletion was missing before).
        client.delete_endpoint(EndpointName=endpoint_name)
        client.delete_endpoint_config(EndpointConfigName=endpoint_config_name)
        client.delete_model(ModelName=model_name)
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. delete_endpoint should clear endpoint_config too |
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
can you provide an example of the command needed to run the test?
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
"To test against Elastic Inference, you will..."
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
I'll update these as well as the above comments.