
Commit 767e58a

Merge pull request aws#23 from awslabs/tf_byom
Tensorflow Bring Your Own Model. Merging in preparation for tomorrow's meeting.
2 parents 826f254 + c16d216 commit 767e58a

File tree

5 files changed: +626 −0 lines changed

README.md

Lines changed: 1 addition & 0 deletions
@@ -18,3 +18,4 @@ This repository contains example notebooks that show how to apply machine learni
 - [Installing the R Kernel](install_r_kernel) shows how to install the R kernel into an Amazon SageMaker Notebook Instance.
 - [Bring Your Own Model for k-means](kmeans_bring_your_own_model) shows how to take a model that's been fit elsewhere and use Amazon SageMaker containers to host it.
 - [Bring Your Own Algorithm with R](r_bring_your_own) shows how to bring your own algorithm container to Amazon SageMaker using the R language.
+- [Bring Your Own TensorFlow Model](sagemaker-python-sdk/tensorflow_iris_byom) shows how to bring a model trained anywhere into Amazon SageMaker.
mnist.py

Lines changed: 52 additions & 0 deletions
@@ -0,0 +1,52 @@
import logging
import os

import mxnet as mx


def find_file(root_path, file_name):
    """Walk root_path and return the full path of the first file matching file_name."""
    for root, dirs, files in os.walk(root_path):
        if file_name in files:
            return os.path.join(root, file_name)


def build_graph():
    """Define a simple multi-layer perceptron for 10-class digit classification."""
    data = mx.sym.var('data')
    data = mx.sym.flatten(data=data)
    fc1 = mx.sym.FullyConnected(data=data, num_hidden=128)
    act1 = mx.sym.Activation(data=fc1, act_type="relu")
    fc2 = mx.sym.FullyConnected(data=act1, num_hidden=64)
    act2 = mx.sym.Activation(data=fc2, act_type="relu")
    fc3 = mx.sym.FullyConnected(data=act2, num_hidden=10)
    return mx.sym.SoftmaxOutput(data=fc3, name='softmax')


def train(data, hyperparameters=None, num_cpus=0, num_gpus=1, **kwargs):
    """Fit the MLP on the MNIST arrays in `data` and return the trained module."""
    if hyperparameters is None:
        hyperparameters = {'learning_rate': 0.1}
    train_labels = data['train_label']
    train_images = data['train_data']
    test_labels = data['test_label']
    test_images = data['test_data']
    batch_size = 100
    train_iter = mx.io.NDArrayIter(train_images, train_labels, batch_size, shuffle=True)
    val_iter = mx.io.NDArrayIter(test_images, test_labels, batch_size)
    logging.getLogger().setLevel(logging.DEBUG)
    mlp_model = mx.mod.Module(
        symbol=build_graph(),
        context=get_train_context(num_cpus, num_gpus))
    mlp_model.fit(train_iter,
                  eval_data=val_iter,
                  optimizer='sgd',
                  optimizer_params={'learning_rate': float(hyperparameters.get("learning_rate", 0.1))},
                  eval_metric='acc',
                  batch_end_callback=mx.callback.Speedometer(batch_size, 100),
                  num_epoch=10)
    return mlp_model


def get_train_context(num_cpus, num_gpus):
    """Train on GPU if any are requested, otherwise on CPU."""
    if num_gpus > 0:
        return mx.gpu()
    return mx.cpu()
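
For orientation, here is a minimal sketch of how this entry point can be exercised locally, mirroring what the notebook below does; the ``num_gpus=0`` override and the ``score`` call are illustrative additions, not part of the commit:

import mxnet as mx
from mnist import train

# MXNet's built-in loader returns a dict with 'train_data', 'train_label',
# 'test_data', and 'test_label' keys, which is the shape train() expects.
data = mx.test_utils.get_mnist()

# Force CPU training on an instance without GPUs.
model = train(data=data, num_gpus=0)

# Evaluate the fitted module on the held-out set.
val_iter = mx.io.NDArrayIter(data['test_data'], data['test_label'], batch_size=100)
print(model.score(val_iter, 'acc'))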
Lines changed: 225 additions & 0 deletions
@@ -0,0 +1,225 @@
{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# MXNet MNIST BYOM: Train locally and deploy on Amazon SageMaker."
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "In this notebook, we train a model locally on the notebook instance, then deploy it and predict from Amazon SageMaker. This extends easily to a model trained anywhere else: all that is needed is the exported model file and the entry-point file containing the model definitions.\n",
    "\n",
    "First, download the MNIST data using the MXNet utilities."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "import mxnet as mx\n",
    "data = mx.test_utils.get_mnist()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "collapsed": true
   },
   "source": [
    "Train a typical MXNet model, using the ``train`` function from ``mnist.py`` (a simple multi-layer perceptron)."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "from mnist import train\n",
    "model = train(data=data)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Export the model and save it to disk. As in the TensorFlow example, a particular directory structure must be followed, which the following code sets up."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "import os\n",
    "os.mkdir('model')\n",
    "model.save_checkpoint('model/model', 0)\n",
    "import tarfile\n",
    "with tarfile.open('model.tar.gz', mode='w:gz') as archive:\n",
    "    archive.add('model', recursive=True)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Open a SageMaker session and upload the model to the default S3 bucket."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "import sagemaker\n",
    "\n",
    "sagemaker_session = sagemaker.Session()\n",
    "inputs = sagemaker_session.upload_data(path='model.tar.gz', key_prefix='model')"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Use ``sagemaker.mxnet.model.MXNetModel`` to create a new model that can be deployed."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "from sagemaker.mxnet.model import MXNetModel\n",
    "sagemaker_model = MXNetModel(model_data='s3://' + sagemaker_session.default_bucket() + '/model/model.tar.gz',\n",
    "                             role='<<set role here>>',\n",
    "                             entry_point='mnist.py')"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Deploy the model."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "predictor = sagemaker_model.deploy(initial_instance_count=1,\n",
    "                                   instance_type='ml.c4.xlarge')"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "We can now use this predictor to classify handwritten digits."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "predict_sample = data['test_data'][0][0]\n",
    "response = predictor.predict(predict_sample)\n",
    "print('Raw prediction result:')\n",
    "print(response)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "collapsed": true
   },
   "source": [
    "(Optional) Delete the endpoint."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "print(predictor.endpoint)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "import sagemaker\n",
    "\n",
    "sagemaker.Session().delete_endpoint(predictor.endpoint)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "os.remove('model.tar.gz')\n",
    "import shutil\n",
    "shutil.rmtree('model')"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.6.3"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
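
One detail worth spelling out from the export cell above: ``save_checkpoint('model/model', 0)`` writes the graph to ``model/model-symbol.json`` and the weights to ``model/model-0000.params``, and it is this layout, tarred from the top level, that ``MXNetModel`` consumes. A quick sanity check (illustrative, not part of the commit):

import tarfile

# Inspect the archive built by the notebook; it should contain the 'model'
# directory plus model-symbol.json (the graph) and model-0000.params (the weights).
with tarfile.open('model.tar.gz') as archive:
    print(archive.getnames())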
Lines changed: 41 additions & 0 deletions
@@ -0,0 +1,41 @@
import os

import numpy as np
import tensorflow as tf

INPUT_TENSOR_NAME = 'x'


def estimator_fn(run_config, params):
    """Return a three-layer DNN classifier over the four iris features."""
    feature_columns = [tf.feature_column.numeric_column(INPUT_TENSOR_NAME, shape=[4])]
    return tf.estimator.DNNClassifier(feature_columns=feature_columns,
                                      hidden_units=[10, 20, 10],
                                      n_classes=3,
                                      config=run_config)


def serving_input_fn():
    """Define the features the model server expects at inference time."""
    feature_spec = {INPUT_TENSOR_NAME: tf.FixedLenFeature(dtype=tf.float32, shape=[4])}
    return tf.estimator.export.build_parsing_serving_input_receiver_fn(feature_spec)()


def train_input_fn(training_dir, params):
    """Return the input function that feeds the model during training."""
    return _generate_input_fn(training_dir, 'iris_training.csv')


def eval_input_fn(training_dir, params):
    """Return the input function that feeds the model during evaluation."""
    return _generate_input_fn(training_dir, 'iris_test.csv')


def _generate_input_fn(training_dir, training_filename):
    # Load the headered iris CSV into (features, targets) arrays.
    training_set = tf.contrib.learn.datasets.base.load_csv_with_header(
        filename=os.path.join(training_dir, training_filename),
        target_dtype=np.int,
        features_dtype=np.float32)

    return tf.estimator.inputs.numpy_input_fn(
        x={INPUT_TENSOR_NAME: np.array(training_set.data)},
        y=np.array(training_set.target),
        num_epochs=None,
        shuffle=True)
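
For completeness, a minimal local sketch of how these functions fit together, assuming the file is saved as ``iris_dnn_classifier.py`` (the module name is an assumption) and that ``iris_training.csv``/``iris_test.csv`` have been downloaded into ``./data``; all calls are TensorFlow 1.x estimator APIs, matching the script:

import tensorflow as tf
from iris_dnn_classifier import estimator_fn, train_input_fn, serving_input_fn

# Build the DNNClassifier and train it on the local CSV for a fixed step budget.
estimator = estimator_fn(run_config=tf.estimator.RunConfig(), params=None)
estimator.train(input_fn=train_input_fn('data', params=None), steps=1000)

# Export a SavedModel; 'export/Servo' follows the directory layout the
# SageMaker TensorFlow container looks for when hosting a pre-trained model.
estimator.export_savedmodel('export/Servo', serving_input_fn)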
