aws
diff --git a/‎.github/ISSUE_TEMPLATE/bug_report.md
Lines changed: 5 additions & 2 deletions b/‎.github/ISSUE_TEMPLATE/bug_report.md
Lines changed: 5 additions & 2 deletions
diff --git a/‎README.md
Lines changed: 1 addition & 1 deletion b/‎README.md
Lines changed: 1 addition & 1 deletion
diff --git a/‎aws_marketplace/README.md
Lines changed: 1 addition & 0 deletions b/‎aws_marketplace/README.md
Lines changed: 1 addition & 0 deletions
diff --git a/‎aws_marketplace/using_model_packages/data_quality_monitoring/data/baseline.csv
Lines changed: 301 additions & 0 deletions b/‎aws_marketplace/using_model_packages/data_quality_monitoring/data/baseline.csv
Lines changed: 301 additions & 0 deletions
diff --git a/‎aws_marketplace/using_model_packages/data_quality_monitoring/data/data_quality_drift.csv
Lines changed: 320 additions & 0 deletions b/‎aws_marketplace/using_model_packages/data_quality_monitoring/data/data_quality_drift.csv
Lines changed: 320 additions & 0 deletions
diff --git a/‎aws_marketplace/using_model_packages/data_quality_monitoring/images/s4-1-sm-studio-visualize-results-v2.png
28.4 KB b/‎aws_marketplace/using_model_packages/data_quality_monitoring/images/s4-1-sm-studio-visualize-results-v2.png
28.4 KB
diff --git a/‎aws_marketplace/using_model_packages/data_quality_monitoring/images/s4-2-monitoring-job-report-details.png
56.4 KB b/‎aws_marketplace/using_model_packages/data_quality_monitoring/images/s4-2-monitoring-job-report-details.png
56.4 KB
diff --git a/‎aws_marketplace/using_model_packages/data_quality_monitoring/images/s4-3-mm_visualize_inf_vs_baseline_stats-v2.png
67.7 KB b/‎aws_marketplace/using_model_packages/data_quality_monitoring/images/s4-3-mm_visualize_inf_vs_baseline_stats-v2.png
67.7 KB
diff --git a/‎aws_marketplace/using_model_packages/data_quality_monitoring/images/s4-3-mm_visualize_inf_vs_baseline_stats_chart-v2.png
94.4 KB b/‎aws_marketplace/using_model_packages/data_quality_monitoring/images/s4-3-mm_visualize_inf_vs_baseline_stats_chart-v2.png
94.4 KB
diff --git a/‎aws_marketplace/using_model_packages/data_quality_monitoring/monitoring_data_quality_of_models.ipynb
Lines changed: 776 additions & 0 deletions b/‎aws_marketplace/using_model_packages/data_quality_monitoring/monitoring_data_quality_of_models.ipynb
Lines changed: 776 additions & 0 deletions
diff --git a/‎aws_marketplace/using_model_packages/data_quality_monitoring/src/model_package_arns.py
Lines changed: 23 additions & 0 deletions b/‎aws_marketplace/using_model_packages/data_quality_monitoring/src/model_package_arns.py
Lines changed: 23 additions & 0 deletions
diff --git a/‎aws_sagemaker_studio/introduction_to_amazon_algorithms/xgboost_abalone/xgboost_abalone_dist_script_mode.ipynb
Lines changed: 19 additions & 10 deletions b/‎aws_sagemaker_studio/introduction_to_amazon_algorithms/xgboost_abalone/xgboost_abalone_dist_script_mode.ipynb
Lines changed: 19 additions & 10 deletions
diff --git a/‎aws_sagemaker_studio/introduction_to_amazon_algorithms/xgboost_abalone/xgboost_managed_spot_training.ipynb
Lines changed: 35 additions & 28 deletions b/‎aws_sagemaker_studio/introduction_to_amazon_algorithms/xgboost_abalone/xgboost_managed_spot_training.ipynb
Lines changed: 35 additions & 28 deletions
diff --git a/‎frameworks/mxnet/code/config.json
Lines changed: 1 addition & 0 deletions b/‎frameworks/mxnet/code/config.json
Lines changed: 1 addition & 0 deletions
@@ -8,10 +8,13 @@ assignees: ''
 ---
 
 **Link to the notebook**
-Add the link to the notebook
+Add the link to the notebook.
 
 **Describe the bug**
 A clear and concise description of what the bug is.
+Attach error logs if available.
+For security, make sure you remove or hide your
+12-digit AWS account ID when attaching the logs.
 
 **To Reproduce**
-Steps to reproduce
+Steps to reproduce.
@@ -207,7 +207,7 @@ These examples show you how to use model-packages and algorithms from AWS Market
 	- [Using models for identifying non-compliance at a workplace](aws_marketplace/using_model_packages/improving_industrial_workplace_safety) provides a detailed walkthrough on how to use pre-trained models from AWS Marketplace for extracting metadata for a sample use-case of generating summary reports for identifying non-compliance at a construction/industrial workplace.
 	- [Creative writing using GPT-2 Text Generation](aws_marketplace/using_model_packages/creative-writing-using-gpt-2-text-generation) will show you how to use AWS Marketplace GPT-2-XL pre-trained model on Amazon SageMaker to generate text based on your prompt to help you author prose and poetry.
 	- [Amazon Augmented AI with AWS Marketplace ML models](aws_marketplace/using_model_packages/amazon_augmented_ai_with_aws_marketplace_ml_models) will show you how to use AWS Marketplace pre-trained ML models with Amazon Augmented AI to implement human-in-loop workflow reviews with your ML model predictions.
-
+	- [Monitoring data quality in third-party models from AWS Marketplace](aws_marketplace/using_model_packages/data_quality_monitoring) will show you how to perform data quality monitoring on a pre-trained third-party model from AWS Marketplace.
 
 ### Under Development
 
 
@@ -35,6 +35,7 @@ These examples show you how to use model-packages and algorithms from AWS Market
 	- [Using models for identifying non-compliance at a workplace](using_model_packages/improving_industrial_workplace_safety) provides a detailed walkthrough on how to use pre-trained models from AWS Marketplace for extracting metadata for a sample use-case of generating summary reports for identifying non-compliance at a construction/industrial workplace.
 	- [Creative writing using GPT-2 Text Generation](using_model_packages/creative-writing-using-gpt-2-text-generation) will show you how to use AWS Marketplace GPT-2-XL pre-trained model on Amazon SageMaker to generate text based on your prompt to help you author prose and poetry.
 	- [Amazon Augmented AI with AWS Marketplace ML models](using_model_packages/amazon_augmented_ai_with_aws_marketplace_ml_models) will show you how to use AWS Marketplace pre-trained ML models with Amazon Augmented AI to implement human-in-loop workflow reviews with your ML model predictions.
+	- [Monitoring data quality in third-party models from AWS Marketplace](using_model_packages/data_quality_monitoring) will show you how to perform data quality monitoring on a pre-trained third-party model from AWS Marketplace.
 
 ## FAQ
 
 
@@ -0,0 +1,23 @@
+class ModelPackageArnProvider:
+    """Look up the regional ARN of the ``planning-to-buy-house-basic`` model package."""
+
+    # Built once at class-definition time instead of on every call.
+    # Keys are AWS region names; values are the model-package ARN to use there.
+    _ARN_BY_REGION = {
+        "us-east-1": "arn:aws:sagemaker:us-east-1:865070037744:model-package/planning-to-buy-house-basic-28fcb3ca751705854a7171b255d8ef43",
+        "us-east-2": "arn:aws:sagemaker:us-east-2:057799348421:model-package/planning-to-buy-house-basic-28fcb3ca751705854a7171b255d8ef43",
+        "us-west-1": "arn:aws:sagemaker:us-west-1:382657785993:model-package/planning-to-buy-house-basic-28fcb3ca751705854a7171b255d8ef43",
+        "us-west-2": "arn:aws:sagemaker:us-west-2:594846645681:model-package/planning-to-buy-house-basic-28fcb3ca751705854a7171b255d8ef43",
+        "ca-central-1": "arn:aws:sagemaker:ca-central-1:470592106596:model-package/planning-to-buy-house-basic-28fcb3ca751705854a7171b255d8ef43",
+        "eu-central-1": "arn:aws:sagemaker:eu-central-1:446921602837:model-package/planning-to-buy-house-basic-28fcb3ca751705854a7171b255d8ef43",
+        "eu-west-1": "arn:aws:sagemaker:eu-west-1:985815980388:model-package/planning-to-buy-house-basic-28fcb3ca751705854a7171b255d8ef43",
+        "eu-west-2": "arn:aws:sagemaker:eu-west-2:856760150666:model-package/planning-to-buy-house-basic-28fcb3ca751705854a7171b255d8ef43",
+        "eu-west-3": "arn:aws:sagemaker:eu-west-3:843114510376:model-package/planning-to-buy-house-basic-28fcb3ca751705854a7171b255d8ef43",
+        "eu-north-1": "arn:aws:sagemaker:eu-north-1:136758871317:model-package/planning-to-buy-house-basic-28fcb3ca751705854a7171b255d8ef43",
+        "ap-southeast-1": "arn:aws:sagemaker:ap-southeast-1:192199979996:model-package/planning-to-buy-house-basic-28fcb3ca751705854a7171b255d8ef43",
+        "ap-southeast-2": "arn:aws:sagemaker:ap-southeast-2:666831318237:model-package/planning-to-buy-house-basic-28fcb3ca751705854a7171b255d8ef43",
+        "ap-northeast-2": "arn:aws:sagemaker:ap-northeast-2:745090734665:model-package/planning-to-buy-house-basic-28fcb3ca751705854a7171b255d8ef43",
+        "ap-northeast-1": "arn:aws:sagemaker:ap-northeast-1:977537786026:model-package/planning-to-buy-house-basic-28fcb3ca751705854a7171b255d8ef43",
+        "ap-south-1": "arn:aws:sagemaker:ap-south-1:077584701553:model-package/planning-to-buy-house-basic-28fcb3ca751705854a7171b255d8ef43",
+        "sa-east-1": "arn:aws:sagemaker:sa-east-1:270155090741:model-package/planning-to-buy-house-basic-28fcb3ca751705854a7171b255d8ef43",
+    }
+
+    @staticmethod
+    def get_model_package_arn(current_region):
+        """Return the model-package ARN registered for ``current_region``.
+
+        Args:
+            current_region: AWS region name, e.g. ``"us-east-1"``.
+
+        Returns:
+            The ARN string mapped to that region.
+
+        Raises:
+            KeyError: If no ARN is listed for ``current_region``. The message
+                names the rejected region and lists the supported ones.
+        """
+        try:
+            return ModelPackageArnProvider._ARN_BY_REGION[current_region]
+        except KeyError:
+            supported = ", ".join(sorted(ModelPackageArnProvider._ARN_BY_REGION))
+            # Still a KeyError so existing callers keep working; `from None`
+            # hides the bare lookup failure that carried no guidance.
+            raise KeyError(
+                "No model package ARN for region {!r}; supported regions: {}".format(
+                    current_region, supported
+                )
+            ) from None
@@ -47,7 +47,7 @@
    "metadata": {},
    "outputs": [],
    "source": [
-    "# ensure sagemaker version >= 1.35.0\n",
+    "# ensure sagemaker version >= 2.0.0\n",
     "!pip show sagemaker"
    ]
   },
@@ -358,7 +358,7 @@
     "\n",
     "* __entry_point__: The path to the Python script SageMaker runs for training and prediction.\n",
     "* __role__: Role ARN\n",
-    "* __train_instance_type__ *(optional)*: The type of SageMaker instances for training. __Note__: Because Scikit-learn does not natively support GPU training, Sagemaker Scikit-learn does not currently support training on GPU instance types.\n",
+    "* __instance_type__ *(optional)*: The type of SageMaker instances for training. __Note__: Because Scikit-learn does not natively support GPU training, Sagemaker Scikit-learn does not currently support training on GPU instance types.\n",
     "* __sagemaker_session__ *(optional)*: The session used to train on Sagemaker.\n",
     "* __hyperparameters__ *(optional)*: A dictionary passed to the train function as hyperparameters."
    ]
@@ -391,7 +391,7 @@
    "outputs": [],
    "source": [
     "# Open Source distributed script mode\n",
-    "from sagemaker.session import s3_input, Session\n",
+    "from sagemaker.session import TrainingInput, Session\n",
     "from sagemaker.xgboost.estimator import XGBoost\n",
     "\n",
     "boto_session = boto3.Session(region_name=region)\n",
@@ -403,12 +403,12 @@
     "    framework_version='0.90-1', # Note: framework_version is mandatory\n",
     "    hyperparameters=hyperparams,\n",
     "    role=role,\n",
-    "    train_instance_count=2, \n",
-    "    train_instance_type=instance_type,\n",
+    "    instance_count=2, \n",
+    "    instance_type=instance_type,\n",
     "    output_path=output_path)\n",
     "\n",
-    "train_input = s3_input(\"s3://{}/{}/{}/\".format(bucket, prefix, 'train'), content_type=content_type)\n",
-    "validation_input = s3_input(\"s3://{}/{}/{}/\".format(bucket, prefix, 'validation'), content_type=content_type)"
+    "train_input = TrainingInput(\"s3://{}/{}/{}/\".format(bucket, prefix, 'train'), content_type=content_type)\n",
+    "validation_input = TrainingInput(\"s3://{}/{}/{}/\".format(bucket, prefix, 'validation'), content_type=content_type)"
    ]
   },
   {
@@ -449,9 +449,11 @@
    "metadata": {},
    "outputs": [],
    "source": [
+    "from sagemaker.serializers import CSVSerializer\n",
+    "\n",
     "predictor = xgb_script_mode_estimator.deploy(initial_instance_count=1, \n",
-    "                                             instance_type=\"ml.m5.2xlarge\")\n",
-    "predictor.serializer = str"
+    "                                             instance_type=\"ml.m5.2xlarge\",\n",
+    "                                             serializer=CSVSerializer())"
    ]
   },
   {
@@ -496,6 +498,13 @@
    "source": [
     "xgb_script_mode_estimator.delete_endpoint()"
    ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": []
   }
  ],
  "metadata": {
@@ -504,7 +513,7 @@
   "kernelspec": {
    "display_name": "Python 3 (Data Science)",
    "language": "python",
-   "name": "python3__SAGEMAKER_INTERNAL__arn:aws:sagemaker:us-west-2:236514542706:image/datascience-1.0"
+   "name": "python3__SAGEMAKER_INTERNAL__arn:aws:sagemaker:us-east-1:081325390199:image/datascience-1.0"
   },
   "language_info": {
    "codemirror_mode": {
 
@@ -91,8 +91,8 @@
    "metadata": {},
    "outputs": [],
    "source": [
-    "from sagemaker.amazon.amazon_estimator import get_image_uri\n",
-    "container = get_image_uri(region, 'xgboost', '0.90-1')"
+    "from sagemaker.image_uris import retrieve\n",
+    "container = retrieve('xgboost', boto3.Session().region_name, '0.90-1')"
    ]
   },
   {
@@ -108,7 +108,7 @@
     "* __entry_point__: The path to the Python script SageMaker runs for training and prediction.\n",
     "* __role__: Role ARN\n",
     "* __hyperparameters__: A dictionary passed to the train function as hyperparameters.\n",
-    "* __train_instance_type__ *(optional)*: The type of SageMaker instances for training. __Note__: This particular mode does not currently support training on GPU instance types.\n",
+    "* __instance_type__ *(optional)*: The type of SageMaker instances for training. __Note__: This particular mode does not currently support training on GPU instance types.\n",
     "* __sagemaker_session__ *(optional)*: The session used to train on Sagemaker."
    ]
   },
@@ -141,15 +141,15 @@
     "\n",
     "To enable checkpointing for Managed Spot Training using SageMaker XGBoost we need to configure three things: \n",
     "\n",
-    "1. Enable the `train_use_spot_instances` constructor arg - a simple self-explanatory boolean. \n",
+    "1. Enable the `use_spot_instances` constructor arg - a simple self-explanatory boolean. \n",
     "\n",
-    "2. Set the `train_max_wait constructor` arg - this is an int arg representing the amount of time you are willing to wait for Spot infrastructure to become available. Some instance types are harder to get at Spot prices and you may have to wait longer. You are not charged for time spent waiting for Spot infrastructure to become available, you're only charged for actual compute time spent once Spot instances have been successfully procured. \n",
+    "2. Set the `max_wait` constructor arg - this is an int arg representing the amount of time you are willing to wait for Spot infrastructure to become available. Some instance types are harder to get at Spot prices and you may have to wait longer. You are not charged for time spent waiting for Spot infrastructure to become available, you're only charged for actual compute time spent once Spot instances have been successfully procured. \n",
     "\n",
     "3. Setup a `checkpoint_s3_uri` constructor arg - this arg will tell SageMaker an S3 location where to save checkpoints. While not strictly necessary, checkpointing is highly recommended for Manage Spot Training jobs due to the fact that Spot instances can be interrupted with short notice and using checkpoints to resume from the last interruption ensures you don't lose any progress made before the interruption.\n",
     "\n",
-    "Feel free to toggle the `train_use_spot_instances` variable to see the effect of running the same job using regular (a.k.a. \"On Demand\") infrastructure.\n",
+    "Feel free to toggle the `use_spot_instances` variable to see the effect of running the same job using regular (a.k.a. \"On Demand\") infrastructure.\n",
     "\n",
-    "Note that `train_max_wait` can be set if and only if `train_use_spot_instances` is enabled and must be greater than or equal to `train_max_run`."
+    "Note that `max_wait` can be set if and only if `use_spot_instances` is enabled and must be greater than or equal to `max_run`."
    ]
   },
   {
@@ -163,27 +163,27 @@
     "job_name = 'DEMO-xgboost-spot-' + time.strftime(\"%Y-%m-%d-%H-%M-%S\", time.gmtime())\n",
     "print(\"Training job\", job_name)\n",
     "\n",
-    "train_use_spot_instances = True\n",
-    "train_max_run = 3600\n",
-    "train_max_wait = 7200 if train_use_spot_instances else None\n",
-    "checkpoint_s3_uri = ('s3://{}/{}/checkpoints/{}'.format(bucket, prefix, job_name) if train_use_spot_instances \n",
+    "use_spot_instances = True\n",
+    "max_run = 3600\n",
+    "max_wait = 7200 if use_spot_instances else None\n",
+    "checkpoint_s3_uri = ('s3://{}/{}/checkpoints/{}'.format(bucket, prefix, job_name) if use_spot_instances \n",
     "                      else None)\n",
     "print(\"Checkpoint path:\", checkpoint_s3_uri)\n",
     "\n",
     "estimator = sagemaker.estimator.Estimator(container, \n",
     "                                          role, \n",
     "                                          hyperparameters=hyperparameters,\n",
-    "                                          train_instance_count=1, \n",
-    "                                          train_instance_type=instance_type, \n",
-    "                                          train_volume_size=5,         # 5 GB \n",
+    "                                          instance_count=1, \n",
+    "                                          instance_type=instance_type, \n",
+    "                                          volume_size=5,         # 5 GB \n",
     "                                          output_path=output_path, \n",
     "                                          sagemaker_session=sagemaker.Session(),\n",
-    "                                          train_use_spot_instances=train_use_spot_instances, \n",
-    "                                          train_max_run=train_max_run, \n",
-    "                                          train_max_wait=train_max_wait,\n",
+    "                                          use_spot_instances=use_spot_instances, \n",
+    "                                          max_run=max_run, \n",
+    "                                          max_wait=max_wait,\n",
     "                                          checkpoint_s3_uri=checkpoint_s3_uri\n",
     "                                         );\n",
-    "train_input = sagemaker.s3_input(s3_data='s3://{}/{}/{}'.format(bucket, prefix, 'train'), content_type='libsvm')\n",
+    "train_input = sagemaker.TrainingInput(s3_data='s3://{}/{}/{}'.format(bucket, prefix, 'train'), content_type='libsvm')\n",
     "estimator.fit({'train': train_input}, job_name=job_name)"
    ]
   },
@@ -197,7 +197,7 @@
     "- `Training seconds: X` : This is the actual compute-time your training job spent\n",
     "- `Billable seconds: Y` : This is the time you will be billed for after Spot discounting is applied.\n",
     "\n",
-    "If you enabled the `train_use_spot_instances`, then you should see a notable difference between `X` and `Y` signifying the cost savings you will get for having chosen Managed Spot Training. This should be reflected in an additional line:\n",
+    "If you enabled `use_spot_instances`, you should see a notable difference between `X` and `Y`, signifying the cost savings you get from choosing Managed Spot Training. This should be reflected in an additional line:\n",
     "- `Managed Spot Training savings: (1-Y/X)*100 %`"
    ]
   },
@@ -261,22 +261,22 @@
     "\n",
     "job_name = 'DEMO-xgboost-regression-' + time.strftime(\"%Y-%m-%d-%H-%M-%S\", time.gmtime())\n",
     "print(\"Training job\", job_name)\n",
-    "checkpoint_s3_uri = ('s3://{}/{}/checkpoints/{}'.format(bucket, prefix, job_name) if train_use_spot_instances \n",
+    "checkpoint_s3_uri = ('s3://{}/{}/checkpoints/{}'.format(bucket, prefix, job_name) if use_spot_instances \n",
     "                      else None)\n",
     "print(\"Checkpoint path:\", checkpoint_s3_uri)\n",
     "\n",
     "xgb_script_mode_estimator = XGBoost(\n",
     "    entry_point=\"abalone.py\",\n",
     "    hyperparameters=hyperparameters,\n",
-    "    image_name=container,\n",
+    "    image_uri=container,\n",
     "    role=role, \n",
-    "    train_instance_count=1,\n",
-    "    train_instance_type=instance_type,\n",
+    "    instance_count=1,\n",
+    "    instance_type=instance_type,\n",
     "    framework_version=\"0.90-1\",\n",
     "    output_path=\"s3://{}/{}/{}/output\".format(bucket, prefix, \"xgboost-script-mode\"),\n",
-    "    train_use_spot_instances=train_use_spot_instances,\n",
-    "    train_max_run=train_max_run,\n",
-    "    train_max_wait=train_max_wait,\n",
+    "    use_spot_instances=use_spot_instances,\n",
+    "    max_run=max_run,\n",
+    "    max_wait=max_wait,\n",
     "    checkpoint_s3_uri=checkpoint_s3_uri\n",
     ")"
    ]
@@ -296,6 +296,13 @@
    "source": [
     "xgb_script_mode_estimator.fit({'train': train_input, 'validation': train_input}, job_name=job_name)"
    ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": []
   }
  ],
  "metadata": {
@@ -304,7 +311,7 @@
   "kernelspec": {
    "display_name": "Python 3 (Data Science)",
    "language": "python",
-   "name": "python3__SAGEMAKER_INTERNAL__arn:aws:sagemaker:us-west-2:236514542706:image/datascience-1.0"
+   "name": "python3__SAGEMAKER_INTERNAL__arn:aws:sagemaker:us-east-1:081325390199:image/datascience-1.0"
   },
   "language_info": {
    "codemirror_mode": {
@@ -321,4 +328,4 @@
  },
  "nbformat": 4,
  "nbformat_minor": 4
-}
+}
@@ -0,0 +1 @@
+../../../config.json