feature: allow custom model name during deploy

imujjwal96 · imujjwal96 · commit 44336fc55dc7 · 2019-06-14T08:44:56.000Z
diff --git a/src/sagemaker/estimator.py b/src/sagemaker/estimator.py
@@ -331,7 +331,7 @@ def attach(cls, training_job_name, sagemaker_session=None, model_channel_name='m
         return estimator
 
     def deploy(self, initial_instance_count, instance_type, accelerator_type=None, endpoint_name=None,
-               use_compiled_model=False, update_endpoint=False, wait=True, **kwargs):
+               use_compiled_model=False, update_endpoint=False, wait=True, model_name=None, **kwargs):
         """Deploy the trained model to an Amazon SageMaker endpoint and return a ``sagemaker.RealTimePredictor`` object.
 
         More information:
@@ -351,11 +351,13 @@ def deploy(self, initial_instance_count, instance_type, accelerator_type=None, e
             update_endpoint (bool): Flag to update the model in an existing Amazon SageMaker endpoint.
                 If True, this will deploy a new EndpointConfig to an already existing endpoint and delete resources
                 corresponding to the previous EndpointConfig. Default: False
+            wait (bool): Whether the call should wait until the deployment of the model completes (default: True).
+            model_name (str): Name to use for creating an Amazon SageMaker model. If not specified, the name of the
+                latest training job is used (default: None).
             tags(List[dict[str, str]]): Optional. The list of tags to attach to this specific endpoint. Example:
                     >>> tags = [{'Key': 'tagname', 'Value': 'tagvalue'}]
                     For more information about tags, see https://boto3.amazonaws.com/v1/documentation\
                     /api/latest/reference/services/sagemaker.html#SageMaker.Client.add_tags
-            wait (bool): Whether the call should wait until the deployment of model completes (default: True).
 
             **kwargs: Passed to invocation of ``create_model()``. Implementations may customize
                 ``create_model()`` to accept ``**kwargs`` to customize model creation during deploy.
@@ -367,6 +369,7 @@ def deploy(self, initial_instance_count, instance_type, accelerator_type=None, e
         """
         self._ensure_latest_training_job()
         endpoint_name = endpoint_name or self.latest_training_job.name
+        model_name = model_name or self.latest_training_job.name
         self.deploy_instance_type = instance_type
         if use_compiled_model:
             family = '_'.join(instance_type.split('.')[:-1])
@@ -376,6 +379,7 @@ def deploy(self, initial_instance_count, instance_type, accelerator_type=None, e
             model = self._compiled_models[family]
         else:
             model = self.create_model(**kwargs)
+        model.name = model_name
         return model.deploy(
             instance_type=instance_type,
             initial_instance_count=initial_instance_count,
diff --git a/src/sagemaker/tuner.py b/src/sagemaker/tuner.py
@@ -327,7 +327,7 @@ def attach(cls, tuning_job_name, sagemaker_session=None, job_details=None, estim
         return tuner
 
     def deploy(self, initial_instance_count, instance_type, accelerator_type=None, endpoint_name=None, wait=True,
-               **kwargs):
+               model_name=None, **kwargs):
         """Deploy the best trained or user specified model to an Amazon SageMaker endpoint and return a
         ``sagemaker.RealTimePredictor`` object.
 
@@ -344,6 +344,8 @@ def deploy(self, initial_instance_count, instance_type, accelerator_type=None, e
             endpoint_name (str): Name to use for creating an Amazon SageMaker endpoint. If not specified,
                 the name of the training job is used.
             wait (bool): Whether the call should wait until the deployment of model completes (default: True).
+            model_name (str): Name to use for creating an Amazon SageMaker model. If not specified, the name of
+                the training job is used.
             **kwargs: Other arguments needed for deployment. Please refer to the ``create_model()`` method of
                 the associated estimator to see what other arguments are needed.
 
@@ -356,7 +358,7 @@ def deploy(self, initial_instance_count, instance_type, accelerator_type=None, e
                                                sagemaker_session=self.estimator.sagemaker_session)
         return best_estimator.deploy(initial_instance_count, instance_type,
                                      accelerator_type=accelerator_type,
-                                     endpoint_name=endpoint_name, wait=wait, **kwargs)
+                                     endpoint_name=endpoint_name, wait=wait, model_name=model_name, **kwargs)
 
     def stop_tuning_job(self):
         """Stop latest running hyperparameter tuning job.
diff --git a/tests/integ/test_tf_script_mode.py b/tests/integ/test_tf_script_mode.py
@@ -136,19 +136,21 @@ def test_mnist_async(sagemaker_session):
     training_job_name = estimator.latest_training_job.name
     time.sleep(20)
     endpoint_name = training_job_name
+    model_name = 'model-name-1'
     _assert_training_job_tags_match(sagemaker_session.sagemaker_client,
                                     estimator.latest_training_job.name, TAGS)
     with tests.integ.timeout.timeout_and_delete_endpoint_by_name(endpoint_name, sagemaker_session):
         estimator = TensorFlow.attach(training_job_name=training_job_name,
                                       sagemaker_session=sagemaker_session)
         predictor = estimator.deploy(initial_instance_count=1, instance_type='ml.c4.xlarge',
-                                     endpoint_name=endpoint_name)
+                                     endpoint_name=endpoint_name, model_name=model_name)
 
         result = predictor.predict(np.zeros(784))
         print('predict result: {}'.format(result))
         _assert_endpoint_tags_match(sagemaker_session.sagemaker_client, predictor.endpoint, TAGS)
         _assert_model_tags_match(sagemaker_session.sagemaker_client,
                                  estimator.latest_training_job.name, TAGS)
+        _assert_model_name_match(sagemaker_session.sagemaker_client, endpoint_name, model_name)
 
 
 def test_deploy_with_input_handlers(sagemaker_session, instance_type):
@@ -208,3 +210,8 @@ def _assert_training_job_tags_match(sagemaker_client, training_job_name, tags):
     training_job_description = sagemaker_client.describe_training_job(
         TrainingJobName=training_job_name)
     _assert_tags_match(sagemaker_client, training_job_description['TrainingJobArn'], tags)
+
+
+def _assert_model_name_match(sagemaker_client, endpoint_config_name, model_name):
+    endpoint_config_description = sagemaker_client.describe_endpoint_config(EndpointConfigName=endpoint_config_name)
+    assert model_name == endpoint_config_description['ProductionVariants'][0]['ModelName']
diff --git a/tests/integ/test_tuner.py b/tests/integ/test_tuner.py
@@ -660,13 +660,15 @@ def test_attach_tuning_pytorch(sagemaker_session):
         time.sleep(15)
         tuner.wait()
 
+    endpoint_name = tuning_job_name
+    model_name = 'model-name-1'
     attached_tuner = HyperparameterTuner.attach(tuning_job_name,
                                                 sagemaker_session=sagemaker_session)
     assert attached_tuner.early_stopping_type == 'Auto'
 
     best_training_job = tuner.best_training_job()
-    with timeout_and_delete_endpoint_by_name(best_training_job, sagemaker_session):
-        predictor = attached_tuner.deploy(1, 'ml.c4.xlarge')
+    with timeout_and_delete_endpoint_by_name(endpoint_name, sagemaker_session):
+        predictor = attached_tuner.deploy(1, 'ml.c4.xlarge', endpoint_name=endpoint_name, model_name=model_name)
         data = np.zeros(shape=(1, 1, 28, 28), dtype=np.float32)
         predictor.predict(data)
 
@@ -675,6 +677,7 @@ def test_attach_tuning_pytorch(sagemaker_session):
         output = predictor.predict(data)
 
         assert output.shape == (batch_size, 10)
+        _assert_model_name_match(sagemaker_session.sagemaker_client, endpoint_name, model_name)
 
 
 @pytest.mark.canary_quick
@@ -749,3 +752,8 @@ def _fm_serializer(data):
     for row in data:
         js['instances'].append({'features': row.tolist()})
     return json.dumps(js)
+
+
+def _assert_model_name_match(sagemaker_client, endpoint_config_name, model_name):
+    endpoint_config_description = sagemaker_client.describe_endpoint_config(EndpointConfigName=endpoint_config_name)
+    assert model_name == endpoint_config_description['ProductionVariants'][0]['ModelName']
diff --git a/tests/unit/test_estimator.py b/tests/unit/test_estimator.py
@@ -1140,6 +1140,31 @@ def test_deploy_with_update_endpoint(sagemaker_session):
     sagemaker_session.create_endpoint.assert_not_called()
 
 
+def test_deploy_with_model_name(sagemaker_session):
+    estimator = Estimator(IMAGE_NAME, ROLE, INSTANCE_COUNT, INSTANCE_TYPE, output_path=OUTPUT_PATH,
+                          sagemaker_session=sagemaker_session)
+    estimator.set_hyperparameters(**HYPERPARAMS)
+    estimator.fit({'train': 's3://bucket/training-prefix'})
+    model_name = 'model-name'
+    estimator.deploy(INSTANCE_COUNT, INSTANCE_TYPE, model_name=model_name)
+
+    sagemaker_session.create_model.assert_called_once()
+    args, kwargs = sagemaker_session.create_model.call_args
+    assert args[0] == model_name
+
+
+def test_deploy_with_no_model_name(sagemaker_session):
+    estimator = Estimator(IMAGE_NAME, ROLE, INSTANCE_COUNT, INSTANCE_TYPE, output_path=OUTPUT_PATH,
+                          sagemaker_session=sagemaker_session)
+    estimator.set_hyperparameters(**HYPERPARAMS)
+    estimator.fit({'train': 's3://bucket/training-prefix'})
+    estimator.deploy(INSTANCE_COUNT, INSTANCE_TYPE)
+
+    sagemaker_session.create_model.assert_called_once()
+    args, kwargs = sagemaker_session.create_model.call_args
+    assert args[0].startswith(IMAGE_NAME)
+
+
 @patch('sagemaker.estimator.LocalSession')
 @patch('sagemaker.estimator.Session')
 def test_local_mode(session_class, local_session_class):
diff --git a/tests/unit/test_tuner.py b/tests/unit/test_tuner.py
@@ -566,7 +566,8 @@ def test_deploy_default(tuner):
 
     tuner.estimator.sagemaker_session.create_model.assert_called_once()
     args = tuner.estimator.sagemaker_session.create_model.call_args[0]
-    assert args[0].startswith(IMAGE_NAME)
+
+    assert args[0] == 'neo'
     assert args[1] == ROLE
     assert args[2]['Image'] == IMAGE_NAME
     assert args[2]['ModelDataUrl'] == MODEL_DATA