Add Model and Estimator unit tests for custom volume size and timeout deploy parameters

chiui0x18 · chiui0x18 · commit a9f61e32cbce · 2022-10-25T09:16:06.000-07:00
diff --git a/tests/unit/sagemaker/model/test_deploy.py b/tests/unit/sagemaker/model/test_deploy.py
@@ -483,3 +483,81 @@ def test_deploy_predictor_cls(production_variant, sagemaker_session):
     assert predictor_async.name == model.name
     assert predictor_async.endpoint_name == endpoint_name_async
     assert predictor_async.sagemaker_session == sagemaker_session
+
+
+@patch("sagemaker.production_variant")
+@patch("sagemaker.model.Model.prepare_container_def")
+@patch("sagemaker.utils.name_from_base", return_value=MODEL_NAME)
+def test_deploy_customized_volume_size_and_timeout(
+    name_from_base, prepare_container_def, production_variant, sagemaker_session
+):
+    """Deploy a Model with a custom volume size and custom timeouts.
+
+    Checks that ``volume_size``, ``model_data_download_timeout`` and
+    ``container_startup_health_check_timeout`` given to ``Model.deploy`` are
+    passed on to the patched ``sagemaker.production_variant``, and that the
+    variant it returns is what ``endpoint_from_production_variants`` receives.
+    """
+    # Mock arguments arrive bottom-up relative to the @patch decorators.
+    disk_gb = 256
+    download_timeout_sec = 1800
+    health_check_timeout_sec = 1800
+
+    expected_container = {"Image": MODEL_IMAGE, "Environment": {}, "ModelDataUrl": MODEL_DATA}
+    prepare_container_def.return_value = expected_container
+
+    # Value the patched sagemaker.production_variant returns during deploy().
+    expected_variant = copy.deepcopy(BASE_PRODUCTION_VARIANT)
+    expected_variant.update(
+        {
+            "VolumeSizeInGB": disk_gb,
+            "ModelDataDownloadTimeoutInSeconds": download_timeout_sec,
+            "ContainerStartupHealthCheckTimeoutInSeconds": health_check_timeout_sec,
+        }
+    )
+    production_variant.return_value = expected_variant
+
+    model = Model(MODEL_IMAGE, MODEL_DATA, role=ROLE, sagemaker_session=sagemaker_session)
+    model.deploy(
+        instance_type=INSTANCE_TYPE,
+        initial_instance_count=INSTANCE_COUNT,
+        volume_size=disk_gb,
+        model_data_download_timeout=download_timeout_sec,
+        container_startup_health_check_timeout=health_check_timeout_sec,
+    )
+
+    name_from_base.assert_called_with(MODEL_IMAGE)
+    assert name_from_base.call_count == 2
+
+    prepare_container_def.assert_called_with(
+        INSTANCE_TYPE, accelerator_type=None, serverless_inference_config=None
+    )
+    production_variant.assert_called_with(
+        MODEL_NAME,
+        INSTANCE_TYPE,
+        INSTANCE_COUNT,
+        accelerator_type=None,
+        serverless_inference_config=None,
+        volume_size=disk_gb,
+        model_data_download_timeout=download_timeout_sec,
+        container_startup_health_check_timeout=health_check_timeout_sec,
+    )
+
+    sagemaker_session.create_model.assert_called_with(
+        name=MODEL_NAME,
+        role=ROLE,
+        container_defs=expected_container,
+        vpc_config=None,
+        enable_network_isolation=False,
+        tags=None,
+    )
+
+    sagemaker_session.endpoint_from_production_variants.assert_called_with(
+        name=MODEL_NAME,
+        production_variants=[expected_variant],
+        tags=None,
+        kms_key=None,
+        wait=True,
+        data_capture_config_dict=None,
+        async_inference_config_dict=None,
+    )
diff --git a/tests/unit/test_estimator.py b/tests/unit/test_estimator.py
@@ -3312,6 +3312,62 @@ def test_deploy_with_no_model_name(sagemaker_session):
     assert kwargs["name"].startswith(IMAGE_URI)
 
 
+@patch("sagemaker.estimator.Estimator.create_model")
+def test_deploy_with_customized_volume_size_timeout(create_model, sagemaker_session):
+    """Deploy from an Estimator with a custom volume size and custom timeouts.
+
+    ``Estimator.create_model`` is patched to return a mock model so the test can
+    check that ``volume_size``, ``model_data_download_timeout`` and
+    ``container_startup_health_check_timeout`` reach ``model.deploy`` unchanged.
+    """
+    estimator = Estimator(
+        IMAGE_URI,
+        ROLE,
+        INSTANCE_COUNT,
+        INSTANCE_TYPE,
+        output_path=OUTPUT_PATH,
+        sagemaker_session=sagemaker_session,
+    )
+    estimator.set_hyperparameters(**HYPERPARAMS)
+    estimator.fit({"train": "s3://bucket/training-prefix"})
+
+    endpoint = "endpoint-name"
+    disk_gb = 256
+    download_timeout_sec = 600
+    health_check_timeout_sec = 600
+
+    mock_model = MagicMock()
+    create_model.return_value = mock_model
+
+    estimator.deploy(
+        INSTANCE_COUNT,
+        INSTANCE_TYPE,
+        endpoint_name=endpoint,
+        volume_size=disk_gb,
+        model_data_download_timeout=download_timeout_sec,
+        container_startup_health_check_timeout=health_check_timeout_sec,
+    )
+
+    # Arguments the test did not pass are asserted as None, and wait as True.
+    mock_model.deploy.assert_called_with(
+        instance_type=INSTANCE_TYPE,
+        initial_instance_count=INSTANCE_COUNT,
+        serializer=None,
+        deserializer=None,
+        accelerator_type=None,
+        endpoint_name=endpoint,
+        tags=None,
+        wait=True,
+        kms_key=None,
+        data_capture_config=None,
+        async_inference_config=None,
+        serverless_inference_config=None,
+        volume_size=disk_gb,
+        model_data_download_timeout=download_timeout_sec,
+        container_startup_health_check_timeout=health_check_timeout_sec,
+    )
+
+
 def test_register_default_image(sagemaker_session):
     estimator = Estimator(
         IMAGE_URI,