From 7a6d1cec29f031785e62dbd42d37e5d8b0f38cae Mon Sep 17 00:00:00 2001 From: Ruilian Gao Date: Wed, 5 Feb 2025 00:05:25 +0000 Subject: [PATCH] Fix multiple IC support in modelBuilder --- src/sagemaker/serve/builder/model_builder.py | 2 +- tests/unit/sagemaker/serve/builder/test_model_builder.py | 1 + 2 files changed, 2 insertions(+), 1 deletion(-) diff --git a/src/sagemaker/serve/builder/model_builder.py b/src/sagemaker/serve/builder/model_builder.py index a7a518105c..2ea331ee4c 100644 --- a/src/sagemaker/serve/builder/model_builder.py +++ b/src/sagemaker/serve/builder/model_builder.py @@ -1621,7 +1621,6 @@ def deploy( """ if not hasattr(self, "built_model"): raise ValueError("Model Needs to be built before deploying") - endpoint_name = unique_name_from_base(endpoint_name) if not inference_config: # Real-time Deployment return self.built_model.deploy( instance_type=self.instance_type, @@ -1655,6 +1654,7 @@ def deploy( # Multi Model and MultiContainer endpoints with Inference Component return self.built_model.deploy( instance_type=self.instance_type, + endpoint_name=endpoint_name, mode=Mode.SAGEMAKER_ENDPOINT, endpoint_type=EndpointType.INFERENCE_COMPONENT_BASED, resources=inference_config, diff --git a/tests/unit/sagemaker/serve/builder/test_model_builder.py b/tests/unit/sagemaker/serve/builder/test_model_builder.py index 107d65c301..b7c38fad68 100644 --- a/tests/unit/sagemaker/serve/builder/test_model_builder.py +++ b/tests/unit/sagemaker/serve/builder/test_model_builder.py @@ -4080,6 +4080,7 @@ def test_neuron_configurations_rule_set(self): "instance_type": "ml.g5.2xlarge", "mode": Mode.SAGEMAKER_ENDPOINT, "endpoint_type": EndpointType.INFERENCE_COMPONENT_BASED, + "endpoint_name": "test", }, }, {