@@ -124,8 +124,8 @@ class ModelBuilder(Triton, DJL, JumpStart, TGI, Transformers):
124
124
into a stream. All translations between the server and the client are handled
125
125
automatically with the specified input and output.
126
126
model (Optional[Union[object, str]]): Model object (with ``predict`` method to perform
127
- inference) or a HuggingFace/JumpStart Model ID. Either ``model`` or
128
- ``inference_spec`` is required for the model builder to build the artifact.
127
+ inference) or a HuggingFace/JumpStart Model ID. Either ``model`` or ``inference_spec``
128
+ is required for the model builder to build the artifact.
129
129
inference_spec (InferenceSpec): The inference spec file with your customized
130
130
``invoke`` and ``load`` functions.
131
131
image_uri (Optional[str]): The container image uri (which is derived from a
@@ -145,6 +145,8 @@ class ModelBuilder(Triton, DJL, JumpStart, TGI, Transformers):
145
145
to the model server). Possible values for this argument are
146
146
``TORCHSERVE``, ``MMS``, ``TENSORFLOW_SERVING``, ``DJL_SERVING``,
147
147
``TRITON``, and ``TGI``.
148
+ model_metadata (Optional[Dict[str, Any]]): Dictionary used to override the HuggingFace
149
+ model metadata. Currently ``HF_TASK`` is overridable.
148
150
"""
149
151
150
152
model_path : Optional [str ] = field (
@@ -241,6 +243,10 @@ class ModelBuilder(Triton, DJL, JumpStart, TGI, Transformers):
241
243
model_server : Optional [ModelServer ] = field (
242
244
default = None , metadata = {"help" : "Define the model server to deploy to." }
243
245
)
246
+ model_metadata : Optional [Dict [str , Any ]] = field (
247
+ default = None ,
248
+ metadata = {"help" : "Define the model metadata to override, currently supports `HF_TASK`" },
249
+ )
244
250
245
251
def _build_validations (self ):
246
252
"""Placeholder docstring"""
@@ -616,6 +622,9 @@ def build( # pylint: disable=R0911
616
622
self ._is_custom_image_uri = self .image_uri is not None
617
623
618
624
if isinstance (self .model , str ):
625
+ model_task = None
626
+ if self .model_metadata :
627
+ model_task = self .model_metadata .get ("HF_TASK" )
619
628
if self ._is_jumpstart_model_id ():
620
629
return self ._build_for_jumpstart ()
621
630
if self ._is_djl (): # pylint: disable=R1705
@@ -625,10 +634,10 @@ def build( # pylint: disable=R0911
625
634
self .model , self .env_vars .get ("HUGGING_FACE_HUB_TOKEN" )
626
635
)
627
636
628
- model_task = hf_model_md .get ("pipeline_tag" )
629
- if self .schema_builder is None and model_task :
637
+ if model_task is None :
638
+ model_task = hf_model_md .get ("pipeline_tag" )
639
+ if self .schema_builder is None and model_task is not None :
630
640
self ._schema_builder_init (model_task )
631
-
632
641
if model_task == "text-generation" : # pylint: disable=R1705
633
642
return self ._build_for_tgi ()
634
643
elif self ._can_fit_on_single_gpu ():
0 commit comments