|
11187 | 11187 | "InferenceRecommendations":{
|
11188 | 11188 | "shape":"InferenceRecommendations",
|
11189 | 11189 | "documentation":"<p>The recommendations made by Inference Recommender.</p>"
|
| 11190 | + }, |
| 11191 | + "EndpointPerformances":{ |
| 11192 | + "shape":"EndpointPerformances", |
| 11193 | + "documentation":"<p>The performance results from running an Inference Recommender job on an existing endpoint.</p>" |
11190 | 11194 | }
|
11191 | 11195 | }
|
11192 | 11196 | },
|
|
13893 | 13897 | "type":"list",
|
13894 | 13898 | "member":{"shape":"EndpointConfigSummary"}
|
13895 | 13899 | },
|
| 13900 | + "EndpointInfo":{ |
| 13901 | + "type":"structure", |
| 13902 | + "required":["EndpointName"], |
| 13903 | + "members":{ |
| 13904 | + "EndpointName":{ |
| 13905 | + "shape":"EndpointName", |
| 13906 | + "documentation":"<p>The name of a customer's endpoint.</p>" |
| 13907 | + } |
| 13908 | + }, |
| 13909 | + "documentation":"<p>Details about a customer endpoint that was compared in an Inference Recommender job.</p>" |
| 13910 | + }, |
13896 | 13911 | "EndpointInput":{
|
13897 | 13912 | "type":"structure",
|
13898 | 13913 | "required":[
|
|
14006 | 14021 | },
|
14007 | 14022 | "documentation":"<p>The endpoint configuration made by Inference Recommender during a recommendation job.</p>"
|
14008 | 14023 | },
|
| 14024 | + "EndpointPerformance":{ |
| 14025 | + "type":"structure", |
| 14026 | + "required":[ |
| 14027 | + "Metrics", |
| 14028 | + "EndpointInfo" |
| 14029 | + ], |
| 14030 | + "members":{ |
| 14031 | + "Metrics":{ |
| 14032 | + "shape":"InferenceMetrics", |
| 14033 | + "documentation":"<p>The metrics for an existing endpoint.</p>" |
| 14034 | + }, |
| 14035 | + "EndpointInfo":{"shape":"EndpointInfo"} |
| 14036 | + }, |
| 14037 | + "documentation":"<p>The performance results from running an Inference Recommender job on an existing endpoint.</p>" |
| 14038 | + }, |
| 14039 | + "EndpointPerformances":{ |
| 14040 | + "type":"list", |
| 14041 | + "member":{"shape":"EndpointPerformance"}, |
| 14042 | + "max":1 |
| 14043 | + }, |
14009 | 14044 | "EndpointSortKey":{
|
14010 | 14045 | "type":"string",
|
14011 | 14046 | "enum":[
|
|
14064 | 14099 | "type":"list",
|
14065 | 14100 | "member":{"shape":"EndpointSummary"}
|
14066 | 14101 | },
|
| 14102 | + "Endpoints":{ |
| 14103 | + "type":"list", |
| 14104 | + "member":{"shape":"EndpointInfo"}, |
| 14105 | + "max":1 |
| 14106 | + }, |
14067 | 14107 | "EntityDescription":{
|
14068 | 14108 | "type":"string",
|
14069 | 14109 | "max":1024,
|
|
16115 | 16155 | "type":"string",
|
16116 | 16156 | "max":256
|
16117 | 16157 | },
|
| 16158 | + "InferenceMetrics":{ |
| 16159 | + "type":"structure", |
| 16160 | + "required":[ |
| 16161 | + "MaxInvocations", |
| 16162 | + "ModelLatency" |
| 16163 | + ], |
| 16164 | + "members":{ |
| 16165 | + "MaxInvocations":{ |
| 16166 | + "shape":"Integer", |
| 16167 | + "documentation":"<p>The expected maximum number of requests per minute for the instance.</p>" |
| 16168 | + }, |
| 16169 | + "ModelLatency":{ |
| 16170 | + "shape":"Integer", |
| 16171 | + "documentation":"<p>The expected model latency at maximum invocations per minute for the instance.</p>" |
| 16172 | + } |
| 16173 | + }, |
| 16174 | + "documentation":"<p>The metrics for an existing endpoint compared in an Inference Recommender job.</p>" |
| 16175 | + }, |
16118 | 16176 | "InferenceRecommendation":{
|
16119 | 16177 | "type":"structure",
|
16120 | 16178 | "required":[
|
|
24623 | 24681 | "ContainerConfig":{
|
24624 | 24682 | "shape":"RecommendationJobContainerConfig",
|
24625 | 24683 | "documentation":"<p>Specifies mandatory fields for running an Inference Recommender job. The fields specified in <code>ContainerConfig</code> override the corresponding fields in the model package.</p>"
|
| 24684 | + }, |
| 24685 | + "Endpoints":{ |
| 24686 | + "shape":"Endpoints", |
| 24687 | + "documentation":"<p>Existing customer endpoints on which to run an Inference Recommender job.</p>" |
24626 | 24688 | }
|
24627 | 24689 | },
|
24628 | 24690 | "documentation":"<p>The input configuration of the recommendation job.</p>"
|
|
27345 | 27407 | },
|
27346 | 27408 | "InstanceCount":{
|
27347 | 27409 | "shape":"TransformInstanceCount",
|
27348 |
| - "documentation":"<p>The number of ML compute instances to use in the transform job. For distributed transform jobs, specify a value greater than 1. The default value is <code>1</code>.</p>" |
| 27410 | + "documentation":"<p>The number of ML compute instances to use in the transform job. The default value is <code>1</code>, and the maximum is <code>100</code>. For distributed transform jobs, specify a value greater than <code>1</code>.</p>" |
27349 | 27411 | },
|
27350 | 27412 | "VolumeKmsKeyId":{
|
27351 | 27413 | "shape":"KmsKeyId",
|
|
0 commit comments