Skip to content

Commit 961af9b

Browse files
author
awstools
committed
feat(client-application-auto-scaling): Application Auto Scaling is now more responsive to changes in demand on your SageMaker Inference endpoints. To get started, create or update a Target Tracking policy based on high-resolution CloudWatch metrics.
1 parent 45cb022 commit 961af9b

File tree

4 files changed

+17
-2
lines changed

4 files changed

+17
-2
lines changed

clients/client-application-auto-scaling/src/commands/DescribeScalingPoliciesCommand.ts

+1-1
Original file line numberDiff line numberDiff line change
@@ -79,7 +79,7 @@ export interface DescribeScalingPoliciesCommandOutput extends DescribeScalingPol
7979
* // TargetTrackingScalingPolicyConfiguration: { // TargetTrackingScalingPolicyConfiguration
8080
* // TargetValue: Number("double"), // required
8181
* // PredefinedMetricSpecification: { // PredefinedMetricSpecification
82-
* // PredefinedMetricType: "DynamoDBReadCapacityUtilization" || "DynamoDBWriteCapacityUtilization" || "ALBRequestCountPerTarget" || "RDSReaderAverageCPUUtilization" || "RDSReaderAverageDatabaseConnections" || "EC2SpotFleetRequestAverageCPUUtilization" || "EC2SpotFleetRequestAverageNetworkIn" || "EC2SpotFleetRequestAverageNetworkOut" || "SageMakerVariantInvocationsPerInstance" || "ECSServiceAverageCPUUtilization" || "ECSServiceAverageMemoryUtilization" || "AppStreamAverageCapacityUtilization" || "ComprehendInferenceUtilization" || "LambdaProvisionedConcurrencyUtilization" || "CassandraReadCapacityUtilization" || "CassandraWriteCapacityUtilization" || "KafkaBrokerStorageUtilization" || "ElastiCachePrimaryEngineCPUUtilization" || "ElastiCacheReplicaEngineCPUUtilization" || "ElastiCacheDatabaseMemoryUsageCountedForEvictPercentage" || "NeptuneReaderAverageCPUUtilization" || "SageMakerVariantProvisionedConcurrencyUtilization" || "ElastiCacheDatabaseCapacityUsageCountedForEvictPercentage" || "SageMakerInferenceComponentInvocationsPerCopy" || "WorkSpacesAverageUserSessionsCapacityUtilization", // required
82+
* // PredefinedMetricType: "DynamoDBReadCapacityUtilization" || "DynamoDBWriteCapacityUtilization" || "ALBRequestCountPerTarget" || "RDSReaderAverageCPUUtilization" || "RDSReaderAverageDatabaseConnections" || "EC2SpotFleetRequestAverageCPUUtilization" || "EC2SpotFleetRequestAverageNetworkIn" || "EC2SpotFleetRequestAverageNetworkOut" || "SageMakerVariantInvocationsPerInstance" || "ECSServiceAverageCPUUtilization" || "ECSServiceAverageMemoryUtilization" || "AppStreamAverageCapacityUtilization" || "ComprehendInferenceUtilization" || "LambdaProvisionedConcurrencyUtilization" || "CassandraReadCapacityUtilization" || "CassandraWriteCapacityUtilization" || "KafkaBrokerStorageUtilization" || "ElastiCachePrimaryEngineCPUUtilization" || "ElastiCacheReplicaEngineCPUUtilization" || "ElastiCacheDatabaseMemoryUsageCountedForEvictPercentage" || "NeptuneReaderAverageCPUUtilization" || "SageMakerVariantProvisionedConcurrencyUtilization" || "ElastiCacheDatabaseCapacityUsageCountedForEvictPercentage" || "SageMakerInferenceComponentInvocationsPerCopy" || "WorkSpacesAverageUserSessionsCapacityUtilization" || "SageMakerInferenceComponentConcurrentRequestsPerCopyHighResolution" || "SageMakerVariantConcurrentRequestsPerModelHighResolution", // required
8383
* // ResourceLabel: "STRING_VALUE",
8484
* // },
8585
* // CustomizedMetricSpecification: { // CustomizedMetricSpecification

clients/client-application-auto-scaling/src/commands/PutScalingPolicyCommand.ts

+1-1
Original file line numberDiff line numberDiff line change
@@ -85,7 +85,7 @@ export interface PutScalingPolicyCommandOutput extends PutScalingPolicyResponse,
8585
* TargetTrackingScalingPolicyConfiguration: { // TargetTrackingScalingPolicyConfiguration
8686
* TargetValue: Number("double"), // required
8787
* PredefinedMetricSpecification: { // PredefinedMetricSpecification
88-
* PredefinedMetricType: "DynamoDBReadCapacityUtilization" || "DynamoDBWriteCapacityUtilization" || "ALBRequestCountPerTarget" || "RDSReaderAverageCPUUtilization" || "RDSReaderAverageDatabaseConnections" || "EC2SpotFleetRequestAverageCPUUtilization" || "EC2SpotFleetRequestAverageNetworkIn" || "EC2SpotFleetRequestAverageNetworkOut" || "SageMakerVariantInvocationsPerInstance" || "ECSServiceAverageCPUUtilization" || "ECSServiceAverageMemoryUtilization" || "AppStreamAverageCapacityUtilization" || "ComprehendInferenceUtilization" || "LambdaProvisionedConcurrencyUtilization" || "CassandraReadCapacityUtilization" || "CassandraWriteCapacityUtilization" || "KafkaBrokerStorageUtilization" || "ElastiCachePrimaryEngineCPUUtilization" || "ElastiCacheReplicaEngineCPUUtilization" || "ElastiCacheDatabaseMemoryUsageCountedForEvictPercentage" || "NeptuneReaderAverageCPUUtilization" || "SageMakerVariantProvisionedConcurrencyUtilization" || "ElastiCacheDatabaseCapacityUsageCountedForEvictPercentage" || "SageMakerInferenceComponentInvocationsPerCopy" || "WorkSpacesAverageUserSessionsCapacityUtilization", // required
88+
* PredefinedMetricType: "DynamoDBReadCapacityUtilization" || "DynamoDBWriteCapacityUtilization" || "ALBRequestCountPerTarget" || "RDSReaderAverageCPUUtilization" || "RDSReaderAverageDatabaseConnections" || "EC2SpotFleetRequestAverageCPUUtilization" || "EC2SpotFleetRequestAverageNetworkIn" || "EC2SpotFleetRequestAverageNetworkOut" || "SageMakerVariantInvocationsPerInstance" || "ECSServiceAverageCPUUtilization" || "ECSServiceAverageMemoryUtilization" || "AppStreamAverageCapacityUtilization" || "ComprehendInferenceUtilization" || "LambdaProvisionedConcurrencyUtilization" || "CassandraReadCapacityUtilization" || "CassandraWriteCapacityUtilization" || "KafkaBrokerStorageUtilization" || "ElastiCachePrimaryEngineCPUUtilization" || "ElastiCacheReplicaEngineCPUUtilization" || "ElastiCacheDatabaseMemoryUsageCountedForEvictPercentage" || "NeptuneReaderAverageCPUUtilization" || "SageMakerVariantProvisionedConcurrencyUtilization" || "ElastiCacheDatabaseCapacityUsageCountedForEvictPercentage" || "SageMakerInferenceComponentInvocationsPerCopy" || "WorkSpacesAverageUserSessionsCapacityUtilization" || "SageMakerInferenceComponentConcurrentRequestsPerCopyHighResolution" || "SageMakerVariantConcurrentRequestsPerModelHighResolution", // required
8989
* ResourceLabel: "STRING_VALUE",
9090
* },
9191
* CustomizedMetricSpecification: { // CustomizedMetricSpecification

clients/client-application-auto-scaling/src/models/models_0.ts

+3
Original file line numberDiff line numberDiff line change
@@ -2534,7 +2534,10 @@ export const MetricType = {
25342534
NeptuneReaderAverageCPUUtilization: "NeptuneReaderAverageCPUUtilization",
25352535
RDSReaderAverageCPUUtilization: "RDSReaderAverageCPUUtilization",
25362536
RDSReaderAverageDatabaseConnections: "RDSReaderAverageDatabaseConnections",
2537+
SageMakerInferenceComponentConcurrentRequestsPerCopyHighResolution:
2538+
"SageMakerInferenceComponentConcurrentRequestsPerCopyHighResolution",
25372539
SageMakerInferenceComponentInvocationsPerCopy: "SageMakerInferenceComponentInvocationsPerCopy",
2540+
SageMakerVariantConcurrentRequestsPerModelHighResolution: "SageMakerVariantConcurrentRequestsPerModelHighResolution",
25382541
SageMakerVariantInvocationsPerInstance: "SageMakerVariantInvocationsPerInstance",
25392542
SageMakerVariantProvisionedConcurrencyUtilization: "SageMakerVariantProvisionedConcurrencyUtilization",
25402543
WorkSpacesAverageUserSessionsCapacityUtilization: "WorkSpacesAverageUserSessionsCapacityUtilization",

codegen/sdk-codegen/aws-models/application-auto-scaling.json

+12
Original file line numberDiff line numberDiff line change
@@ -2379,6 +2379,18 @@
23792379
"traits": {
23802380
"smithy.api#enumValue": "WorkSpacesAverageUserSessionsCapacityUtilization"
23812381
}
2382+
},
2383+
"SageMakerInferenceComponentConcurrentRequestsPerCopyHighResolution": {
2384+
"target": "smithy.api#Unit",
2385+
"traits": {
2386+
"smithy.api#enumValue": "SageMakerInferenceComponentConcurrentRequestsPerCopyHighResolution"
2387+
}
2388+
},
2389+
"SageMakerVariantConcurrentRequestsPerModelHighResolution": {
2390+
"target": "smithy.api#Unit",
2391+
"traits": {
2392+
"smithy.api#enumValue": "SageMakerVariantConcurrentRequestsPerModelHighResolution"
2393+
}
23822394
}
23832395
}
23842396
},

0 commit comments

Comments
 (0)