Skip to content

Commit 7cc3c3a

Browse files
Release new parameter CapacityReservationConfig in ProductionVariant
1 parent 143d899 commit 7cc3c3a

20 files changed

+1120
-4
lines changed

generator/ServiceModels/sagemaker/sagemaker-2017-07-24.api.json

Lines changed: 48 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -5859,6 +5859,10 @@
58595859
"EmrServerlessSettings":{"shape":"EmrServerlessSettings"}
58605860
}
58615861
},
5862+
"CapacityReservationPreference":{
5863+
"type":"string",
5864+
"enum":["capacity-reservations-only"]
5865+
},
58625866
"CapacitySize":{
58635867
"type":"structure",
58645868
"required":[
@@ -12538,6 +12542,20 @@
1253812542
"EbsVolumeSizeInGb":{"shape":"SpaceEbsVolumeSizeInGb"}
1253912543
}
1254012544
},
12545+
"Ec2CapacityReservation":{
12546+
"type":"structure",
12547+
"members":{
12548+
"Ec2CapacityReservationId":{"shape":"Ec2CapacityReservationId"},
12549+
"TotalInstanceCount":{"shape":"TaskCount"},
12550+
"AvailableInstanceCount":{"shape":"TaskCount"},
12551+
"UsedByCurrentEndpoint":{"shape":"TaskCount"}
12552+
}
12553+
},
12554+
"Ec2CapacityReservationId":{"type":"string"},
12555+
"Ec2CapacityReservationsList":{
12556+
"type":"list",
12557+
"member":{"shape":"Ec2CapacityReservation"}
12558+
},
1254112559
"Edge":{
1254212560
"type":"structure",
1254312561
"members":{
@@ -18296,6 +18314,12 @@
1829618314
"min":0,
1829718315
"pattern":"1|2"
1829818316
},
18317+
"MlReservationArn":{
18318+
"type":"string",
18319+
"max":258,
18320+
"min":20,
18321+
"pattern":"arn:aws[a-z\\-]*:sagemaker:[a-z0-9\\-]*:[0-9]{12}:ml-reservation/.*"
18322+
},
1829918323
"MlTools":{
1830018324
"type":"string",
1830118325
"enum":[
@@ -21437,7 +21461,8 @@
2143721461
"EnableSSMAccess":{"shape":"ProductionVariantSSMAccess"},
2143821462
"ManagedInstanceScaling":{"shape":"ProductionVariantManagedInstanceScaling"},
2143921463
"RoutingConfig":{"shape":"ProductionVariantRoutingConfig"},
21440-
"InferenceAmiVersion":{"shape":"ProductionVariantInferenceAmiVersion"}
21464+
"InferenceAmiVersion":{"shape":"ProductionVariantInferenceAmiVersion"},
21465+
"CapacityReservationConfig":{"shape":"ProductionVariantCapacityReservationConfig"}
2144121466
}
2144221467
},
2144321468
"ProductionVariantAcceleratorType":{
@@ -21451,6 +21476,24 @@
2145121476
"ml.eia2.xlarge"
2145221477
]
2145321478
},
21479+
"ProductionVariantCapacityReservationConfig":{
21480+
"type":"structure",
21481+
"members":{
21482+
"CapacityReservationPreference":{"shape":"CapacityReservationPreference"},
21483+
"MlReservationArn":{"shape":"MlReservationArn"}
21484+
}
21485+
},
21486+
"ProductionVariantCapacityReservationSummary":{
21487+
"type":"structure",
21488+
"members":{
21489+
"MlReservationArn":{"shape":"MlReservationArn"},
21490+
"CapacityReservationPreference":{"shape":"CapacityReservationPreference"},
21491+
"TotalInstanceCount":{"shape":"TaskCount"},
21492+
"AvailableInstanceCount":{"shape":"TaskCount"},
21493+
"UsedByCurrentEndpoint":{"shape":"TaskCount"},
21494+
"Ec2CapacityReservations":{"shape":"Ec2CapacityReservationsList"}
21495+
}
21496+
},
2145421497
"ProductionVariantContainerStartupHealthCheckTimeoutInSeconds":{
2145521498
"type":"integer",
2145621499
"box":true,
@@ -21782,7 +21825,8 @@
2178221825
"CurrentServerlessConfig":{"shape":"ProductionVariantServerlessConfig"},
2178321826
"DesiredServerlessConfig":{"shape":"ProductionVariantServerlessConfig"},
2178421827
"ManagedInstanceScaling":{"shape":"ProductionVariantManagedInstanceScaling"},
21785-
"RoutingConfig":{"shape":"ProductionVariantRoutingConfig"}
21828+
"RoutingConfig":{"shape":"ProductionVariantRoutingConfig"},
21829+
"CapacityReservationConfig":{"shape":"ProductionVariantCapacityReservationSummary"}
2178621830
}
2178721831
},
2178821832
"ProductionVariantSummaryList":{
@@ -26120,7 +26164,8 @@
2612026164
"DomainId":{"shape":"UnifiedStudioDomainId"},
2612126165
"ProjectId":{"shape":"UnifiedStudioProjectId"},
2612226166
"EnvironmentId":{"shape":"UnifiedStudioEnvironmentId"},
26123-
"ProjectS3Path":{"shape":"S3Uri"}
26167+
"ProjectS3Path":{"shape":"S3Uri"},
26168+
"SingleSignOnApplicationArn":{"shape":"SingleSignOnApplicationArn"}
2612426169
}
2612526170
},
2612626171
"UpdateActionRequest":{

generator/ServiceModels/sagemaker/sagemaker-2017-07-24.docs.json

Lines changed: 52 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1812,6 +1812,13 @@
18121812
"UserSettings$CanvasAppSettings": "<p>The Canvas app settings.</p> <p>SageMaker applies these settings only to private spaces that SageMaker creates for the Canvas app.</p>"
18131813
}
18141814
},
1815+
"CapacityReservationPreference": {
1816+
"base": null,
1817+
"refs": {
1818+
"ProductionVariantCapacityReservationConfig$CapacityReservationPreference": "<p>Options that you can choose for the capacity reservation. SageMaker AI supports the following options:</p> <dl> <dt>capacity-reservations-only</dt> <dd> <p>SageMaker AI launches instances only into an ML capacity reservation. If no capacity is available, the instances fail to launch.</p> </dd> </dl>",
1819+
"ProductionVariantCapacityReservationSummary$CapacityReservationPreference": "<p>The option that you chose for the capacity reservation. SageMaker AI supports the following options:</p> <dl> <dt>capacity-reservations-only</dt> <dd> <p>SageMaker AI launches instances only into an ML capacity reservation. If no capacity is available, the instances fail to launch.</p> </dd> </dl>"
1820+
}
1821+
},
18151822
"CapacitySize": {
18161823
"base": "<p>Specifies the type and size of the endpoint capacity to activate for a blue/green deployment, a rolling deployment, or a rollback strategy. You can specify your batches as either instance count or the overall percentage of your fleet.</p> <p>For a rollback strategy, if you don't specify the fields in this object, or if you set the <code>Value</code> to 100%, then SageMaker uses a blue/green rollback strategy and rolls all traffic back to the blue fleet.</p>",
18171824
"refs": {
@@ -5562,6 +5569,24 @@
55625569
"SpaceStorageSettings$EbsStorageSettings": "<p>A collection of EBS storage settings for a space.</p>"
55635570
}
55645571
},
5572+
"Ec2CapacityReservation": {
5573+
"base": "<p>The EC2 capacity reservations that are shared to an ML capacity reservation.</p>",
5574+
"refs": {
5575+
"Ec2CapacityReservationsList$member": null
5576+
}
5577+
},
5578+
"Ec2CapacityReservationId": {
5579+
"base": null,
5580+
"refs": {
5581+
"Ec2CapacityReservation$Ec2CapacityReservationId": "<p>The unique identifier for an EC2 capacity reservation that's part of the ML capacity reservation.</p>"
5582+
}
5583+
},
5584+
"Ec2CapacityReservationsList": {
5585+
"base": null,
5586+
"refs": {
5587+
"ProductionVariantCapacityReservationSummary$Ec2CapacityReservations": "<p>The EC2 capacity reservations that are shared to this ML capacity reservation, if any.</p>"
5588+
}
5589+
},
55655590
"Edge": {
55665591
"base": "<p>A directed edge connecting two lineage entities.</p>",
55675592
"refs": {
@@ -10398,6 +10423,13 @@
1039810423
"InstanceMetadataServiceConfiguration$MinimumInstanceMetadataServiceVersion": "<p>Indicates the minimum IMDS version that the notebook instance supports. When passed as part of <code>CreateNotebookInstance</code>, if no value is selected, then it defaults to IMDSv1. This means that both IMDSv1 and IMDSv2 are supported. If passed as part of <code>UpdateNotebookInstance</code>, there is no default.</p>"
1039910424
}
1040010425
},
10426+
"MlReservationArn": {
10427+
"base": null,
10428+
"refs": {
10429+
"ProductionVariantCapacityReservationConfig$MlReservationArn": "<p>The Amazon Resource Name (ARN) that uniquely identifies the ML capacity reservation that SageMaker AI applies when it deploys the endpoint.</p>",
10430+
"ProductionVariantCapacityReservationSummary$MlReservationArn": "<p>The Amazon Resource Name (ARN) that uniquely identifies the ML capacity reservation that SageMaker AI applies when it deploys the endpoint.</p>"
10431+
}
10432+
},
1040110433
"MlTools": {
1040210434
"base": null,
1040310435
"refs": {
@@ -13320,6 +13352,18 @@
1332013352
"ProductionVariant$AcceleratorType": "<p>This parameter is no longer supported. Elastic Inference (EI) is no longer available.</p> <p>This parameter was used to specify the size of the EI instance to use for the production variant.</p>"
1332113353
}
1332213354
},
13355+
"ProductionVariantCapacityReservationConfig": {
13356+
"base": "<p>Settings for the capacity reservation for the compute instances that SageMaker AI reserves for an endpoint. </p>",
13357+
"refs": {
13358+
"ProductionVariant$CapacityReservationConfig": "<p>Settings for the capacity reservation for the compute instances that SageMaker AI reserves for an endpoint. </p>"
13359+
}
13360+
},
13361+
"ProductionVariantCapacityReservationSummary": {
13362+
"base": "<p>Details about an ML capacity reservation.</p>",
13363+
"refs": {
13364+
"ProductionVariantSummary$CapacityReservationConfig": "<p>Settings for the capacity reservation for the compute instances that SageMaker AI reserves for an endpoint. </p>"
13365+
}
13366+
},
1332313367
"ProductionVariantContainerStartupHealthCheckTimeoutInSeconds": {
1332413368
"base": null,
1332513369
"refs": {
@@ -15073,7 +15117,8 @@
1507315117
"SingleSignOnApplicationArn": {
1507415118
"base": null,
1507515119
"refs": {
15076-
"DescribeDomainResponse$SingleSignOnApplicationArn": "<p>The ARN of the application managed by SageMaker AI in IAM Identity Center. This value is only returned for domains created after October 1, 2023.</p>"
15120+
"DescribeDomainResponse$SingleSignOnApplicationArn": "<p>The ARN of the application managed by SageMaker AI in IAM Identity Center. This value is only returned for domains created after October 1, 2023.</p>",
15121+
"UnifiedStudioSettings$SingleSignOnApplicationArn": "<p>The ARN of the application managed by SageMaker AI and SageMaker Unified Studio in the Amazon Web Services IAM Identity Center.</p>"
1507715122
}
1507815123
},
1507915124
"SingleSignOnUserIdentifier": {
@@ -16204,8 +16249,14 @@
1620416249
"base": null,
1620516250
"refs": {
1620616251
"DesiredWeightAndCapacity$DesiredInstanceCount": "<p>The variant's capacity.</p>",
16252+
"Ec2CapacityReservation$TotalInstanceCount": "<p>The number of instances that you allocated to the EC2 capacity reservation.</p>",
16253+
"Ec2CapacityReservation$AvailableInstanceCount": "<p>The number of instances that are currently available in the EC2 capacity reservation.</p>",
16254+
"Ec2CapacityReservation$UsedByCurrentEndpoint": "<p>The number of instances from the EC2 capacity reservation that are being used by the endpoint.</p>",
1620716255
"PendingProductionVariantSummary$CurrentInstanceCount": "<p>The number of instances associated with the variant.</p>",
1620816256
"PendingProductionVariantSummary$DesiredInstanceCount": "<p>The number of instances requested in this deployment, as specified in the endpoint configuration for the endpoint. The value is taken from the request to the <a href=\"https://docs.aws.amazon.com/sagemaker/latest/APIReference/API_CreateEndpointConfig.html\">CreateEndpointConfig</a> operation.</p>",
16257+
"ProductionVariantCapacityReservationSummary$TotalInstanceCount": "<p>The number of instances that you allocated to the ML capacity reservation.</p>",
16258+
"ProductionVariantCapacityReservationSummary$AvailableInstanceCount": "<p>The number of instances that are currently available in the ML capacity reservation.</p>",
16259+
"ProductionVariantCapacityReservationSummary$UsedByCurrentEndpoint": "<p>The number of instances from the ML capacity reservation that are being used by the endpoint.</p>",
1620916260
"ProductionVariantSummary$CurrentInstanceCount": "<p>The number of instances associated with the variant.</p>",
1621016261
"ProductionVariantSummary$DesiredInstanceCount": "<p>The number of instances requested in the <code>UpdateEndpointWeightsAndCapacities</code> request. </p>",
1621116262
"RealTimeInferenceConfig$InstanceCount": "<p>The number of instances of the type specified by <code>InstanceType</code>.</p>"

generator/ServiceModels/sagemaker/sagemaker-2017-07-24.normal.json

Lines changed: 93 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -7023,6 +7023,10 @@
70237023
},
70247024
"documentation":"<p>The SageMaker Canvas application settings.</p>"
70257025
},
7026+
"CapacityReservationPreference":{
7027+
"type":"string",
7028+
"enum":["capacity-reservations-only"]
7029+
},
70267030
"CapacitySize":{
70277031
"type":"structure",
70287032
"required":[
@@ -19326,6 +19330,33 @@
1932619330
},
1932719331
"documentation":"<p>A collection of EBS storage settings that apply to both private and shared spaces.</p>"
1932819332
},
19333+
"Ec2CapacityReservation":{
19334+
"type":"structure",
19335+
"members":{
19336+
"Ec2CapacityReservationId":{
19337+
"shape":"Ec2CapacityReservationId",
19338+
"documentation":"<p>The unique identifier for an EC2 capacity reservation that's part of the ML capacity reservation.</p>"
19339+
},
19340+
"TotalInstanceCount":{
19341+
"shape":"TaskCount",
19342+
"documentation":"<p>The number of instances that you allocated to the EC2 capacity reservation.</p>"
19343+
},
19344+
"AvailableInstanceCount":{
19345+
"shape":"TaskCount",
19346+
"documentation":"<p>The number of instances that are currently available in the EC2 capacity reservation.</p>"
19347+
},
19348+
"UsedByCurrentEndpoint":{
19349+
"shape":"TaskCount",
19350+
"documentation":"<p>The number of instances from the EC2 capacity reservation that are being used by the endpoint.</p>"
19351+
}
19352+
},
19353+
"documentation":"<p>The EC2 capacity reservations that are shared to an ML capacity reservation.</p>"
19354+
},
19355+
"Ec2CapacityReservationId":{"type":"string"},
19356+
"Ec2CapacityReservationsList":{
19357+
"type":"list",
19358+
"member":{"shape":"Ec2CapacityReservation"}
19359+
},
1932919360
"Edge":{
1933019361
"type":"structure",
1933119362
"members":{
@@ -29342,6 +29373,12 @@
2934229373
"min":0,
2934329374
"pattern":"1|2"
2934429375
},
29376+
"MlReservationArn":{
29377+
"type":"string",
29378+
"max":258,
29379+
"min":20,
29380+
"pattern":"arn:aws[a-z\\-]*:sagemaker:[a-z0-9\\-]*:[0-9]{12}:ml-reservation/.*"
29381+
},
2934529382
"MlTools":{
2934629383
"type":"string",
2934729384
"enum":[
@@ -34305,6 +34342,10 @@
3430534342
"InferenceAmiVersion":{
3430634343
"shape":"ProductionVariantInferenceAmiVersion",
3430734344
"documentation":"<p>Specifies an option from a collection of preconfigured Amazon Machine Image (AMI) images. Each image is configured by Amazon Web Services with a set of software and driver versions. Amazon Web Services optimizes these configurations for different machine learning workloads.</p> <p>By selecting an AMI version, you can ensure that your inference environment is compatible with specific software requirements, such as CUDA driver versions, Linux kernel versions, or Amazon Web Services Neuron driver versions.</p> <p>The AMI version names, and their configurations, are the following:</p> <dl> <dt>al2-ami-sagemaker-inference-gpu-2</dt> <dd> <ul> <li> <p>Accelerator: GPU</p> </li> <li> <p>NVIDIA driver version: 535</p> </li> <li> <p>CUDA version: 12.2</p> </li> </ul> </dd> <dt>al2-ami-sagemaker-inference-gpu-2-1</dt> <dd> <ul> <li> <p>Accelerator: GPU</p> </li> <li> <p>NVIDIA driver version: 535</p> </li> <li> <p>CUDA version: 12.2</p> </li> <li> <p>NVIDIA Container Toolkit with disabled CUDA-compat mounting</p> </li> </ul> </dd> <dt>al2-ami-sagemaker-inference-gpu-3-1</dt> <dd> <ul> <li> <p>Accelerator: GPU</p> </li> <li> <p>NVIDIA driver version: 550</p> </li> <li> <p>CUDA version: 12.4</p> </li> <li> <p>NVIDIA Container Toolkit with disabled CUDA-compat mounting</p> </li> </ul> </dd> <dt>al2-ami-sagemaker-inference-neuron-2</dt> <dd> <ul> <li> <p>Accelerator: Inferentia2 and Trainium</p> </li> <li> <p>Neuron driver version: 2.19</p> </li> </ul> </dd> </dl>"
34345+
},
34346+
"CapacityReservationConfig":{
34347+
"shape":"ProductionVariantCapacityReservationConfig",
34348+
"documentation":"<p>Settings for the capacity reservation for the compute instances that SageMaker AI reserves for an endpoint. </p>"
3430834349
}
3430934350
},
3431034351
"documentation":"<p> Identifies a model that you want to host and the resources chosen to deploy for hosting it. If you are deploying multiple models, tell SageMaker how to distribute traffic among the models by specifying variant weights. For more information on production variants, check <a href=\"https://docs.aws.amazon.com/sagemaker/latest/dg/model-ab-testing.html\"> Production variants</a>. </p>"
@@ -34320,6 +34361,50 @@
3432034361
"ml.eia2.xlarge"
3432134362
]
3432234363
},
34364+
"ProductionVariantCapacityReservationConfig":{
34365+
"type":"structure",
34366+
"members":{
34367+
"CapacityReservationPreference":{
34368+
"shape":"CapacityReservationPreference",
34369+
"documentation":"<p>Options that you can choose for the capacity reservation. SageMaker AI supports the following options:</p> <dl> <dt>capacity-reservations-only</dt> <dd> <p>SageMaker AI launches instances only into an ML capacity reservation. If no capacity is available, the instances fail to launch.</p> </dd> </dl>"
34370+
},
34371+
"MlReservationArn":{
34372+
"shape":"MlReservationArn",
34373+
"documentation":"<p>The Amazon Resource Name (ARN) that uniquely identifies the ML capacity reservation that SageMaker AI applies when it deploys the endpoint.</p>"
34374+
}
34375+
},
34376+
"documentation":"<p>Settings for the capacity reservation for the compute instances that SageMaker AI reserves for an endpoint. </p>"
34377+
},
34378+
"ProductionVariantCapacityReservationSummary":{
34379+
"type":"structure",
34380+
"members":{
34381+
"MlReservationArn":{
34382+
"shape":"MlReservationArn",
34383+
"documentation":"<p>The Amazon Resource Name (ARN) that uniquely identifies the ML capacity reservation that SageMaker AI applies when it deploys the endpoint.</p>"
34384+
},
34385+
"CapacityReservationPreference":{
34386+
"shape":"CapacityReservationPreference",
34387+
"documentation":"<p>The option that you chose for the capacity reservation. SageMaker AI supports the following options:</p> <dl> <dt>capacity-reservations-only</dt> <dd> <p>SageMaker AI launches instances only into an ML capacity reservation. If no capacity is available, the instances fail to launch.</p> </dd> </dl>"
34388+
},
34389+
"TotalInstanceCount":{
34390+
"shape":"TaskCount",
34391+
"documentation":"<p>The number of instances that you allocated to the ML capacity reservation.</p>"
34392+
},
34393+
"AvailableInstanceCount":{
34394+
"shape":"TaskCount",
34395+
"documentation":"<p>The number of instances that are currently available in the ML capacity reservation.</p>"
34396+
},
34397+
"UsedByCurrentEndpoint":{
34398+
"shape":"TaskCount",
34399+
"documentation":"<p>The number of instances from the ML capacity reservation that are being used by the endpoint.</p>"
34400+
},
34401+
"Ec2CapacityReservations":{
34402+
"shape":"Ec2CapacityReservationsList",
34403+
"documentation":"<p>The EC2 capacity reservations that are shared to this ML capacity reservation, if any.</p>"
34404+
}
34405+
},
34406+
"documentation":"<p>Details about an ML capacity reservation.</p>"
34407+
},
3432334408
"ProductionVariantContainerStartupHealthCheckTimeoutInSeconds":{
3432434409
"type":"integer",
3432534410
"box":true,
@@ -34732,6 +34817,10 @@
3473234817
"RoutingConfig":{
3473334818
"shape":"ProductionVariantRoutingConfig",
3473434819
"documentation":"<p>Settings that control how the endpoint routes incoming traffic to the instances that the endpoint hosts.</p>"
34820+
},
34821+
"CapacityReservationConfig":{
34822+
"shape":"ProductionVariantCapacityReservationSummary",
34823+
"documentation":"<p>Settings for the capacity reservation for the compute instances that SageMaker AI reserves for an endpoint. </p>"
3473534824
}
3473634825
},
3473734826
"documentation":"<p>Describes weight and capacities for a production variant associated with an endpoint. If you sent a request to the <code>UpdateEndpointWeightsAndCapacities</code> API and the endpoint status is <code>Updating</code>, you get different desired and current values. </p>"
@@ -41161,6 +41250,10 @@
4116141250
"ProjectS3Path":{
4116241251
"shape":"S3Uri",
4116341252
"documentation":"<p>The location where Amazon S3 stores temporary execution data and other artifacts for the project that corresponds to the domain.</p>"
41253+
},
41254+
"SingleSignOnApplicationArn":{
41255+
"shape":"SingleSignOnApplicationArn",
41256+
"documentation":"<p>The ARN of the application managed by SageMaker AI and SageMaker Unified Studio in the Amazon Web Services IAM Identity Center.</p>"
4116441257
}
4116541258
},
4116641259
"documentation":"<p>The settings that apply to an Amazon SageMaker AI domain when you use it in Amazon SageMaker Unified Studio.</p>"

0 commit comments

Comments
 (0)