Skip to content

Commit 3ef9a90

Browse files
author
AWS
committed
Amazon SageMaker Service Update: Idle resource sharing enables teams to borrow unused compute resources in your SageMaker HyperPod cluster. This capability maximizes resource utilization by allowing teams to borrow idle compute capacity beyond their allocated compute quotas.
1 parent dad003b commit 3ef9a90

2 files changed

Lines changed: 45 additions & 1 deletion

File tree

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,6 @@
1+
{
2+
"type": "feature",
3+
"category": "Amazon SageMaker Service",
4+
"contributor": "",
5+
"description": "Idle resource sharing enables teams to borrow unused compute resources in your SageMaker HyperPod cluster. This capability maximizes resource utilization by allowing teams to borrow idle compute capacity beyond their allocated compute quotas."
6+
}

services/sagemaker/src/main/resources/codegen-resources/service-2.json

Lines changed: 39 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -4689,6 +4689,12 @@
46894689
}
46904690
},
46914691
"shapes":{
4692+
"AbsoluteBorrowLimitResourceList":{
4693+
"type":"list",
4694+
"member":{"shape":"ComputeQuotaResourceConfig"},
4695+
"max":15,
4696+
"min":0
4697+
},
46924698
"AcceleratorPartitionConfig":{
46934699
"type":"structure",
46944700
"required":[
@@ -7761,7 +7767,7 @@
77617767
"BorrowLimit":{
77627768
"type":"integer",
77637769
"box":true,
7764-
"max":500,
7770+
"max":10000,
77657771
"min":0
77667772
},
77677773
"Branch":{
@@ -16625,6 +16631,10 @@
1662516631
"shape":"FailureReason",
1662616632
"documentation":"<p>Failure reason of the cluster policy.</p>"
1662716633
},
16634+
"StatusDetails":{
16635+
"shape":"StatusDetailsMap",
16636+
"documentation":"<p>Additional details about the status of the cluster policy. This field provides context when the policy is in a non-active state, such as during creation, updates, or if failures occur.</p>"
16637+
},
1662816638
"ClusterArn":{
1662916639
"shape":"ClusterArn",
1663016640
"documentation":"<p>ARN of the cluster where the cluster policy is applied.</p>"
@@ -25315,6 +25325,13 @@
2531525325
"max":20,
2531625326
"min":0
2531725327
},
25328+
"IdleResourceSharing":{
25329+
"type":"string",
25330+
"enum":[
25331+
"Enabled",
25332+
"Disabled"
25333+
]
25334+
},
2531825335
"IdleSettings":{
2531925336
"type":"structure",
2532025337
"members":{
@@ -40137,6 +40154,10 @@
4013740154
"BorrowLimit":{
4013840155
"shape":"BorrowLimit",
4013940156
"documentation":"<p>The limit on how much idle compute can be borrowed.The values can be 1 - 500 percent of idle compute that the team is allowed to borrow.</p> <p>Default is <code>50</code>.</p>"
40157+
},
40158+
"AbsoluteBorrowLimits":{
40159+
"shape":"AbsoluteBorrowLimitResourceList",
40160+
"documentation":"<p>The absolute limits on compute resources that can be borrowed from idle compute. When specified, these limits define the maximum amount of specific resource types (such as accelerators, vCPU, or memory) that an entity can borrow, regardless of the percentage-based <code>BorrowLimit</code>.</p>"
4014040161
}
4014140162
},
4014240163
"documentation":"<p>Resource sharing configuration.</p>"
@@ -40714,10 +40735,22 @@
4071440735
"FairShare":{
4071540736
"shape":"FairShare",
4071640737
"documentation":"<p>When enabled, entities borrow idle compute based on their assigned <code>FairShareWeight</code>.</p> <p>When disabled, entities borrow idle compute based on a first-come first-serve basis.</p> <p>Default is <code>Enabled</code>.</p>"
40738+
},
40739+
"IdleResourceSharing":{
40740+
"shape":"IdleResourceSharing",
40741+
"documentation":"<p>Configuration for sharing idle compute resources across entities in the cluster. When enabled, unallocated resources are automatically calculated and made available for entities to borrow. </p>"
4071740742
}
4071840743
},
4071940744
"documentation":"<p>Cluster policy configuration. This policy is used for task prioritization and fair-share allocation. This helps prioritize critical workloads and distributes idle compute across entities.</p>"
4072040745
},
40746+
"SchedulerConfigComponent":{
40747+
"type":"string",
40748+
"enum":[
40749+
"PriorityClasses",
40750+
"FairShare",
40751+
"IdleResourceSharing"
40752+
]
40753+
},
4072140754
"SchedulerResourceStatus":{
4072240755
"type":"string",
4072340756
"enum":[
@@ -41994,6 +42027,11 @@
4199442027
"min":0,
4199542028
"pattern":".*"
4199642029
},
42030+
"StatusDetailsMap":{
42031+
"type":"map",
42032+
"key":{"shape":"SchedulerConfigComponent"},
42033+
"value":{"shape":"SchedulerResourceStatus"}
42034+
},
4199742035
"StatusMessage":{"type":"string"},
4199842036
"StepDescription":{
4199942037
"type":"string",

0 commit comments

Comments
 (0)