Skip to content

Commit 535f8e8

Browse files
lykelly19 and lykelly19 authored
Migrate deploymentOptions from tags to system metadata (#5062)
Co-authored-by: lykelly19 <kellyly@microsoft.com>
1 parent 5a369a2 commit 535f8e8

11 files changed

Lines changed: 65 additions & 11 deletions

File tree

assets/models/system/Phi-4/spec.yaml

Lines changed: 6 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -11,6 +11,12 @@ properties:
1111
finetune-recommended-sku: Standard_NC24ads_A100_v4, Standard_NC48ads_A100_v4, Standard_NC96ads_A100_v4, Standard_ND96asr_v4, Standard_ND96amsr_A100_v4, Standard_NC40ads_H100_v5, Standard_NC80adis_H100_v5, Standard_ND96isr_H100_v5
1212
languages: en
1313
SharedComputeCapacityEnabled: "True"
14+
system_metadata:
15+
deploymentOptions:
16+
- UnifiedEndpointMaaS
17+
- MaaP
18+
- ServerlessMaaS
19+
1420
tags:
1521
author: Microsoft
1622
SharedComputeCapacityEnabled: ""
@@ -37,7 +43,6 @@ tags:
3743
notes: "notes.md"
3844
hiddenlayerscanned: ""
3945
maas-inference: "true"
40-
deploymentOptions: "UnifiedEndpointMaaS, MaaP, ServerlessMaaS"
4146
inference_compute_allow_list:
4247
[
4348
Standard_NC24ads_A100_v4,

assets/models/system/phi-3-medium-128k-instruct/spec.yaml

Lines changed: 6 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -9,6 +9,12 @@ properties:
99
finetuning-tasks: chat-completion
1010
finetune-min-sku-spec: 96|4|880|256
1111
finetune-recommended-sku: Standard_NC96ads_A100_v4, Standard_ND96amsr_A100_v4
12+
system_metadata:
13+
deploymentOptions:
14+
- UnifiedEndpointMaaS
15+
- MaaP
16+
- ServerlessMaaS
17+
1218
tags:
1319
InferenceLegacyDate: '2025-06-09'
1420
InferenceDeprecationDate: '2025-06-30'
@@ -31,7 +37,6 @@ tags:
3137
playgroundRateLimitTier: "low"
3238
Featured: ""
3339
maas-inference: "true"
34-
deploymentOptions: "UnifiedEndpointMaaS, MaaP, ServerlessMaaS"
3540
license: MIT
3641
disable-batch: "true"
3742
task: chat-completion

assets/models/system/phi-3-medium-4k-instruct/spec.yaml

Lines changed: 6 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -9,6 +9,12 @@ properties:
99
finetuning-tasks: chat-completion
1010
finetune-min-sku-spec: 96|4|880|256
1111
finetune-recommended-sku: Standard_NC96ads_A100_v4, Standard_ND96amsr_A100_v4
12+
system_metadata:
13+
deploymentOptions:
14+
- UnifiedEndpointMaaS
15+
- MaaP
16+
- ServerlessMaaS
17+
1218
tags:
1319
InferenceLegacyDate: '2025-06-09'
1420
InferenceDeprecationDate: '2025-06-30'
@@ -32,7 +38,6 @@ tags:
3238
Featured: ""
3339
SharedComputeCapacityEnabled: ''
3440
maas-inference: "true"
35-
deploymentOptions: "UnifiedEndpointMaaS, MaaP, ServerlessMaaS"
3641
hiddenlayerscanned : ""
3742
license: MIT
3843
disable-batch: "true"

assets/models/system/phi-3-mini-128k-instruct/spec.yaml

Lines changed: 6 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -9,6 +9,12 @@ properties:
99
finetuning-tasks: chat-completion
1010
finetune-min-sku-spec: 24|1|220|64
1111
finetune-recommended-sku: Standard_NC24ads_A100_v4, Standard_NC48ads_A100_v4, Standard_NC96ads_A100_v4, Standard_ND96amsr_A100_v4
12+
system_metadata:
13+
deploymentOptions:
14+
- UnifiedEndpointMaaS
15+
- MaaP
16+
- ServerlessMaaS
17+
1218
tags:
1319
InferenceLegacyDate: '2025-06-09'
1420
InferenceDeprecationDate: '2025-06-30'
@@ -31,7 +37,6 @@ tags:
3137
playgroundRateLimitTier: "low"
3238
Featured: ""
3339
maas-inference: "true"
34-
deploymentOptions: "UnifiedEndpointMaaS, MaaP, ServerlessMaaS"
3540
license: MIT
3641
disable-batch: "true"
3742
task: chat-completion

assets/models/system/phi-3-mini-4k-instruct/spec.yaml

Lines changed: 6 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -9,6 +9,12 @@ properties:
99
finetuning-tasks: chat-completion
1010
finetune-min-sku-spec: 24|1|220|64
1111
finetune-recommended-sku: Standard_NC24ads_A100_v4, Standard_NC48ads_A100_v4, Standard_NC96ads_A100_v4, Standard_ND96asr_v4, Standard_ND96amsr_A100_v4
12+
system_metadata:
13+
deploymentOptions:
14+
- UnifiedEndpointMaaS
15+
- MaaP
16+
- ServerlessMaaS
17+
1218
tags:
1319
InferenceLegacyDate: '2025-06-09'
1420
InferenceDeprecationDate: '2025-06-30'
@@ -31,7 +37,6 @@ tags:
3137
playgroundRateLimitTier: "low"
3238
Featured: ""
3339
maas-inference: "true"
34-
deploymentOptions: "UnifiedEndpointMaaS, MaaP, ServerlessMaaS"
3540
SharedComputeCapacityEnabled: ''
3641
license: MIT
3742
disable-batch: "true"

assets/models/system/phi-3-small-128k-instruct/spec.yaml

Lines changed: 6 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -9,6 +9,12 @@ properties:
99
finetuning-tasks: chat-completion
1010
finetune-min-sku-spec: 96|4|880|256
1111
finetune-recommended-sku: Standard_NC96ads_A100_v4, Standard_ND96amsr_A100_v4
12+
system_metadata:
13+
deploymentOptions:
14+
- UnifiedEndpointMaaS
15+
- MaaP
16+
- ServerlessMaaS
17+
1218
tags:
1319
InferenceLegacyDate: '2025-06-09'
1420
InferenceDeprecationDate: '2025-06-30'
@@ -30,7 +36,6 @@ tags:
3036
playgroundRateLimitTier: "low"
3137
Featured: ""
3238
maas-inference: "true"
33-
deploymentOptions: "UnifiedEndpointMaaS, MaaP, ServerlessMaaS"
3439
SharedComputeCapacityEnabled: ''
3540
license: MIT
3641
disable-batch: "true"

assets/models/system/phi-3-small-8k-instruct/spec.yaml

Lines changed: 6 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -9,6 +9,12 @@ properties:
99
finetuning-tasks: chat-completion
1010
finetune-min-sku-spec: 96|4|880|256
1111
finetune-recommended-sku: Standard_NC96ads_A100_v4, Standard_ND96amsr_A100_v4
12+
system_metadata:
13+
deploymentOptions:
14+
- UnifiedEndpointMaaS
15+
- MaaP
16+
- ServerlessMaaS
17+
1218
tags:
1319
InferenceLegacyDate: '2025-06-09'
1420
InferenceDeprecationDate: '2025-06-30'
@@ -30,7 +36,6 @@ tags:
3036
playgroundRateLimitTier: "low"
3137
Featured: ""
3238
maas-inference: "true"
33-
deploymentOptions: "UnifiedEndpointMaaS, MaaP, ServerlessMaaS"
3439
license: MIT
3540
disable-batch: "true"
3641
task: chat-completion

assets/models/system/phi-3-vision-128k-instruct/spec.yaml

Lines changed: 5 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -6,6 +6,11 @@ properties:
66
languages: en
77
inference-min-sku-spec: 48|2|440|128
88
inference-recommended-sku: Standard_NC48ads_A100_v4, Standard_NC96ads_A100_v4, Standard_ND96amsr_A100_v4
9+
system_metadata:
10+
deploymentOptions:
11+
- UnifiedEndpointMaaS
12+
- MaaP
13+
914
tags:
1015
InferenceLegacyDate: '2025-06-09'
1116
InferenceDeprecationDate: '2025-06-30'
@@ -15,7 +20,6 @@ tags:
1520
Featured: ""
1621
license: MIT
1722
disable-batch: "true"
18-
deploymentOptions: "UnifiedEndpointMaaS, MaaP"
1923
task: chat-completion
2024
hiddenlayerscanned: ""
2125
author: Microsoft

assets/models/system/phi-3.5-mini-128k-instruct/spec.yaml

Lines changed: 6 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -9,6 +9,12 @@ properties:
99
finetuning-tasks: chat-completion
1010
finetune-min-sku-spec: 24|1|220|64
1111
finetune-recommended-sku: Standard_NC24ads_A100_v4, Standard_NC48ads_A100_v4, Standard_NC96ads_A100_v4, Standard_ND96amsr_A100_v4
12+
system_metadata:
13+
deploymentOptions:
14+
- UnifiedEndpointMaaS
15+
- MaaP
16+
- ServerlessMaaS
17+
1218
tags:
1319
InferenceLegacyDate: '2025-06-09'
1420
InferenceDeprecationDate: '2025-06-30'
@@ -31,7 +37,6 @@ tags:
3137
playgroundRateLimitTier: "low"
3238
Featured: ""
3339
maas-inference: "true"
34-
deploymentOptions: "UnifiedEndpointMaaS, MaaP, ServerlessMaaS"
3540
license: MIT
3641
disable-batch: "true"
3742
task: chat-completion

assets/models/system/phi-3.5-moe-128k-instruct/spec.yaml

Lines changed: 6 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -9,6 +9,12 @@ properties:
99
finetuning-tasks: chat-completion
1010
finetune-min-sku-spec: 96|4|880|256
1111
finetune-recommended-sku: Standard_NC96ads_A100_v4, Standard_ND96amsr_A100_v4
12+
system_metadata:
13+
deploymentOptions:
14+
- UnifiedEndpointMaaS
15+
- MaaP
16+
- ServerlessMaaS
17+
1218
tags:
1319
InferenceLegacyDate: '2025-06-09'
1420
InferenceDeprecationDate: '2025-06-30'
@@ -31,7 +37,6 @@ tags:
3137
playgroundRateLimitTier: "low"
3238
Featured: ""
3339
maas-inference: "true"
34-
deploymentOptions: "UnifiedEndpointMaaS, MaaP, ServerlessMaaS"
3540
license: MIT
3641
disable-batch: "true"
3742
task: chat-completion

0 commit comments

Comments (0)