Skip to content

Commit e5c12be

Browse files
authored
Add v3 local models (#4180)
* Update v3 local models
* Update v3 model paths
1 parent 1b65861 commit e5c12be

30 files changed

Lines changed: 45 additions & 45 deletions

File tree

assets/models/system/DeepSeek-R1-Distill-Qwen-1.5B-cuda-gpu/model.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,6 +1,6 @@
11
path:
22
container_name: models
3-
container_path: foundrylocal/fl-perf-improvements/deepseek-r1-distill-qwen-1.5b/onnx/cuda/cuda-int4-kquant-block-128-mixed/v2
3+
container_path: foundrylocal/fl-perf-improvements/deepseek-r1-distill-qwen-1.5b/onnx/cuda/cuda-int4-kquant-block-128-mixed/v3
44
storage_name: automlcesdkdataresources
55
type: azureblob
66
publish:

assets/models/system/DeepSeek-R1-Distill-Qwen-1.5B-cuda-gpu/spec.yaml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -1,6 +1,6 @@
11
$schema: https://azuremlschemas.azureedge.net/latest/model.schema.json
22
name: deepseek-r1-distill-qwen-1.5b-cuda-gpu
3-
version: 2
3+
version: 3
44
path: ./
55
tags:
66
foundryLocal: ""
@@ -12,7 +12,7 @@ tags:
1212
task: chat-completion
1313
maxOutputTokens: 2048
1414
alias: deepseek-r1-1.5b
15-
directoryPath: v2
15+
directoryPath: v3
1616
promptTemplate: "{\"assistant\": \"{Content}\", \"prompt\": \"\\\\u003C\\\\uFF5CUser\\\\uFF5C\\\\u003E{Content}\\\\u003C\\\\uFF5CAssistant\\\\uFF5C\\\\u003E\"}"
1717
parameterSchema: "{\"enabled\": [{\"name\": \"temperature\", \"default\": 0.6}, {\"name\": \"top_p\", \"default\": 0.95}, {\"name\": \"top_k\", \"default\": 40}, {\"name\": \"presence_penalty\", \"default\": 1.3}]}"
1818
type: custom_model

assets/models/system/DeepSeek-R1-Distill-Qwen-1.5B-generic-cpu/model.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,6 +1,6 @@
11
path:
22
container_name: models
3-
container_path: foundrylocal/fl-perf-improvements/deepseek-r1-distill-qwen-1.5b/onnx/cpu_and_mobile/cpu-int4-kquant-block-128-mixed-acc-level-4/v2
3+
container_path: foundrylocal/fl-perf-improvements/deepseek-r1-distill-qwen-1.5b/onnx/cpu_and_mobile/cpu-int4-kquant-block-128-mixed-acc-level-4/v3
44
storage_name: automlcesdkdataresources
55
type: azureblob
66
publish:

assets/models/system/DeepSeek-R1-Distill-Qwen-1.5B-generic-cpu/spec.yaml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -1,6 +1,6 @@
11
$schema: https://azuremlschemas.azureedge.net/latest/model.schema.json
22
name: deepseek-r1-distill-qwen-1.5b-generic-cpu
3-
version: 2
3+
version: 3
44
path: ./
55
tags:
66
foundryLocal: ""
@@ -12,7 +12,7 @@ tags:
1212
task: chat-completion
1313
maxOutputTokens: 2048
1414
alias: deepseek-r1-1.5b
15-
directoryPath: v2
15+
directoryPath: v3
1616
promptTemplate: "{\"assistant\": \"{Content}\", \"prompt\": \"\\\\u003C\\\\uFF5CUser\\\\uFF5C\\\\u003E{Content}\\\\u003C\\\\uFF5CAssistant\\\\uFF5C\\\\u003E\"}"
1717
parameterSchema: "{\"enabled\": [{\"name\": \"temperature\", \"default\": 0.6}, {\"name\": \"top_p\", \"default\": 0.95}, {\"name\": \"top_k\", \"default\": 40}, {\"name\": \"presence_penalty\", \"default\": 1.1}]}"
1818
type: custom_model

assets/models/system/DeepSeek-R1-Distill-Qwen-1.5B-generic-gpu/model.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,6 +1,6 @@
11
path:
22
container_name: models
3-
container_path: foundrylocal/fl-perf-improvements/deepseek-r1-distill-qwen-1.5b/onnx/webgpu/webgpu-int4-kquant-block-32-mixed-acc-level-4/v1
3+
container_path: foundrylocal/fl-perf-improvements/deepseek-r1-distill-qwen-1.5b/onnx/webgpu/webgpu-int4-kquant-block-32-mixed-acc-level-4/v3
44
storage_name: automlcesdkdataresources
55
type: azureblob
66
publish:

assets/models/system/DeepSeek-R1-Distill-Qwen-1.5B-generic-gpu/spec.yaml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -1,6 +1,6 @@
11
$schema: https://azuremlschemas.azureedge.net/latest/model.schema.json
22
name: deepseek-r1-distill-qwen-1.5b-generic-gpu
3-
version: 2
3+
version: 3
44
path: ./
55
tags:
66
foundryLocal: ""
@@ -12,7 +12,7 @@ tags:
1212
task: chat-completion
1313
maxOutputTokens: 2048
1414
alias: deepseek-r1-1.5b
15-
directoryPath: v1
15+
directoryPath: v3
1616
promptTemplate: "{\"assistant\": \"{Content}\", \"prompt\": \"\\\\u003C\\\\uFF5CUser\\\\uFF5C\\\\u003E{Content}\\\\u003C\\\\uFF5CAssistant\\\\uFF5C\\\\u003E\"}"
1717
parameterSchema: "{\"enabled\": [{\"name\": \"temperature\", \"default\": 0.6}, {\"name\": \"top_p\", \"default\": 0.95}, {\"name\": \"top_k\", \"default\": 40}, {\"name\": \"presence_penalty\", \"default\": 1.3}]}"
1818
type: custom_model

assets/models/system/DeepSeek-R1-Distill-Qwen-7B-cuda-gpu/model.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,6 +1,6 @@
11
path:
22
container_name: models
3-
container_path: foundrylocal/fl-perf-improvements/deepseek-r1-distill-qwen-7b/onnx/cuda/cuda-int4-kquant-block-128-mixed/v2
3+
container_path: foundrylocal/fl-perf-improvements/deepseek-r1-distill-qwen-7b/onnx/cuda/cuda-int4-kquant-block-128-mixed/v3
44
storage_name: automlcesdkdataresources
55
type: azureblob
66
publish:

assets/models/system/DeepSeek-R1-Distill-Qwen-7B-cuda-gpu/spec.yaml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -1,6 +1,6 @@
11
$schema: https://azuremlschemas.azureedge.net/latest/model.schema.json
22
name: deepseek-r1-distill-qwen-7b-cuda-gpu
3-
version: 2
3+
version: 3
44
path: ./
55
tags:
66
foundryLocal: ""
@@ -12,7 +12,7 @@ tags:
1212
task: chat-completion
1313
maxOutputTokens: 2048
1414
alias: deepseek-r1-7b
15-
directoryPath: v2
15+
directoryPath: v3
1616
promptTemplate: "{\"assistant\": \"{Content}\", \"prompt\": \"\\\\u003C\\\\uFF5CUser\\\\uFF5C\\\\u003E{Content}\\\\u003C\\\\uFF5CAssistant\\\\uFF5C\\\\u003E\"}"
1717
type: custom_model
1818
variantInfo:

assets/models/system/DeepSeek-R1-Distill-Qwen-7B-generic-cpu/model.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,6 +1,6 @@
11
path:
22
container_name: models
3-
container_path: foundrylocal/fl-perf-improvements/deepseek-r1-distill-qwen-7b/onnx/cpu_and_mobile/cpu-int4-kquant-block-128-mixed-acc-level-4/v2
3+
container_path: foundrylocal/fl-perf-improvements/deepseek-r1-distill-qwen-7b/onnx/cpu_and_mobile/cpu-int4-kquant-block-128-mixed-acc-level-4/v3
44
storage_name: automlcesdkdataresources
55
type: azureblob
66
publish:

assets/models/system/DeepSeek-R1-Distill-Qwen-7B-generic-cpu/spec.yaml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -1,6 +1,6 @@
11
$schema: https://azuremlschemas.azureedge.net/latest/model.schema.json
22
name: deepseek-r1-distill-qwen-7b-generic-cpu
3-
version: 2
3+
version: 3
44
path: ./
55
tags:
66
foundryLocal: ""
@@ -12,7 +12,7 @@ tags:
1212
task: chat-completion
1313
maxOutputTokens: 2048
1414
alias: deepseek-r1-7b
15-
directoryPath: v2
15+
directoryPath: v3
1616
promptTemplate: "{\"assistant\": \"{Content}\", \"prompt\": \"\\\\u003C\\\\uFF5CUser\\\\uFF5C\\\\u003E{Content}\\\\u003C\\\\uFF5CAssistant\\\\uFF5C\\\\u003E\"}"
1717
type: custom_model
1818
variantInfo:

0 commit comments

Comments
 (0)