Skip to content

Commit cc79c5a

Browse files
Update Whisper model to a quantized version (#5013)
Co-authored-by: kunal-vaishnavi <115581922+kunal-vaishnavi@users.noreply.github.com>
1 parent 09c92d4 commit cc79c5a

10 files changed

Lines changed: 31 additions & 31 deletions

File tree

assets/models/foundrylocal/openai-whisper-base-generic-cpu/model.yaml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -1,7 +1,7 @@
11
path:
22
container_name: models
3-
container_path: foundrylocal/models/openai-whisper-base/onnx/cpu_and_mobile/v2
4-
storage_name: foundrylocalmodels
3+
container_path: foundrylocal/models/openai-whisper-base/onnx/cpu_and_mobile/v3
4+
storage_name: foundrylocalassetdata
55
type: azureblob
66
publish:
77
description: description.md

assets/models/foundrylocal/openai-whisper-base-generic-cpu/spec.yaml

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -1,6 +1,6 @@
11
$schema: https://azuremlschemas.azureedge.net/latest/model.schema.json
22
name: openai-whisper-base-generic-cpu
3-
version: 2
3+
version: 3
44
path: ./
55
tags:
66
foundryLocal: ""
@@ -12,7 +12,7 @@ tags:
1212
task: automatic-speech-recognition
1313
maxOutputTokens: 2048
1414
alias: whisper-base
15-
directoryPath: v2
15+
directoryPath: v3
1616
promptTemplate: "{\"prompt\": \"<|startoftranscript|> <|en|> <|transcribe|> <|notimestamps|>\"}"
1717
contextLength: 448
1818
capabilities: ""
@@ -30,5 +30,5 @@ variantInfo:
3030
quantization: ['RTN']
3131
device: 'cpu'
3232
executionProvider: 'CPUExecutionProvider'
33-
fileSizeBytes: 402590167
34-
vRamFootprintBytes: 402590167
33+
fileSizeBytes: 215285518
34+
vRamFootprintBytes: 215285518

assets/models/foundrylocal/openai-whisper-large-v3-turbo-generic-cpu/model.yaml

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -1,7 +1,7 @@
11
path:
2-
container_name: whisper-models
3-
container_path: whisper-large-v3-turbo/cpu-fp32/v2
4-
storage_name: foundrylocalmodels
2+
container_name: models
3+
container_path: foundrylocal/models/openai-whisper-large-v3-turbo/onnx/cpu_and_mobile/v3
4+
storage_name: foundrylocalassetdata
55
type: azureblob
66
publish:
77
description: description.md

assets/models/foundrylocal/openai-whisper-large-v3-turbo-generic-cpu/spec.yaml

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -1,6 +1,6 @@
11
$schema: https://azuremlschemas.azureedge.net/latest/model.schema.json
22
name: openai-whisper-large-v3-turbo-generic-cpu
3-
version: 2
3+
version: 3
44
path: ./
55
tags:
66
foundryLocal: ""
@@ -12,7 +12,7 @@ tags:
1212
task: automatic-speech-recognition
1313
maxOutputTokens: 2048
1414
alias: whisper-large-v3-turbo
15-
directoryPath: v2
15+
directoryPath: v3
1616
promptTemplate: "{\"prompt\": \"<|startoftranscript|> <|en|> <|transcribe|> <|notimestamps|>\"}"
1717
contextLength: 448
1818
capabilities: ""
@@ -30,5 +30,5 @@ variantInfo:
3030
quantization: ['RTN']
3131
device: 'cpu'
3232
executionProvider: 'CPUExecutionProvider'
33-
fileSizeBytes: 9438190632
34-
vRamFootprintBytes: 9438528266
33+
fileSizeBytes: 1678544910
34+
vRamFootprintBytes: 1678544910

assets/models/foundrylocal/openai-whisper-medium-generic-cpu/model.yaml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -1,7 +1,7 @@
11
path:
22
container_name: models
3-
container_path: foundrylocal/models/openai-whisper-medium/onnx/cpu_and_mobile/v2
4-
storage_name: foundrylocalmodels
3+
container_path: foundrylocal/models/openai-whisper-medium/onnx/cpu_and_mobile/v3
4+
storage_name: foundrylocalassetdata
55
type: azureblob
66
publish:
77
description: description.md

assets/models/foundrylocal/openai-whisper-medium-generic-cpu/spec.yaml

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -1,6 +1,6 @@
11
$schema: https://azuremlschemas.azureedge.net/latest/model.schema.json
22
name: openai-whisper-medium-generic-cpu
3-
version: 2
3+
version: 3
44
path: ./
55
tags:
66
foundryLocal: ""
@@ -12,7 +12,7 @@ tags:
1212
task: automatic-speech-recognition
1313
maxOutputTokens: 2048
1414
alias: whisper-medium
15-
directoryPath: v2
15+
directoryPath: v3
1616
promptTemplate: "{\"prompt\": \"<|startoftranscript|> <|en|> <|transcribe|> <|notimestamps|>\"}"
1717
contextLength: 448
1818
capabilities: ""
@@ -30,5 +30,5 @@ variantInfo:
3030
quantization: ['RTN']
3131
device: 'cpu'
3232
executionProvider: 'CPUExecutionProvider'
33-
fileSizeBytes: 3274421068
34-
vRamFootprintBytes: 3274421068
33+
fileSizeBytes: 1334385110
34+
vRamFootprintBytes: 1334385110

assets/models/foundrylocal/openai-whisper-small-generic-cpu/model.yaml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -1,7 +1,7 @@
11
path:
22
container_name: models
3-
container_path: foundrylocal/models/openai-whisper-small/onnx/cpu_and_mobile/v2
4-
storage_name: foundrylocalmodels
3+
container_path: foundrylocal/models/openai-whisper-small/onnx/cpu_and_mobile/v3
4+
storage_name: foundrylocalassetdata
55
type: azureblob
66
publish:
77
description: description.md

assets/models/foundrylocal/openai-whisper-small-generic-cpu/spec.yaml

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -1,6 +1,6 @@
11
$schema: https://azuremlschemas.azureedge.net/latest/model.schema.json
22
name: openai-whisper-small-generic-cpu
3-
version: 2
3+
version: 3
44
path: ./
55
tags:
66
foundryLocal: ""
@@ -12,7 +12,7 @@ tags:
1212
task: automatic-speech-recognition
1313
maxOutputTokens: 2048
1414
alias: whisper-small
15-
directoryPath: v2
15+
directoryPath: v3
1616
promptTemplate: "{\"prompt\": \"<|startoftranscript|> <|en|> <|transcribe|> <|notimestamps|>\"}"
1717
contextLength: 448
1818
capabilities: ""
@@ -30,5 +30,5 @@ variantInfo:
3030
quantization: ['RTN']
3131
device: 'cpu'
3232
executionProvider: 'CPUExecutionProvider'
33-
fileSizeBytes: 1132432089
34-
vRamFootprintBytes: 1132432089
33+
fileSizeBytes: 516028869
34+
vRamFootprintBytes: 516028869

assets/models/foundrylocal/openai-whisper-tiny-generic-cpu/model.yaml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -1,7 +1,7 @@
11
path:
22
container_name: models
3-
container_path: foundrylocal/models/openai-whisper-tiny/onnx/cpu_and_mobile/v3
4-
storage_name: foundrylocalmodels
3+
container_path: foundrylocal/models/openai-whisper-tiny/onnx/cpu_and_mobile/v4
4+
storage_name: foundrylocalassetdata
55
type: azureblob
66
publish:
77
description: description.md

assets/models/foundrylocal/openai-whisper-tiny-generic-cpu/spec.yaml

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -1,6 +1,6 @@
11
$schema: https://azuremlschemas.azureedge.net/latest/model.schema.json
22
name: openai-whisper-tiny-generic-cpu
3-
version: 3
3+
version: 4
44
path: ./
55
tags:
66
foundryLocal: ""
@@ -12,7 +12,7 @@ tags:
1212
task: automatic-speech-recognition
1313
maxOutputTokens: 2048
1414
alias: whisper-tiny
15-
directoryPath: v3
15+
directoryPath: v4
1616
promptTemplate: "{\"prompt\": \"<|startoftranscript|> <|en|> <|transcribe|> <|notimestamps|>\"}"
1717
contextLength: 448
1818
capabilities: ""
@@ -30,5 +30,5 @@ variantInfo:
3030
quantization: ['RTN']
3131
device: 'cpu'
3232
executionProvider: 'CPUExecutionProvider'
33-
fileSizeBytes: 236654475
34-
vRamFootprintBytes: 236654475
33+
fileSizeBytes: 138106077
34+
vRamFootprintBytes: 138106077

0 commit comments

Comments
 (0)