Skip to content

Commit 860e149

Browse files
authored
Merge branch 'main' into dev/vjatoth-qti/recipes-qnn-gpu
2 parents 7512632 + ee5e129 commit 860e149

12 files changed

Lines changed: 12 additions & 12 deletions

File tree

Qwen-Qwen2.5-1.5B-Instruct/QNN/config.json

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -75,7 +75,7 @@
75 | 75 |   "quant_preprocess": true,
76 | 76 |   "op_types_to_exclude": [ "GatherBlockQuantized", "GroupQueryAttention", "MatMulNBits" ],
77 | 77 |   "save_as_external_data": true,
78 |    | - "extra_option": { "CalibStridedMinMax": 4 }
   | 78 | + "extra_options": { "CalibStridedMinMax": 4 }
79 | 79 |   },
80 | 80 |   "sp": { "type": "SplitModel" },
81 | 81 |   "st": { "type": "StaticLLM", "batch_size": 1, "context_length": 64 },

Qwen-Qwen2.5-1.5B-Instruct/aitk/qwen2_5_qnn_config.json

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -113,7 +113,7 @@
113 | 113 |   "MatMulNBits"
114 | 114 |   ],
115 | 115 |   "save_as_external_data": true,
116 |     | - "extra_option": {
    | 116 | + "extra_options": {
117 | 117 |   "CalibStridedMinMax": 4
118 | 118 |   }
119 | 119 |   },

Qwen-Qwen2.5-7B-Instruct/QNN/config.json

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -75,7 +75,7 @@
75 | 75 |   "quant_preprocess": true,
76 | 76 |   "op_types_to_exclude": [ "GatherBlockQuantized", "GroupQueryAttention", "MatMulNBits" ],
77 | 77 |   "save_as_external_data": true,
78 |    | - "extra_option": { "CalibStridedMinMax": 4 }
   | 78 | + "extra_options": { "CalibStridedMinMax": 4 }
79 | 79 |   },
80 | 80 |   "sp": { "type": "SplitModel" },
81 | 81 |   "st": { "type": "StaticLLM", "batch_size": 1, "context_length": 64 },

deepseek-ai-DeepSeek-R1-Distill-Qwen-1.5B/aitk/deepseek_qnn_config.json

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -113,7 +113,7 @@
113 | 113 |   "MatMulNBits"
114 | 114 |   ],
115 | 115 |   "save_as_external_data": true,
116 |     | - "extra_option": {
    | 116 | + "extra_options": {
117 | 117 |   "CalibStridedMinMax": 4
118 | 118 |   }
119 | 119 |   },

meta-llama-Llama-3.1-8B-Instruct/QNN/config.json

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -75,7 +75,7 @@
75 | 75 |   "quant_preprocess": true,
76 | 76 |   "op_types_to_exclude": [ "GatherBlockQuantized", "GroupQueryAttention", "MatMulNBits" ],
77 | 77 |   "save_as_external_data": true,
78 |    | - "extra_option": { "CalibStridedMinMax": 4 }
   | 78 | + "extra_options": { "CalibStridedMinMax": 4 }
79 | 79 |   },
80 | 80 |   "sp": { "type": "SplitModel" },
81 | 81 |   "st": { "type": "StaticLLM", "batch_size": 1, "context_length": 64 },

meta-llama-Llama-3.1-8B-Instruct/aitk/llama3_1_qnn_config.json

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -113,7 +113,7 @@
113 | 113 |   "MatMulNBits"
114 | 114 |   ],
115 | 115 |   "save_as_external_data": true,
116 |     | - "extra_option": {
    | 116 | + "extra_options": {
117 | 117 |   "CalibStridedMinMax": 4
118 | 118 |   }
119 | 119 |   },

meta-llama-Llama-3.2-1B-Instruct/aitk/llama3_2_qnn_config.json

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -113,7 +113,7 @@
113 | 113 |   "MatMulNBits"
114 | 114 |   ],
115 | 115 |   "save_as_external_data": true,
116 |     | - "extra_option": {
    | 116 | + "extra_options": {
117 | 117 |   "CalibStridedMinMax": 4
118 | 118 |   }
119 | 119 |   },

microsoft-Phi-3-mini-128k-instruct/QNN/config.json

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -75,7 +75,7 @@
75 | 75 |   "quant_preprocess": true,
76 | 76 |   "op_types_to_exclude": [ "GatherBlockQuantized", "GroupQueryAttention", "MatMulNBits" ],
77 | 77 |   "save_as_external_data": true,
78 |    | - "extra_option": { "CalibStridedMinMax": 4 }
   | 78 | + "extra_options": { "CalibStridedMinMax": 4 }
79 | 79 |   },
80 | 80 |   "sp": { "type": "SplitModel" },
81 | 81 |   "st": { "type": "StaticLLM", "batch_size": 1, "context_length": 64 },

microsoft-Phi-3-mini-4k-instruct/QNN/config.json

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -75,7 +75,7 @@
75 | 75 |   "quant_preprocess": true,
76 | 76 |   "op_types_to_exclude": [ "GatherBlockQuantized", "GroupQueryAttention", "MatMulNBits" ],
77 | 77 |   "save_as_external_data": true,
78 |    | - "extra_option": { "CalibStridedMinMax": 4 }
   | 78 | + "extra_options": { "CalibStridedMinMax": 4 }
79 | 79 |   },
80 | 80 |   "sp": { "type": "SplitModel" },
81 | 81 |   "st": { "type": "StaticLLM", "batch_size": 1, "context_length": 64 },

microsoft-Phi-3.5-mini-instruct/QNN/config.json

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -73,7 +73,7 @@
73 | 73 |   "quant_preprocess": true,
74 | 74 |   "op_types_to_exclude": [ "GatherBlockQuantized", "GroupQueryAttention", "MatMulNBits" ],
75 | 75 |   "save_as_external_data": true,
76 |    | - "extra_option": { "CalibStridedMinMax": 4 }
   | 76 | + "extra_options": { "CalibStridedMinMax": 4 }
77 | 77 |   },
78 | 78 |   "sp": { "type": "SplitModel" },
79 | 79 |   "st": { "type": "StaticLLM", "batch_size": 1, "context_length": 64 },

0 commit comments

Comments (0)