forked from microsoft/olive-recipes
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy path phi_4_gpu_context_dy.json
More file actions
30 lines (30 loc) · 1.04 KB
/
phi_4_gpu_context_dy.json
File metadata and controls
30 lines (30 loc) · 1.04 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
{
  "input_model": {
    "type": "HfModel",
    "model_path": "microsoft/Phi-4"
  },
  "systems": {
    "local_system": {
      "type": "LocalSystem",
      "accelerators": [
        {
          "execution_providers": [
            "OpenVINOExecutionProvider"
          ]
        }
      ]
    }
  },
  "passes": {
    "optimum_convert": {
      "type": "OpenVINOOptimumConversion",
      "extra_args": {
        "device": "gpu",
        "task": "text-generation-with-past"
      },
      "ov_quant_config": {
        "weight_format": "int4",
        "group_size": 128,
        "ratio": 0.8
      }
    },
    "io_update": {
      "type": "OpenVINOIoUpdate",
      "static": false,
      "reuse_cache": true
    },
    "encapsulation": {
      "type": "OpenVINOEncapsulation",
      "target_device": "gpu",
      "keep_ov_dynamic_dims": true,
      "ov_version": "2025.2",
      "reuse_cache": true
    }
  },
  "search_strategy": false,
  "host": "local_system",
  "cache_dir": "cache",
  "clean_cache": true,
  "evaluate_input_model": false,
  "output_dir": "models/Phi_4_gpu_context_dy"
}