-
Notifications
You must be signed in to change notification settings - Fork 46
Expand file tree
/
Copy pathqwen2_5_ov_config.json
More file actions
29 lines (29 loc) · 1.04 KB
/
qwen2_5_ov_config.json
File metadata and controls
29 lines (29 loc) · 1.04 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
{
"input_model": { "type": "HfModel", "model_path": "Qwen/Qwen2.5-Coder-0.5B-Instruct" },
"systems": {
"local_system": {
"type": "LocalSystem",
"accelerators": [ { "device": "gpu", "execution_providers": [ "OpenVINOExecutionProvider" ] } ]
}
},
"passes": {
"optimum_convert": {
"type": "OpenVINOOptimumConversion",
"extra_args": { "device": "gpu", "task": "text-generation-with-past" },
"ov_quant_config": { "weight_format": "int4", "group_size": 128, "ratio": 0.8 }
},
"io_update": { "type": "OpenVINOIoUpdate", "static": false, "reuse_cache": true },
"encapsulation": {
"type": "OpenVINOEncapsulation",
"target_device": "gpu",
"keep_ov_dynamic_dims": true,
"ov_version": "2025.1",
"reuse_cache": true
}
},
"search_strategy": false,
"target": "local_system",
"cache_dir": "cache",
"evaluate_input_model": false,
"output_dir": "model/qwen2_5"
}