-
Notifications
You must be signed in to change notification settings - Fork 53
Expand file tree
/
Copy pathdeepseek_ov_config.json.config
More file actions
91 lines (91 loc) · 2.57 KB
/
Copy pathdeepseek_ov_config.json.config
File metadata and controls
91 lines (91 loc) · 2.57 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
{
"$schema": "https://github.com/microsoft/olive-recipes/raw/refs/heads/main/.aitk/configs/config_schema.json",
"name": "Convert to Intel GPU/CPU",
"isLLM": true,
"isIntel": true,
"intelRuntimeValues": [
"gpu",
"cpu"
],
"debugInfo": {
"autoGenerated": true,
"useOpenVINOOptimumConversion": "optimum_convert"
},
"runtime": {
"autoGenerated": true,
"name": "Evaluate on",
"type": "enum",
"displayNames": [
"Intel CPU",
"Intel GPU"
],
"path": "systems.local_system.accelerators.0.device",
"values": [
"cpu",
"gpu"
],
"readOnly": false
},
"optimizationPaths": [
{
"path": "passes.optimum_convert.ov_quant_config.weight_format"
}
],
"optimizationDefault": "int4",
"sections": [
{
"autoGenerated": true,
"name": "Convert",
"phase": "Conversion",
"parameters": [],
"toggle": {
"autoGenerated": true,
"name": "Convert to ONNX format",
"type": "bool",
"path": "passes.optimum_convert",
"actions": [
[],
[]
],
"readOnly": true
}
},
{
"autoGenerated": true,
"name": "Quantize",
"phase": "Quantization",
"parameters": [
{
"autoGenerated": true,
"name": "Quantization Dataset",
"tags": [
"QuantizationDataset"
],
"type": "enum",
"path": "passes.optimum_convert.ov_quant_config.dataset",
"values": [
"wikitext2"
],
"template": {
"path": "passes.optimum_convert.ov_quant_config.dataset",
"values": [
"wikitext2"
],
"template": "QuantizationDataset"
}
}
],
"toggle": {
"autoGenerated": true,
"name": "Quantize model",
"type": "bool",
"path": "passes.optimum_convert",
"actions": [
[],
[]
],
"readOnly": true
}
}
]
}