forked from opendatahub-io/opendatahub-tests
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathopt125m_cpu.py
More file actions
27 lines (27 loc) · 977 Bytes
/
opt125m_cpu.py
File metadata and controls
27 lines (27 loc) · 977 Bytes
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
# Inference query configuration for the OPT-125M CPU model.
#
# Top-level layout:
#   * "default_query_model" - the prompt to send and the pattern the reply is
#     compared against.
#   * "chat_completions" / "completions" - one entry per inference type, each
#     keyed by protocol ("http") and describing how to build the request.
#
# "$model_name" and "$query_input" inside the body templates are placeholders.
# NOTE(review): presumably substituted by the consumer of this config
# (string.Template-style "$name" syntax) - confirm against the caller.
OPT125M_CPU_INFERENCE_CONFIG = {
    "default_query_model": {
        "query_input": "What is the boiling point of water?",
        # ".*" places no constraint on the text of the reply.
        "query_output": r".*",
        "use_regex": True,
    },
    "chat_completions": {
        "http": {
            "endpoint": "v1/chat/completions",
            "header": "Content-Type:application/json",
            # Adjacent literals are concatenated at compile time, so this is
            # still a single-line JSON template at runtime.
            "body": (
                '{"model": "$model_name", '
                '"messages": [{"role": "user", "content": "$query_input"}], '
                '"max_tokens": 50, "temperature": 0.0, "stream": false}'
            ),
            "response_fields_map": {
                "response_output": "output",
            },
        },
    },
    "completions": {
        "http": {
            "endpoint": "v1/completions",
            "header": "Content-Type:application/json",
            # Same single-line JSON template technique as the chat body.
            "body": (
                '{"model": "$model_name", "prompt": "$query_input", '
                '"max_tokens": 50, "temperature": 0.0}'
            ),
            "response_fields_map": {
                "response_output": "output",
            },
        },
    },
}