-
Notifications
You must be signed in to change notification settings - Fork 120
Expand file tree
/
Copy pathvultr.json
More file actions
53 lines (53 loc) · 1.32 KB
/
vultr.json
File metadata and controls
53 lines (53 loc) · 1.32 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
{
  "name": "Vultr",
  "id": "vultr",
  "type": "openai-compat",
  "api_key": "$VULTR_API_KEY",
  "api_endpoint": "https://api.vultrinference.com/v1",
  "default_large_model_id": "kimi-k2-instruct",
  "default_small_model_id": "qwen2.5-32b-instruct",
  "models": [
    {
      "id": "kimi-k2-instruct",
      "name": "Kimi K2 Instruct",
      "cost_per_1m_in": 1,
      "cost_per_1m_out": 3,
      "context_window": 262144,
      "default_max_tokens": 8192,
      "can_reason": false
    },
    {
      "id": "llama-3.1-70b-instruct-fp8",
      "name": "Llama 3.1 70B Instruct FP8",
      "cost_per_1m_in": 0.35,
      "cost_per_1m_out": 0.35,
      "context_window": 131072,
      "default_max_tokens": 4096
    },
    {
      "id": "mistral-7b-v0.3",
      "name": "Mistral 7B v0.3",
      "cost_per_1m_in": 0.05,
      "cost_per_1m_out": 0.05,
      "context_window": 32768,
      "default_max_tokens": 4096
    },
    {
      "id": "deepseek-r1",
      "name": "DeepSeek R1",
      "cost_per_1m_in": 0.55,
      "cost_per_1m_out": 2.19,
      "context_window": 128000,
      "default_max_tokens": 4096,
      "can_reason": true
    },
    {
      "id": "qwen2.5-32b-instruct",
      "name": "Qwen 2.5 32B Instruct",
      "cost_per_1m_in": 0.14,
      "cost_per_1m_out": 0.42,
      "context_window": 32768,
      "default_max_tokens": 4096
    }
  ]
}