-
Notifications
You must be signed in to change notification settings - Fork 30
Expand file tree
/
Copy pathconfig.json
More file actions
201 lines (201 loc) · 6.51 KB
/
config.json
File metadata and controls
201 lines (201 loc) · 6.51 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
{
"demo": {
"components": [
{ "category": "llm-model", "component": "vllm" },
{ "category": "o11y", "component": "langfuse" },
{ "category": "gui-app", "component": "openwebui" },
{ "category": "vector-database", "component": "qdrant" },
{ "category": "embedding-model", "component": "tei" },
{ "category": "ai-gateway", "component": "litellm" }
],
"examples": [
{ "category": "mcp-server", "example": "calculator" },
{ "category": "strands-agents", "example": "calculator-agent" }
]
},
"llm-model": {
"vllm": {
"models": [
{ "name": "qwen3-30b-instruct-fp8", "deploy": true },
{ "name": "qwen3-30b-thinking-fp8", "deploy": false },
{ "name": "qwen3-32b-fp8", "deploy": true },
{ "name": "qwen3-next-80b-instruct", "deploy": false },
{ "name": "qwen3-next-80b-instruct-fp8", "deploy": false },
{ "name": "qwen3-next-80b-thinking", "deploy": false },
{ "name": "qwen3-next-80b-thinking-fp8", "deploy": false },
{ "name": "qwen3-coder-30b-fp8", "deploy": false },
{ "name": "qwen3-coder-480b-fp8", "deploy": false },
{ "name": "qwen3-omni-30b-instruct", "deploy": false },
{ "name": "qwen3-omni-30b-thinking", "deploy": false },
{ "name": "qwen3-omni-30b-captioner", "deploy": false },
{ "name": "gpt-oss-20b", "deploy": false },
{ "name": "gpt-oss-120b", "deploy": false },
{ "name": "deepseek-r1-qwen3-8b", "deploy": false },
{ "name": "gemma3-27b-gptq", "deploy": false },
{ "name": "magistral-24b-fp8", "deploy": false },
{ "name": "llama-4-scout-17b-16e-instruct-fp8", "deploy": false },
{ "name": "deepseek-r1-qwen3-8b-neuron", "deploy": false },
{ "name": "qwen3-8b-neuron", "deploy": false }
]
},
"sglang": {
"models": [
{ "name": "qwen3-30b-instruct-fp8", "deploy": true },
{ "name": "qwen3-30b-thinking-fp8", "deploy": false },
{ "name": "qwen3-32b-fp8", "deploy": true },
{ "name": "qwen3-coder-30b-fp8", "deploy": false },
{ "name": "qwen3-coder-480b-fp8", "deploy": false },
{ "name": "gpt-oss-20b", "deploy": false }
]
},
"tgi": {
"models": [
{ "name": "deepseek-r1-qwen3-8b", "deploy": false },
{ "name": "qwen3-8b", "deploy": false },
{ "name": "qwen3-8b-fp8", "deploy": false }
]
},
"ollama": {
"models": [
"qwen3:32b",
"qwen3:30b",
"gemma3:27b",
"deepseek-r1:8b",
"nomic-embed-text:v1.5"
]
}
},
"embedding-model": {
"tei": {
"models": [
{ "name": "qwen3-embedding-06b-bf16-cpu", "deploy": true },
{ "name": "qwen3-embedding-06b-bf16", "deploy": false },
{ "name": "qwen3-embedding-4b-bf16", "deploy": false },
{ "name": "qwen3-embedding-8b-bf16", "deploy": false }
]
}
},
"bedrock": {
"region": null,
"llm": {
"models": [
{ "name": "amazon-nova-premier", "model": "us.amazon.nova-premier-v1:0" },
{ "name": "amazon-nova-2-lite", "model": "global.amazon.nova-2-lite-v1:0" },
{ "name": "claude-opus-4.6", "model": "global.anthropic.claude-opus-4-6-20260214-v1:0" },
{ "name": "claude-4.5-opus", "model": "global.anthropic.claude-opus-4-5-20251101-v1:0" },
{ "name": "claude-4.5-sonnet", "model": "global.anthropic.claude-sonnet-4-5-20250929-v1:0" },
{ "name": "claude-4.5-haiku", "model": "global.anthropic.claude-haiku-4-5-20251001-v1:0" },
{ "name": "llama4-maverick", "model": "us.meta.llama4-maverick-17b-instruct-v1:0" },
{ "name": "llama4-scout", "model": "us.meta.llama4-scout-17b-instruct-v1:0" }
]
},
"embedding": { "models": [] }
},
"litellm": {
"enableBedrockGuardrail": false,
"enableGuardrailsAI": false
},
"ai-agent": {
"openclaw": {
"env": {
"LITELLM_MODEL_NAME": "bedrock/claude-4.5-sonnet",
"OPENCLAW_GATEWAY_TOKEN": "openclaw-gateway-token"
}
}
},
"examples": {
"agno": {
"calculator-agent": {
"env": {
"USE_BEDROCK": false,
"BEDROCK_MODEL": "us.anthropic.claude-3-7-sonnet-20250219-v1:0",
"LITELLM_MODEL_NAME": "vllm/qwen3-30b-instruct-fp8",
"USE_MCP_TOOLS": true
}
}
},
"strands-agents": {
"calculator-agent": {
"env": {
"USE_BEDROCK": false,
"BEDROCK_MODEL": "us.anthropic.claude-3-7-sonnet-20250219-v1:0",
"LITELLM_MODEL_NAME": "vllm/qwen3-30b-instruct-fp8",
"USE_MCP_TOOLS": true,
"USE_MCP_GATEWAY": true
}
}
},
"openclaw": {
"doc-writer": {
"env": {
"LITELLM_MODEL_NAME": "bedrock/claude-4.5-sonnet",
"OPENCLAW_GATEWAY_TOKEN": "openclaw-gateway-token"
}
},
"devops-agent": {
"env": {
"LITELLM_MODEL_NAME": "bedrock/claude-4.5-sonnet",
"OPENCLAW_GATEWAY_TOKEN": "openclaw-gateway-token"
}
}
}
},
"docker": {
"useBuildx": true,
"arch": "arm64"
},
"terraform": {
"vars": {
"efs_throughput_mode": "bursting",
"enable_ecr_pull_through_cache": false,
"dockerhub_username": "",
"dockerhub_access_token": "",
"github_username": "",
"github_token": ""
}
},
"platform": {
"monitoring": {
"grafanaAdminPassword": "admin",
"retention": "7d",
"enablePersistentStorage": false,
"prometheusStorageSize": "50Gi",
"alertmanagerEnabled": false
},
"type": "eks",
"eks": {
"storageClass": "efs",
"gpuNodeSelectorKey": "nvidia.com/gpu.present",
"gpuNodeSelectorValue": "true",
"gpuOperator": {
"driverEnabled": false,
"toolkitEnabled": false,
"devicePluginEnabled": false,
"gfdEnabled": true,
"dcgmExporterEnabled": true,
"gdsEnabled": true,
"nfdEnabled": false,
"migManagerEnabled": false,
"useAMP": false,
"ampWorkspaceId": ""
},
"dynamoPlatform": {
"releaseVersion": "0.9.1",
"namespace": "dynamo-system",
"groveEnabled": true,
"kaiSchedulerEnabled": true
}
},
"k8s": {
"storageClass": "nfs",
"gpuNodeSelectorKey": "nvidia.com/gpu.present",
"gpuNodeSelectorValue": "true",
"dynamoPlatform": {
"releaseVersion": "0.9.0-post1",
"namespace": "dynamo-system",
"groveEnabled": true,
"kaiSchedulerEnabled": true
}
}
}
}