-
Notifications
You must be signed in to change notification settings - Fork 541
Expand file tree
/
Copy pathconfig-profile.yaml
More file actions
44 lines (44 loc) · 1.1 KB
/
config-profile.yaml
File metadata and controls
44 lines (44 loc) · 1.1 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
---
# Deployment that runs a single replica of the `aibrix/vllm-mock` image under
# the model name "qwen3-8b", carrying a per-model routing-profile annotation.
apiVersion: apps/v1
kind: Deployment
metadata:
  name: mock-qwen3-8b
  labels:
    # Label values must be strings, so the port and the boolean flag stay
    # quoted; unquoted they would be parsed as an int and a bool.
    model.aibrix.ai/name: "qwen3-8b"
    model.aibrix.ai/port: "8000"
    adapter.model.aibrix.ai/enabled: "true"
spec:
  replicas: 1
  selector:
    # Every label listed here must also appear in template.metadata.labels
    # below, otherwise the API server rejects the Deployment.
    matchLabels:
      adapter.model.aibrix.ai/enabled: "true"
      model.aibrix.ai/name: "qwen3-8b"
      app: "mock-qwen3-8b"
  template:
    metadata:
      labels:
        adapter.model.aibrix.ai/enabled: "true"
        model.aibrix.ai/name: "qwen3-8b"
        app: "mock-qwen3-8b"
      annotations:
        # JSON document stored verbatim as the annotation value (literal
        # block scalar, newlines preserved). It names "least-request" as the
        # default profile and defines two profiles, each setting only a
        # routingStrategy.
        # NOTE(review): how the consumer interprets these fields is not
        # visible in this file - confirm against the AIBrix documentation.
        model.aibrix.ai/config: |
          {
            "defaultProfile": "least-request",
            "profiles": {
              "least-request": {
                "routingStrategy": "least-request"
              },
              "throughput": {
                "routingStrategy": "throughput"
              }
            }
          }
    spec:
      # This ServiceAccount is not defined in the visible part of this file;
      # it has to exist in the target namespace before the pod can start.
      serviceAccountName: mocked-app-sa
      containers:
        - name: llm-engine
          image: aibrix/vllm-mock:nightly
          # NOTE(review): no containerPort is declared; presumably app.py
          # listens on the port named in the model.aibrix.ai/port label
          # (8000) - confirm.
          command:
            - python3
            - app.py
            # NOTE(review): hard-coded key on the command line; looks like a
            # placeholder for the mock image - confirm, and source real keys
            # from a Secret instead.
            - --api_key
            - test-key-1234567890