File tree Expand file tree Collapse file tree
Expand file tree Collapse file tree Original file line number Diff line number Diff line change @@ -5,6 +5,11 @@ metadata:
55 namespace : llama-cpp
66data :
77 config.yaml : |
8+ # Global settings
9+ healthCheckTimeout: 1200
10+ logLevel: info
11+ startPort: 5800
12+
813 models:
914 kimi-k2-thinking-128k:
1015 cmd: >-
@@ -14,24 +19,27 @@ data:
1419 -b 4096
1520 -ub 4096
1621 -ngl 99
17- -ot .ffn_(up)_exps.=CPU
22+ -ot " .ffn_(up)_exps.=CPU"
1823 --host 0.0.0.0
1924 --port ${PORT}
2025 --threads 52
2126 --threads-batch 28
22- --flash-attn on
27+ -fa
2328 --cache-type-k q8_0
2429 --cache-type-v q8_0
2530 --parallel 2
2631 --special
2732 --no-warmup
28- --temp 1.0
29- --min-p 0.01
3033 --jinja
3134 --mlock
32- gpu_mode: dual
33- health_check_path: /health
34- timeout: 1200s
35+ env:
36+ - "CUDA_VISIBLE_DEVICES=0,1"
37+ checkEndpoint: /health
38+ ttl: 0
39+ aliases:
40+ - "kimi-k2"
41+ - "kimi"
42+
3543 gpt-oss-20b-128k:
3644 cmd: >-
3745 /app/llama-server
@@ -44,19 +52,21 @@ data:
4452 --port ${PORT}
4553 --threads 48
4654 --threads-batch 24
47- --flash-attn on
55+ -fa
4856 --cache-type-k q8_0
4957 --cache-type-v q8_0
5058 --parallel 2
5159 --special
5260 --no-warmup
53- --temp 0.7
54- --min-p 0.05
5561 --jinja
5662 --mlock
57- gpu_mode: dual
58- health_check_path: /health
59- timeout: 720s
63+ env:
64+ - "CUDA_VISIBLE_DEVICES=0,1"
65+ checkEndpoint: /health
66+ ttl: 0
67+ aliases:
68+ - "gpt-oss"
69+
6070 qwen3-thinking-128k:
6171 cmd: >-
6272 /app/llama-server
@@ -69,20 +79,78 @@ data:
6979 --port ${PORT}
7080 --threads 48
7181 --threads-batch 24
72- --flash-attn on
82+ -fa
7383 --cache-type-k q8_0
7484 --cache-type-v q8_0
7585 --parallel 2
7686 --special
7787 --no-warmup
78- --temp 0.6
79- --min-p 0.05
8088 --jinja
8189 --mlock
82- gpu_mode: dual
83- health_check_path: /health
84- timeout: 720s
85- default_model: kimi-k2-thinking-128k
86- health_check_interval: 60s
87- swap_timeout: 600s
88- cleanup_timeout: 120s
90+ env:
91+ - "CUDA_VISIBLE_DEVICES=0,1"
92+ checkEndpoint: /health
93+ ttl: 0
94+ aliases:
95+ - "qwen3-thinking"
96+ - "qwen3"
97+
98+ qwen3-coder-q8:
99+ cmd: >-
100+ /app/llama-server
101+ -m /models/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL.gguf
102+ -c 65536
103+ -b 4096
104+ -ub 4096
105+ -ngl 99
106+ --host 0.0.0.0
107+ --port ${PORT}
108+ --threads 48
109+ --threads-batch 24
110+ -fa
111+ --cache-type-k q8_0
112+ --cache-type-v q8_0
113+ --parallel 2
114+ --special
115+ --no-warmup
116+ --jinja
117+ --mlock
118+ env:
119+ - "CUDA_VISIBLE_DEVICES=0,1"
120+ checkEndpoint: /health
121+ ttl: 0
122+ aliases:
123+ - "qwen3-coder"
124+ - "coder"
125+
126+ magistral-small:
127+ cmd: >-
128+ /app/llama-server
129+ -m /models/Magistral-Small-2509-UD-Q8_K_XL.gguf
130+ -c 65536
131+ -b 4096
132+ -ub 4096
133+ -ngl 99
134+ --host 0.0.0.0
135+ --port ${PORT}
136+ --threads 48
137+ --threads-batch 24
138+ -fa
139+ --cache-type-k q8_0
140+ --cache-type-v q8_0
141+ --parallel 2
142+ --special
143+ --no-warmup
144+ --jinja
145+ --mlock
146+ env:
147+ - "CUDA_VISIBLE_DEVICES=0,1"
148+ checkEndpoint: /health
149+ ttl: 0
150+ aliases:
151+ - "magistral"
152+
153+ hooks:
154+ on_startup:
155+ preload:
156+ - "kimi-k2-thinking-128k"
Original file line number Diff line number Diff line change @@ -40,8 +40,25 @@ ffmpeg:
4040# Re-adding go2rtc with Nest cameras via Home Assistant API
4141# Using the correct echo:curl syntax from official documentation
4242go2rtc :
43+ # Nest configuration for direct access (lower latency)
44+ # Device IDs can be found in the go2rtc dashboard after restart
45+ nest :
46+ client_id : " ${NEST_CLIENT_ID}"
47+ client_secret : " ${NEST_CLIENT_SECRET}"
48+ project_id : " ${NEST_PROJECT_ID}"
49+ refresh_token : " ${NEST_REFRESH_TOKEN}"
50+
4351 streams :
44- # Nest cameras via Home Assistant (using HA's Nest integration)
52+ # --- Direct Nest Streams (Recommended) ---
53+ # Uncomment and replace <DEVICE_ID> with the ID from go2rtc dashboard
54+ # backyard-nest: "nest:<DEVICE_ID>"
55+ # garage-inside-nest: "nest:<DEVICE_ID>"
56+ # garage-outside-nest: "nest:<DEVICE_ID>"
57+ # front-porch-nest: "nest:<DEVICE_ID>"
58+ # living-room-nest: "nest:<DEVICE_ID>"
59+ # kitchen-nest: "nest:<DEVICE_ID>"
60+
61+ # --- Fallback: Nest cameras via Home Assistant Proxy ---
4562 backyard-nest :
4663 - " ffmpeg:http://home-assistant.home-assistant.svc.cluster.local:8123/api/camera_proxy_stream/camera.backyard_camera#video=copy#audio=copy#http_headers=Authorization: Bearer ${HA_TOKEN}"
4764 garage-inside-nest :
You can’t perform that action at this time.
0 commit comments