Skip to content

Commit 3b4007a

Browse files
committed
up
1 parent be9ecb1 commit 3b4007a

2 files changed

Lines changed: 109 additions & 24 deletions

File tree

my-apps/ai/llama-cpp/configmap.yaml

Lines changed: 91 additions & 23 deletions
Original file line numberDiff line numberDiff line change
@@ -5,6 +5,11 @@ metadata:
55
namespace: llama-cpp
66
data:
77
config.yaml: |
8+
# Global settings
9+
healthCheckTimeout: 1200
10+
logLevel: info
11+
startPort: 5800
12+
813
models:
914
kimi-k2-thinking-128k:
1015
cmd: >-
@@ -14,24 +19,27 @@ data:
1419
-b 4096
1520
-ub 4096
1621
-ngl 99
17-
-ot .ffn_(up)_exps.=CPU
22+
-ot ".ffn_(up)_exps.=CPU"
1823
--host 0.0.0.0
1924
--port ${PORT}
2025
--threads 52
2126
--threads-batch 28
22-
--flash-attn on
27+
-fa
2328
--cache-type-k q8_0
2429
--cache-type-v q8_0
2530
--parallel 2
2631
--special
2732
--no-warmup
28-
--temp 1.0
29-
--min-p 0.01
3033
--jinja
3134
--mlock
32-
gpu_mode: dual
33-
health_check_path: /health
34-
timeout: 1200s
35+
env:
36+
- "CUDA_VISIBLE_DEVICES=0,1"
37+
checkEndpoint: /health
38+
ttl: 0
39+
aliases:
40+
- "kimi-k2"
41+
- "kimi"
42+
3543
gpt-oss-20b-128k:
3644
cmd: >-
3745
/app/llama-server
@@ -44,19 +52,21 @@ data:
4452
--port ${PORT}
4553
--threads 48
4654
--threads-batch 24
47-
--flash-attn on
55+
-fa
4856
--cache-type-k q8_0
4957
--cache-type-v q8_0
5058
--parallel 2
5159
--special
5260
--no-warmup
53-
--temp 0.7
54-
--min-p 0.05
5561
--jinja
5662
--mlock
57-
gpu_mode: dual
58-
health_check_path: /health
59-
timeout: 720s
63+
env:
64+
- "CUDA_VISIBLE_DEVICES=0,1"
65+
checkEndpoint: /health
66+
ttl: 0
67+
aliases:
68+
- "gpt-oss"
69+
6070
qwen3-thinking-128k:
6171
cmd: >-
6272
/app/llama-server
@@ -69,20 +79,78 @@ data:
6979
--port ${PORT}
7080
--threads 48
7181
--threads-batch 24
72-
--flash-attn on
82+
-fa
7383
--cache-type-k q8_0
7484
--cache-type-v q8_0
7585
--parallel 2
7686
--special
7787
--no-warmup
78-
--temp 0.6
79-
--min-p 0.05
8088
--jinja
8189
--mlock
82-
gpu_mode: dual
83-
health_check_path: /health
84-
timeout: 720s
85-
default_model: kimi-k2-thinking-128k
86-
health_check_interval: 60s
87-
swap_timeout: 600s
88-
cleanup_timeout: 120s
90+
env:
91+
- "CUDA_VISIBLE_DEVICES=0,1"
92+
checkEndpoint: /health
93+
ttl: 0
94+
aliases:
95+
- "qwen3-thinking"
96+
- "qwen3"
97+
98+
qwen3-coder-q8:
99+
cmd: >-
100+
/app/llama-server
101+
-m /models/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL.gguf
102+
-c 65536
103+
-b 4096
104+
-ub 4096
105+
-ngl 99
106+
--host 0.0.0.0
107+
--port ${PORT}
108+
--threads 48
109+
--threads-batch 24
110+
-fa
111+
--cache-type-k q8_0
112+
--cache-type-v q8_0
113+
--parallel 2
114+
--special
115+
--no-warmup
116+
--jinja
117+
--mlock
118+
env:
119+
- "CUDA_VISIBLE_DEVICES=0,1"
120+
checkEndpoint: /health
121+
ttl: 0
122+
aliases:
123+
- "qwen3-coder"
124+
- "coder"
125+
126+
magistral-small:
127+
cmd: >-
128+
/app/llama-server
129+
-m /models/Magistral-Small-2509-UD-Q8_K_XL.gguf
130+
-c 65536
131+
-b 4096
132+
-ub 4096
133+
-ngl 99
134+
--host 0.0.0.0
135+
--port ${PORT}
136+
--threads 48
137+
--threads-batch 24
138+
-fa
139+
--cache-type-k q8_0
140+
--cache-type-v q8_0
141+
--parallel 2
142+
--special
143+
--no-warmup
144+
--jinja
145+
--mlock
146+
env:
147+
- "CUDA_VISIBLE_DEVICES=0,1"
148+
checkEndpoint: /health
149+
ttl: 0
150+
aliases:
151+
- "magistral"
152+
153+
hooks:
154+
on_startup:
155+
preload:
156+
- "kimi-k2-thinking-128k"

my-apps/home/frigate/config.yml

Lines changed: 18 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -40,8 +40,25 @@ ffmpeg:
4040
# Re-adding go2rtc with Nest cameras via Home Assistant API
4141
# Using the correct echo:curl syntax from the official documentation
4242
go2rtc:
43+
# Nest configuration for direct access (lower latency)
44+
# Device IDs can be found in the go2rtc dashboard after restart
45+
nest:
46+
client_id: "${NEST_CLIENT_ID}"
47+
client_secret: "${NEST_CLIENT_SECRET}"
48+
project_id: "${NEST_PROJECT_ID}"
49+
refresh_token: "${NEST_REFRESH_TOKEN}"
50+
4351
streams:
44-
# Nest cameras via Home Assistant (using HA's Nest integration)
52+
# --- Direct Nest Streams (Recommended) ---
53+
# Uncomment and replace <DEVICE_ID> with the ID from the go2rtc dashboard
54+
# backyard-nest: "nest:<DEVICE_ID>"
55+
# garage-inside-nest: "nest:<DEVICE_ID>"
56+
# garage-outside-nest: "nest:<DEVICE_ID>"
57+
# front-porch-nest: "nest:<DEVICE_ID>"
58+
# living-room-nest: "nest:<DEVICE_ID>"
59+
# kitchen-nest: "nest:<DEVICE_ID>"
60+
61+
# --- Fallback: Nest cameras via Home Assistant Proxy ---
4562
backyard-nest:
4663
- "ffmpeg:http://home-assistant.home-assistant.svc.cluster.local:8123/api/camera_proxy_stream/camera.backyard_camera#video=copy#audio=copy#http_headers=Authorization: Bearer ${HA_TOKEN}"
4764
garage-inside-nest:

0 commit comments

Comments
 (0)