Skip to content

Commit 8f6448e

Browse files
committed
feat: update qwen3-coder configs
1 parent 6f58fc6 commit 8f6448e

File tree

2 files changed: +14 -16 lines changed

.github/workflows/build.yml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -16,7 +16,7 @@ jobs:
 16   16
 17   17        steps:
 18   18          - uses: actions/checkout@v4
 19       -       - uses: tinfoilsh/pri-build-action@v0.4.0
      19  +       - uses: tinfoilsh/pri-build-action@v0.5.5
 20   20            with:
 21   21              config-file: ${{ github.workspace }}/tinfoil-config.yml
 22       -           github-token: ${{ secrets.GITHUB_TOKEN }}
      22  +           github-token: ${{ secrets.GITHUB_TOKEN }}

tinfoil-config.yml

Lines changed: 12 additions & 14 deletions
Original file line number | Diff line number | Diff line change
@@ -1,14 +1,13 @@
  1       - shim-version: v0.1.9@sha256:410510c9e8e4c7489dd201fede302dee8455075ca28f4f0abbf84bded943b8f1
  2       - cvm-version: 0.4.1
       1  + shim-version: v0.2.15@sha256:5ca748b384b78b7e686b57ca66d9b3c552038ebab2ce60305004f76e573a8458
       2  + cvm-version: 0.4.16
  3    3    cpus: 32
  4    4    memory: 524288
  5    5    gpus: full
  6       - vllm: false
  7    6
  8    7    models:
  9    8      - name: "qwen3-coder-480b"
 10       -     repo: "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8@d27784dcbed3a08de523dd74fadff2deb6fedc6b"
 11       -     mpk: "bc59459fc1a03ec26049d01854bbb095313f30f4070138a02b33ee653f3bee28_482171310080_d5607439-fe26-5b91-a0c3-4e66642aaea6"
       9  +     repo: "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8@003f183a92fbe5b9a8325aaa8b2ae797c91dd90f"
      10  +     mpk: "81993809d5510f60b216a144a27d4a2ca1df6b5ddaa6b7f0096a040bb5b1bf07_482171310080_b7089f0d-7aa8-508f-a7f2-10d8bf7001c8"
 12   11
 13   12    containers:
 14   13      - name: "qwen3-coder-480b"
@@ -17,26 +16,25 @@ containers:
 17   16          "--runtime", "nvidia",
 18   17          "--gpus", "all",
 19   18          "--ipc", "host",
 20       -       "vllm/vllm-openai:v0.10.0",
 21       -       "--model", "/tinfoil/mpk/mpk-bc59459fc1a03ec26049d01854bbb095313f30f4070138a02b33ee653f3bee28",
 22       -       "--tensor-parallel-size", "8",
 23       -       "--gpu-memory-utilization", "0.95",
      19  +       "vllm/vllm-openai:v0.12.0@sha256:6766ce0c459e24b76f3e9ba14ffc0442131ef4248c904efdcbf0d89e38be01fe",
      20  +       "--model", "/tinfoil/mpk/mpk-81993809d5510f60b216a144a27d4a2ca1df6b5ddaa6b7f0096a040bb5b1bf07",
      21  +       "--enable-expert-parallel",
      22  +       "--data-parallel-size", "8",
      23  +       "--max-model-len", "131072",
 24   24          "--enable-auto-tool-choice",
 25   25          "--tool-call-parser", "qwen3_coder",
      26  +       "--chat-template", "examples/tool_chat_template_qwen3coder.jinja",
 26   27          "--served-model-name", "qwen3-coder-480b",
 27   28          "--port", "8001"
 28   29        ]
 29   30
 30   31    shim:
 31   32      listen-port: 443
 32   33      upstream-port: 8001
 33       -   publish-attestation: false
      34  +   publish-attestation: true
 34   35      tls-challenge: dns
 35   36      control-plane: https://api.tinfoil.sh
 36   37      paths:
 37   38        - /v1/chat/completions
 38   39        - /metrics
 39       -   origins:
 40       -     - https://tinfoil.sh
 41       -     - https://chat.tinfoil.sh
 42       -     - http://localhost:3000
      40  +     - /health

0 commit comments

Comments
 (0)