1- shim-version : v0.1.9 @sha256:410510c9e8e4c7489dd201fede302dee8455075ca28f4f0abbf84bded943b8f1
2- cvm-version : 0.4.1
1+ shim-version : v0.2.15 @sha256:5ca748b384b78b7e686b57ca66d9b3c552038ebab2ce60305004f76e573a8458
2+ cvm-version : 0.4.16
33cpus : 32
44memory : 524288
55gpus : full
6- vllm : false
76
87models :
98 - name : " qwen3-coder-480b"
10- repo : " Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8@d27784dcbed3a08de523dd74fadff2deb6fedc6b "
11- mpk : " bc59459fc1a03ec26049d01854bbb095313f30f4070138a02b33ee653f3bee28_482171310080_d5607439-fe26-5b91-a0c3-4e66642aaea6 "
9+ repo : " Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8@003f183a92fbe5b9a8325aaa8b2ae797c91dd90f "
10+ mpk : " 81993809d5510f60b216a144a27d4a2ca1df6b5ddaa6b7f0096a040bb5b1bf07_482171310080_b7089f0d-7aa8-508f-a7f2-10d8bf7001c8 "
1211
1312containers :
1413 - name : " qwen3-coder-480b"
@@ -17,26 +16,25 @@ containers:
1716 " --runtime" , "nvidia",
1817 " --gpus" , "all",
1918 " --ipc" , "host",
20- " vllm/vllm-openai:v0.10.0" ,
21- " --model" , "/tinfoil/mpk/mpk-bc59459fc1a03ec26049d01854bbb095313f30f4070138a02b33ee653f3bee28",
22- " --tensor-parallel-size" , "8",
23- " --gpu-memory-utilization" , "0.95",
19+ " vllm/vllm-openai:v0.12.0@sha256:6766ce0c459e24b76f3e9ba14ffc0442131ef4248c904efdcbf0d89e38be01fe" ,
20+ " --model" , "/tinfoil/mpk/mpk-81993809d5510f60b216a144a27d4a2ca1df6b5ddaa6b7f0096a040bb5b1bf07",
21+ " --enable-expert-parallel" ,
22+ " --data-parallel-size" , "8",
23+ " --max-model-len" , "131072",
2424 " --enable-auto-tool-choice" ,
2525 " --tool-call-parser" , "qwen3_coder",
26+ " --chat-template" , "examples/tool_chat_template_qwen3coder.jinja",
2627 " --served-model-name" , "qwen3-coder-480b",
2728 " --port" , "8001"
2829 ]
2930
3031shim :
3132 listen-port : 443
3233 upstream-port : 8001
33- publish-attestation : false
34+ publish-attestation : true
3435 tls-challenge : dns
3536 control-plane : https://api.tinfoil.sh
3637 paths :
3738 - /v1/chat/completions
3839 - /metrics
39- origins :
40- - https://tinfoil.sh
41- - https://chat.tinfoil.sh
42- - http://localhost:3000
40+ - /health
0 commit comments