File tree Expand file tree Collapse file tree
Expand file tree Collapse file tree Original file line number Diff line number Diff line change 3737 env :
3838 OPENAI_KEY : ${{ env.SDSC_VLLM_TOKEN }}
3939 GITHUB_TOKEN : ${{ secrets.GITHUB_TOKEN }}
40- config__model : "openai/Qwen/Qwen3-Coder-30B-A3B-Instruct-FP8"
41- config__fallback_models : '["openai/Qwen/Qwen3-Coder-30B-A3B-Instruct-FP8"]'
42- config__custom_model_max_tokens : "32000"
40+ config__model : "openai/cyankiwi/Qwen3-Coder-30B-A3B-Instruct-AWQ-Int4"
41+ config__fallback_models : '["openai/cyankiwi/Qwen3-Coder-30B-A3B-Instruct-AWQ-Int4"]'
42+ config__custom_model_max_tokens : "192000"
4343 config__ai_timeout : "1800"
4444 openai__extra_body : '{"chat_template_kwargs":{"enable_thinking":false}}'
4545 OPENAI__API_BASE : "https://vllm-gateway-runai-sharedllm-ralf.inference.compute.datascience.ch/v1"
5555 # env:
5656 # # --- LLM configuration ---
5757 # LLM__PROVIDER: "OPENAI"
58- # LLM__META__MODEL: "Qwen/Qwen3-Coder-30B-A3B-Instruct-FP8"
59- # LLM__META__MAX_TOKENS: "16000"
58+ # LLM__META__MODEL: "cyankiwi/Qwen3-Coder-30B-A3B-Instruct-AWQ-Int4"
59+ # LLM__META__MAX_TOKENS: "192000"
6060 # LLM__HTTP_CLIENT__API_URL: "https://vllm-gateway-runai-sharedllm-ralf.inference.compute.datascience.ch/v1"
6161 # LLM__HTTP_CLIENT__API_TOKEN: ${{ env.SDSC_VLLM_TOKEN }}
6262
You can’t perform that action at this time.
0 commit comments