Skip to content

Commit 8b32dab

Browse files
feature: add qwen3 series to PR CI (#458)
1 parent d381f5f commit 8b32dab

1 file changed

Lines changed: 13 additions & 0 deletions

File tree

.github/workflows/rbln_optimum_ci.yaml

Lines changed: 13 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -115,6 +115,19 @@ jobs:
115115
else
116116
uv pip install --system --force-reinstall --no-cache-dir dist/vllm_rbln*.whl --index-url http://pypi-cache.devpi.svc.cluster.local/root/pypi/+simple/ --extra-index-url https://wheels.vllm.ai/0.13.0/cpu --extra-index-url https://download.pytorch.org/whl/cpu --index-strategy unsafe-best-match
117117
fi
118+
119+
# CI step: runs the Qwen3 embedding example script with twice
# NUM_INPUT_PROMPT input prompts against the
# qwen3-embedding-0_6b-32k_kv4k_batch1 directory under
# REBEL_VLLM_PRE_COMPILED_DIR.
# The folded scalar (`>`) joins the lines below into one shell command,
# so no comments may be placed inside the `run` body.
- name: Run Qwen3-embedding (V1)
  run: >
    python3 examples/optimum/run_qwen3_embedding.py
    --num_input_prompt $((2 * ${{ env.NUM_INPUT_PROMPT }}))
    --model_id ${{ env.REBEL_VLLM_PRE_COMPILED_DIR }}/qwen3-embedding-0_6b-32k_kv4k_batch1
124+
125+
# CI step: runs the Qwen3 reranker example script with a maximum sequence
# length of 32768 and twice NUM_INPUT_PROMPT input prompts against the
# qwen3-reranker-0_6b-40k_kv4k_batch2 directory under
# REBEL_VLLM_PRE_COMPILED_DIR.
# The folded scalar (`>`) joins the lines below into one shell command,
# so no comments may be placed inside the `run` body.
- name: Run Qwen3-reranker (V1)
  run: >
    python3 examples/optimum/run_qwen3_reranker.py
    --max_seq_len 32768
    --num_input_prompt $((2 * ${{ env.NUM_INPUT_PROMPT }}))
    --model_id ${{ env.REBEL_VLLM_PRE_COMPILED_DIR }}/qwen3-reranker-0_6b-40k_kv4k_batch2
118131
119132
- name: Run gemma2 model (hybrid attention) (V1)
120133
run: >

0 commit comments

Comments
 (0)