feature: add qwen3 series to PR CI (#458)

rebel-seinpark · web-flow · commit 8b32dabf8c4c · 2026-03-16T18:43:27.000+09:00
diff --git a/.github/workflows/rbln_optimum_ci.yaml b/.github/workflows/rbln_optimum_ci.yaml
@@ -115,6 +115,19 @@ jobs:
             else
               uv pip install --system --force-reinstall --no-cache-dir dist/vllm_rbln*.whl --index-url http://pypi-cache.devpi.svc.cluster.local/root/pypi/+simple/ --extra-index-url https://wheels.vllm.ai/0.13.0/cpu --extra-index-url https://download.pytorch.org/whl/cpu --index-strategy unsafe-best-match
             fi
+      
+      - name: Run Qwen3-embedding (V1)  # embedding example; prompt count is 2x env.NUM_INPUT_PROMPT
+        run: >
+          python3 examples/optimum/run_qwen3_embedding.py
+          --num_input_prompt $((2 * ${{ env.NUM_INPUT_PROMPT }}))
+          --model_id ${{ env.REBEL_VLLM_PRE_COMPILED_DIR }}/qwen3-embedding-0_6b-32k_kv4k_batch1
+
+      - name: Run Qwen3-reranker (V1)  # reranker example; prompt count is 2x env.NUM_INPUT_PROMPT
+        run: >
+          python3 examples/optimum/run_qwen3_reranker.py
+          --max_seq_len 32768
+          --num_input_prompt $((2 * ${{ env.NUM_INPUT_PROMPT }}))
+          --model_id ${{ env.REBEL_VLLM_PRE_COMPILED_DIR }}/qwen3-reranker-0_6b-40k_kv4k_batch2
 
       - name: Run gemma2 model (hybrid attention) (V1)
         run: >