ci: add vllm action and integration to image test

nathan-weinberg · derekhiggins · nathan-weinberg · commit d807db07a3e1 · 2025-09-04T11:25:13.000-04:00
Co-authored-by: Derek Higgins <derekh@redhat.com>
Signed-off-by: Nathan Weinberg <nweinber@redhat.com>
diff --git a/.github/actions/setup-vllm/action.yml b/.github/actions/setup-vllm/action.yml
@@ -0,0 +1,27 @@
+name: Setup VLLM
+description: Start a VLLM container and wait for its health endpoint to respond
+runs:
+  using: "composite"
+  steps:
+    - name: Start VLLM
+      shell: bash
+      run: |
+        # Start vllm container (detached, named "vllm", port 8000 published on the host)
+        docker run -d \
+          --name vllm \
+          -p 8000:8000 \
+          --privileged=true \
+          quay.io/higginsd/vllm-cpu:65393ee064 \
+          --host 0.0.0.0 \
+          --port 8000 \
+          --enable-auto-tool-choice \
+          --tool-call-parser llama3_json \
+          --model /root/.cache/Llama-3.2-1B-Instruct \
+          --served-model-name meta-llama/Llama-3.2-1B-Instruct
+
+        # Poll /health (900s limit); if it never succeeds, show container logs and fail
+        echo "Waiting for vllm to be ready..."
+        timeout 900 bash -c 'until curl -f http://localhost:8000/health; do
+          echo "Waiting for vllm..."
+          sleep 5
+        done' || { rc=$?; docker logs vllm || true; exit "$rc"; }
diff --git a/.github/workflows/redhat-distro-container.yml b/.github/workflows/redhat-distro-container.yml
@@ -50,14 +50,18 @@ jobs:
           cache-from: type=gha
           cache-to: type=gha,mode=max
 
+      - name: Setup vllm for image test
+        id: vllm
+        uses: ./.github/actions/setup-vllm  # local composite action: starts the vllm container, waits on /health
+
       - name: Test image
         id: test
         run: |
           set -euo pipefail
           # Start llama stack
           CID="$(docker run -d --pull=never \
             -p 8321:8321 \
-            --env INFERENCE_MODEL=dummy \
+            --env INFERENCE_MODEL=meta-llama/Llama-3.2-1B-Instruct \
             --name llama-stack \
             ${{ env.IMAGE_NAME }}:${{ github.sha }})"
           trap 'docker rm -f "$CID" >/dev/null 2>&1 || true' EXIT