Skip to content

feat(llmisvc): add Intel Gaudi accelerator LLMInferenceServiceConfig … #1

feat(llmisvc): add Intel Gaudi accelerator LLMInferenceServiceConfig …

feat(llmisvc): add Intel Gaudi accelerator LLMInferenceServiceConfig … #1

name: Predictive Server Docker Publisher
on:
push:
# Publish `master` as Docker `latest` image.
branches:
- master
# Publish `v1.2.3` tags as releases.
tags:
- v*
# Run tests for any PRs.
pull_request:
paths:
- "python/**"
- "!.github/**"
- "!docs/**"
- "!**.md"
- ".github/workflows/predictiveserver-docker-publish.yml"
- ".github/actions/free-up-disk-space/**"
# To save some compute time, rely on PR check and don't run for merge queues
# merge_group:
# types: [ checks_requested ]
env:
IMAGE_NAME: predictiveserver
concurrency:
group: ${{ github.workflow }}-${{ github.ref }}
cancel-in-progress: true
jobs:
# Run tests.
# See also https://docs.docker.com/docker-hub/builds/automated-testing/
test:
runs-on: ubuntu-latest
steps:
- name: Checkout source
uses: actions/checkout@v4
- name: Merge target branch
if: github.event_name == 'pull_request'
run: |
git fetch --unshallow origin
git fetch origin ${{ github.event.pull_request.base.ref }}
git config user.email "ci@kserve.io"
git config user.name "CI Bot"
git merge --no-edit origin/${{ github.event.pull_request.base.ref }}
- name: Free-up disk space
uses: ./.github/actions/free-up-disk-space
- name: Setup QEMU
uses: docker/setup-qemu-action@v3
with:
cache-image: true
- name: Setup Docker Buildx
uses: docker/setup-buildx-action@v3
with:
cache-binary: true
- name: Run tests
uses: docker/build-push-action@v6
with:
platforms: linux/amd64,linux/arm64/v8
context: python
file: python/predictiveserver.Dockerfile
push: false
# https://github.com/docker/buildx/issues/1533
provenance: false
# Push image to GitHub Packages.
# See also https://docs.docker.com/docker-hub/builds/
push:
# Ensure test job passes before pushing image.
needs: test
runs-on: ubuntu-latest
if: github.event_name == 'push'
steps:
- name: Checkout source
uses: actions/checkout@v4
- name: Free-up disk space
uses: ./.github/actions/free-up-disk-space
- name: Setup QEMU
uses: docker/setup-qemu-action@v3
with:
cache-image: true
- name: Setup Docker Buildx
uses: docker/setup-buildx-action@v3
with:
cache-binary: true
- name: Login to DockerHub
uses: docker/login-action@v3
with:
username: ${{ secrets.DOCKER_USER }}
password: ${{ secrets.DOCKER_PASSWORD }}
- name: Export version variable
run: |
IMAGE_ID=kserve/$IMAGE_NAME
# Change all uppercase to lowercase
IMAGE_ID=$(echo $IMAGE_ID | tr '[A-Z]' '[a-z]')
# Strip git ref prefix from version
VERSION=$(echo "${{ github.ref }}" | sed -e 's,.*/\(.*\),\1,')
# Strip "v" prefix from tag name
# [[ "${{ github.ref }}" == "refs/tags/"* ]] && VERSION=$(echo $VERSION | sed -e 's/^v//')
# Use Docker `latest` tag convention
[ "$VERSION" == "master" ] && VERSION=latest
echo VERSION=$VERSION >> $GITHUB_ENV
echo IMAGE_ID=$IMAGE_ID >> $GITHUB_ENV
- name: Build and push
uses: docker/build-push-action@v6
with:
platforms: linux/amd64,linux/arm64/v8
context: python
file: python/predictiveserver.Dockerfile
push: true
tags: ${{ env.IMAGE_ID }}:${{ env.VERSION }}
# https://github.com/docker/buildx/issues/1533
provenance: false