Skip to content

Change tests to use rocm 6.3 version and tol changes to make liger run on amd #860

Change tests to use rocm 6.3 version and tol changes to make liger run on amd

Change tests to use rocm 6.3 version and tol changes to make liger run on amd #860

Workflow file for this run

name: AMD GPU
on:
push:
branches:
- main
paths:
- "src/**"
- "test/**"
pull_request:
branches:
- main
paths:
- "src/**"
- "test/**"
schedule:
# Runs at 00:00 UTC daily
- cron: '0 0 * * *'
workflow_dispatch: # Enables manual trigger
concurrency:
# This causes it to cancel previous in-progress actions on the same PR / branch,
group: ${{ github.workflow }}-${{ github.event.pull_request.number || github.ref }}
cancel-in-progress: true
jobs:
checkstyle:
runs-on: ubuntu-latest
steps:
- name: Checkout code
uses: actions/checkout@v3
- name: Set up Python
uses: actions/setup-python@v3
with:
python-version: '3.10'
- name: Install dependencies
run: |
python -m pip install --upgrade pip
pip install -r dev/fmt-requirements.txt
- name: Run checkstyle
run: make checkstyle
tests:
runs-on: linux-mi300-gpu-1
needs: [checkstyle]
strategy:
matrix:
rocm_version: ['6.3']
steps:
- name: Checkout code
uses: actions/checkout@v3
- name: Set up Python
uses: actions/setup-python@v3
with:
python-version: '3.10'
- name: Setup Dependencies
run: |
rocm-smi
python -m pip install --upgrade pip
pip install -e .[dev] --extra-index-url https://download.pytorch.org/whl/nightly/rocm${{ matrix.rocm_version }}
- name: List Python Environments
run: python -m pip list
- name: Run Unit Tests
run: |
make test
make test-convergence