
Commit c76570b

[CI] Add manylinux auditwheel repair
[executor] Introduce a pass to expand unsupported Math operations

Adds pass `executor-expand-math-ops` to expand unsupported Math operations into compositions of supported operations. This pass utilizes the upstream Math dialect rewrite pattern sets (e.g. `math-expand-ops`, `math-polynomial-approx`, etc.).

GitOrigin-RevId: 5d1736f1a5a398ee37a003461ee2d32cd0a5c06e

[mlir-tensorrt] Add Stablehlo patch for various Stablehlo upstream pass issues

Add a Stablehlo patch for the following issues:
1. No Atan2 scalar float support in the StablehloToScalarOp template.
2. Fix a crash when converting `stablehlo.bitcast_convert` with complex type to arith::BitcastOp.
3. Fix StablehloRefineShapes accidentally erasing functions with side effects.
4. Fix a crash in StablehloAggressiveFolder when folding `stablehlo.compare` if the result type has static dimensions erased.

[compiler][emitc] Add support for embedding and emitting runtime files

This change enables the compiler to emit the required Standalone runtime sources and headers as artifacts when translating to EmitC, eliminating the need for users to manually locate and copy runtime files from the source tree.

The StandaloneCPP runtime files (*.cpp, *.h) are now embedded directly into the compiler binary at build time using a new CMake script (GenerateEmbeddedStandaloneCPP.cmake) that generates a translation unit containing the file contents as raw string literals.

A new pass, `EmitCppSupportFilesPass`, analyzes the EmitC module to determine which runtime components are required (Core, CUDA, TensorRT) and emits them as `executor.file_artifact` operations. The pass can also optionally generate an example CMakeLists.txt and a test driver source file.
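The embedding scheme described above (a CMake-generated translation unit holding file contents as C++ raw string literals) can be illustrated with a small generator sketch. The `kEmbedded_` naming and output layout here are assumptions for illustration only, not what GenerateEmbeddedStandaloneCPP.cmake actually emits:

```python
from pathlib import Path

def embed_files(paths, out_cpp):
    """Generate a C++ translation unit that embeds each input file as a raw
    string literal. A custom delimiter (`emb`) avoids escaping quotes and
    parentheses that appear in the embedded source text."""
    chunks = ["// Auto-generated: embedded runtime sources. Do not edit.\n"]
    for p in map(Path, paths):
        # Derive a C identifier from the file name, e.g. Runtime.h -> Runtime_h
        ident = p.name.replace(".", "_").replace("-", "_")
        chunks.append(
            f'const char *kEmbedded_{ident} = R"emb({p.read_text()})emb";\n'
        )
    Path(out_cpp).write_text("".join(chunks))
```

At compile time the generated .cpp is simply added to the compiler's sources, so the file contents become addressable data in the binary with no install-time file lookup.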
New compiler options control emission:
- `--emitc-emit-support-files`: Emit all support files (runtime, CMake, driver)
- `--emitc-emit-runtime-files`: Emit only the required runtime subset
- `--emitc-emit-cmake-file`: Emit an example CMake file
- `--emitc-emit-test-driver`: Emit a C++ test driver source file

The `-o` output path option is now scoped to global CLI parsing only, to avoid conflicts when parsing option strings programmatically.

GitOrigin-RevId: 330f1f17e78584131b1b4a482e7600b39d3dfb27

[compiler] NFC: Add missing `memref-to-cuda` test cases

[integrations/PJRT] Fix CMake configuration for PJRT library

- The previous change to the PJRT CMake config broke the build when BUILD_SHARED_LIBS is set to ON.
- The fix is simply to undo the change to the location of the CMAKE_CXX_VISIBILITY_PRESET setting.
- In addition, the visibility fix using the linker option is improved using the CMake `LINKER:` prefix.
- Finally, the linker option fixed the issue that was causing us to build an additional PJRT static library for unit tests, so we can eliminate the extra library and just build the one monolithic shared library for testing and deployment. This additionally seems to act as a check against LLVM/MLIR symbol visibility.

GitOrigin-RevId: 24c3090fca08602319466e2eefeb9f6fb0f68677

NFC: Consolidate CUDA integration tests and simplify test commands

GitOrigin-RevId: 94c9f43ca8c51c6f02edcc8f26725268a84210a1

[mlir-tensorrt] Integrate internal changes

---

[compiler] Add cuda.get_program_device op

Introduce `cuda.get_program_device` as a pure/speculatable way to map a program logical device id (i32) to a CUDA device ordinal (i32).

GitOrigin-RevId: 00512cc5a9e9c61023e1d9de734b2383da369bcf

---

[compiler] Refactor device management and stream creation utilities

This commit introduces a new device management model to support multi-device SPMD and MPMD programs and refactors stream creation to use reusable utility functions.
The primary motivation is to enable more flexible device assignment, where programs can be assigned to specific CUDA ordinals via logical device IDs, laying the groundwork for better multi-device support.

GitOrigin-RevId: 447b72743e64f394671f866fcdfdb0d6f0f3d579

---

[compiler|executor] Refactor plugin call stream handling

This change refactors how CUDA streams are handled for plugin calls in the executor dialect. Previously, when no stream was provided to a CallPluginOp, the lowering would create and use a global CUDA stream (stream0). This approach had several issues:
1. It tightly coupled the executor dialect to CUDA-specific stream creation.
2. It required maintaining global stream state across compilation.
3. It made the stream handling implicit and harder to reason about.

The new approach uses null streams (nullptr) when no explicit stream is provided. This is the standard CUDA convention, where a null stream represents the default stream.

The changes include:
- Modified `executor.call_plugin` to accept any type for the stream operand (not just `!executor.ptr<host>`), allowing frontend dialects to pass their own stream representations (e.g. `!cuda.stream`).
- Updated the assembly format to print the stream type for clarity.
- Removed the `getGlobalCudaStream` helper method from ConvertToExecutorPattern.
- Changed CallPluginConversionPattern to create a null pointer (inttoptr 0) when no stream is provided, instead of creating a global stream.
- Updated the StablehloToPlan conversion to use `cuda::getOrCreateDefaultStream0` to explicitly create CUDA streams when converting TVM FFI custom calls.
- Added a CUDADialect dependency to the StablehloToPlan pass and its CMakeLists.

This makes stream handling more explicit and flexible, allowing different frontend dialects to manage their own stream creation while falling back to null streams (the CUDA default stream) when appropriate.

GitOrigin-RevId: 764238bc58308d5d284f8e32da91c7e5f90fdf0c
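The null-stream fallback adopted by the plugin-call refactor above can be sketched as follows. The function and constant names are hypothetical, for illustration only; the real lowering materializes an `inttoptr 0` in executor IR rather than calling a helper:

```python
# Hypothetical sketch of the null-stream convention: when a plugin call has
# no explicit stream operand, lower it to a null pointer, which CUDA
# interprets as the default stream; otherwise pass the frontend's own
# stream value through unchanged.
NULL_STREAM = 0  # stands in for nullptr / inttoptr 0

def resolve_plugin_stream(explicit_stream=None):
    """Return the stream handle a lowered plugin call should receive."""
    if explicit_stream is not None:
        return explicit_stream  # e.g. a frontend !cuda.stream value
    return NULL_STREAM          # CUDA default stream; no global state needed
```

The design point is that the fallback requires no per-module global stream, so the executor dialect stays agnostic of CUDA stream creation.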
Parent: bce288b

File tree

131 files changed: +3595, -632 lines


.github/workflows/mlir-tensorrt-build-test.yml

Lines changed: 2 additions & 2 deletions

@@ -4,7 +4,7 @@ on:
   workflow_call:
     inputs:
       channel:
-        description: 'Channel, valid values are "nightly", "test", or "release"'
+        description: 'Channel, valid values are "nightly", "test", "release" or "pypi-release"'
         default: "test"
         type: string
       build-matrix:
@@ -26,7 +26,7 @@ jobs:
     env:
       # eg. TENSORRT_VERSION: 10.12 or 10.13
       MLIR_TRT_DOWNLOAD_TENSORRT_VERSION: ${{ matrix.trt }}
-      # eg. CHANNEL: nightly, test or release
+      # eg. CHANNEL: nightly, test, release or pypi-release
       CHANNEL: ${{ inputs.channel }}
       ARCH: ${{ matrix.arch }}
       CMAKE_PRESET: ${{ matrix.cmake_preset }}
Lines changed: 194 additions & 0 deletions (new file)

name: MLIR-TensorRT PyPI Release CI

on:
  workflow_dispatch:
    inputs:
      confirm_publish_to_pypi:
        description: 'I confirm that I have verified version to be published to pypi.org'
        required: true
        type: boolean
        default: false

defaults:
  run:
    shell: bash

jobs:
  generate-matrix:
    name: Generate Build Matrix (pypi-release)
    runs-on: ubuntu-latest
    outputs:
      matrix: ${{ steps.generate-matrix.outputs.matrix }}
    steps:
      - uses: actions/checkout@v6
        with:
          fetch-depth: 5
      - name: Generate Build Matrix
        id: generate-matrix
        run: |
          set -euo pipefail
          set -x
          MATRIX_BLOB="$(python3 ./.github/workflows/mlir-tensorrt/generate-matrix.py --channel pypi-release)"
          echo "${MATRIX_BLOB}"
          echo "matrix=${MATRIX_BLOB}" >> "${GITHUB_OUTPUT}"

  pypi-release-wheels-build:
    name: ${{ matrix.arch }} - Build PyPI Release Wheels
    needs:
      - generate-matrix
    permissions:
      id-token: write
      packages: write
      contents: read
    strategy:
      matrix: ${{ fromJSON(needs.generate-matrix.outputs.matrix) }}
    runs-on: ${{ matrix.github_runner }}
    env:
      MLIR_TRT_DOWNLOAD_TENSORRT_VERSION: ${{ matrix.trt }}
      CMAKE_PRESET: ${{ matrix.cmake_preset }}
      CCACHE_RESTORE_KEY: mlir-tensorrt-ccache-v1-${{ matrix.arch }}-${{ matrix.cmake_preset }}
      CPM_RESTORE_KEY: mlir-tensorrt-cpm-v1
    timeout-minutes: 120
    container:
      # pypi auditwheel repair requires rockylinux8
      image: ${{ matrix.docker_image }}
      options: >-
        --gpus all
        --shm-size=1g
    steps:
      - name: Checkout TensorRT-Incubator
        uses: actions/checkout@v6
        with:
          fetch-depth: 5

      - name: Create Cache Folders
        run: |
          set -euo pipefail
          set -x
          export CPM_SOURCE_CACHE=${GITHUB_WORKSPACE}/mlir-tensorrt/.cache.cpm
          export CCACHE_DIR=${GITHUB_WORKSPACE}/mlir-tensorrt/ccache

          echo "CPM_SOURCE_CACHE=$CPM_SOURCE_CACHE" >> "$GITHUB_ENV"
          echo "CCACHE_DIR=$CCACHE_DIR" >> "$GITHUB_ENV"

          mkdir -p ${CCACHE_DIR}
          mkdir -p ${CPM_SOURCE_CACHE}

      - name: Compute CCache Key
        id: ccache-key
        run: |
          hash=$( (find mlir-tensorrt/compiler \
                    mlir-tensorrt/common \
                    mlir-tensorrt/kernel \
                    mlir-tensorrt/tensorrt \
                    mlir-tensorrt/integrations \
                    mlir-tensorrt/executor \
                    -type f \( -name '*.cpp' -o -name '*.h' \) \
                    -exec sha256sum {} \; ; \
                  sha256sum mlir-tensorrt/DependencyProvider.cmake \
                    mlir-tensorrt/CMakeLists.txt) \
                 | sort | sha256sum | cut -d' ' -f1)
          echo "key=${{ env.CCACHE_RESTORE_KEY }}-${hash}" >> $GITHUB_OUTPUT

      - name: Compute CPM Key
        id: cpm-key
        run: |
          hash=$(sha256sum mlir-tensorrt/DependencyProvider.cmake | cut -d' ' -f1)
          echo "key=${{ env.CPM_RESTORE_KEY }}-${hash}" >> $GITHUB_OUTPUT

      - name: Restore CCache
        id: restore-ccache
        uses: actions/cache/restore@v4
        with:
          key: ${{ steps.ccache-key.outputs.key }}
          restore-keys: |
            ${{ env.CCACHE_RESTORE_KEY }}
          path: |
            ${{ env.CCACHE_DIR }}

      - name: Restore CPM cache
        id: restore-cpm
        uses: actions/cache/restore@v4
        with:
          key: ${{ steps.cpm-key.outputs.key }}
          enableCrossOsArchive: true
          restore-keys: |
            ${{ env.CPM_RESTORE_KEY }}
          path: |
            mlir-tensorrt/.cache.cpm/*
            !mlir-tensorrt/.cache.cpm/tensorrt
            !mlir-tensorrt/.cache.cpm/tensorrt/**

      - name: Build Wheels With CUDA:${{ matrix.cuda }} + TensorRT:${{ matrix.trt }}
        env:
          MLIR_TRT_DOWNLOAD_TENSORRT_VERSION: ${{ matrix.trt }}
          ARCH: ${{ matrix.arch }}
          CMAKE_PRESET: distribution-wheels
        run: |
          set -euo pipefail
          set -x
          cd mlir-tensorrt
          # Build only pjrt wheels for PyPI upload, with auditwheel repair
          MLIR_TRT_PYPI=1 PACKAGES="pjrt" ./build_tools/scripts/cicd-build-wheels.sh

      - name: Upload Wheels
        uses: actions/upload-artifact@v4
        with:
          name: release-wheels-${{ matrix.arch }}-cu${{ matrix.cuda }}-trt${{ matrix.trt }}
          path: mlir-tensorrt/dist
          if-no-files-found: error

  test-pypi-release-wheels-publish:
    name: Publish to TestPyPI
    needs: [pypi-release-wheels-build]
    runs-on: ubuntu-latest
    environment:
      name: testpypi
      url: https://test.pypi.org/project/mlir-tensorrt-jax/
    permissions:
      id-token: write
      packages: write
      contents: read
    steps:
      - name: Download built wheels
        uses: actions/download-artifact@v4
        with:
          pattern: release-wheels-*
          merge-multiple: true
          path: dist

      - name: Publish to TestPyPI
        uses: pypa/gh-action-pypi-publish@release/v1
        with:
          skip-existing: true
          verbose: true
          repository-url: https://test.pypi.org/legacy/

  pypi-release-wheels-publish:
    name: Publish to PyPI
    if: ${{ inputs.confirm_publish_to_pypi }}
    needs: [pypi-release-wheels-build]
    runs-on: ubuntu-latest
    permissions:
      id-token: write
      packages: write
      contents: read
    steps:
      - name: Download built wheels
        uses: actions/download-artifact@v4
        with:
          pattern: release-wheels-*
          merge-multiple: true
          path: dist

      - name: Publish to PyPI
        uses: pypa/gh-action-pypi-publish@release/v1
        with:
          verbose: true
          skip-existing: true
          user: __token__
          password: ${{ secrets.PYPI_API_TOKEN }}

concurrency:
  group: ${{ github.workflow }}-${{ github.event.pull_request.number || github.ref_name }}-mlir-tensorrt-pypi
  cancel-in-progress: true
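The `Compute CCache Key` step above derives a cache key from a combined hash of the tracked sources. The same computation can be sketched in Python (the helper name is hypothetical); like the shell pipeline, it sorts the per-file digest lines so the result is independent of file enumeration order:

```python
import hashlib
from pathlib import Path

def content_hash(paths):
    """sha256 over the sorted per-file `sha256sum`-style lines, mirroring
    the `find ... -exec sha256sum | sort | sha256sum` pipeline in the
    workflow step."""
    lines = sorted(
        f"{hashlib.sha256(Path(p).read_bytes()).hexdigest()}  {p}"
        for p in paths
    )
    return hashlib.sha256("\n".join(lines).encode()).hexdigest()
```

Any change to a hashed file changes the key, so ccache is restored from the exact-match entry when sources are unchanged and falls back to the `CCACHE_RESTORE_KEY` prefix otherwise.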

.github/workflows/mlir-tensorrt-release.yml

Lines changed: 2 additions & 2 deletions

@@ -23,8 +23,8 @@ jobs:
       # eg. 10.12 or 10.13
       MLIR_TRT_DOWNLOAD_TENSORRT_VERSION: ${{ matrix.trt }}
       ARCH: ${{ matrix.arch }}
-      CMAKE_PRESET: distribution-wheels
-      CCACHE_RESTORE_KEY: mlir-tensorrt-ccache-v1-${{ matrix.arch }}-distribution-wheels
+      CMAKE_PRESET: ${{ matrix.cmake_preset }}
+      CCACHE_RESTORE_KEY: mlir-tensorrt-ccache-v1-${{ matrix.arch }}-${{ matrix.cmake_preset }}
       CPM_RESTORE_KEY: mlir-tensorrt-cpm-v1
     runs-on: ${{ matrix.github_runner }}
     timeout-minutes: 120

.github/workflows/mlir-tensorrt/generate-matrix.py

Lines changed: 14 additions & 5 deletions

@@ -31,12 +31,19 @@
             "trt": "10.13",
         },
     ],
+    "pypi-release": [
+        {
+            "cuda": "13.0",
+            "trt": "10.13",
+        },
+    ],
 }

 ARCH_LIST_DICT = {
     "test": ["x86_64"],
     "release": ["x86_64", "aarch64"],
     "nightly": ["x86_64", "aarch64"],
+    "pypi-release": ["x86_64", "aarch64"],
 }

 GH_RUNNER_DICT = {
@@ -47,9 +54,8 @@
 CMAKE_PRESET_DICT = {
     "nightly": "github-cicd",
     "test": "github-cicd",
-    # release should use the release wheel build preset
-    # TODO: add the release wheel build preset
-    "release": "github-cicd",
+    "release": "distribution-wheels",
+    "pypi-release": "distribution-wheels",
 }

 DOCKER_IMAGE_DICT = {
@@ -71,6 +77,9 @@
         "13.0": "ghcr.io/nvidia/tensorrt-incubator/mlir-tensorrt:cuda13.0-rockylinux9-0.1",
         },
     },
+    "pypi-release": {
+        "13.0": "ghcr.io/nvidia/tensorrt-incubator/mlir-tensorrt:cuda13.0-rockylinux8-0.1",
+    },
 }

@@ -84,9 +93,9 @@ def main(args: list[str]) -> None:
     )

     options = parser.parse_args(args)
-    if options.channel not in ("nightly", "test", "release"):
+    if options.channel not in ("nightly", "test", "release", "pypi-release"):
         raise Exception(
-            "--channel is invalid, please choose from nightly, test or release"
+            "--channel is invalid, please choose from nightly, test, release or pypi-release"
        )

     channel = options.channel
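As an aside, the manual channel check extended in the diff above could also be expressed with argparse's built-in `choices`, which rejects invalid values at parse time. A minimal standalone sketch, not the actual script:

```python
import argparse

# Minimal sketch: `choices` makes argparse itself reject invalid channels
# with a usage error, instead of validating after parse_args returns.
parser = argparse.ArgumentParser()
parser.add_argument(
    "--channel",
    required=True,
    choices=["nightly", "test", "release", "pypi-release"],
)
args = parser.parse_args(["--channel", "pypi-release"])
```

With `choices`, an invalid value such as `--channel bogus` causes argparse to exit with a usage message listing the allowed values, so the error text and the accepted set can never drift apart.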
Lines changed: 88 additions & 0 deletions (new file)

{
  "name": "cuda12.9-rockylinux8-prebuilt",
  "image": "ghcr.io/nvidia/tensorrt-incubator/mlir-tensorrt:cuda12.9-rockylinux8-0.1",
  "remoteUser": "nvidia",
  "updateRemoteUserUID": true,
  "runArgs": [
    "--name",
    "cuda12.9-rockylinux8-prebuilt-${localEnv:USER:nvidia}-${devcontainerId}",
    "--cap-add=SYS_PTRACE",
    "--security-opt",
    "seccomp=unconfined",
    "--shm-size=1g",
    "--ulimit",
    "memlock=-1",
    "--network=host"
  ],
  "hostRequirements": {
    "gpu": "optional"
  },
  "workspaceMount": "source=${localWorkspaceFolder}/..,target=/workspaces/TensorRT-Incubator,type=bind,consistency=cached",
  "workspaceFolder": "/workspaces/TensorRT-Incubator/mlir-tensorrt",
  "customizations": {
    "vscode": {
      "extensions": [
        "llvm-vs-code-extensions.vscode-clangd",
        "llvm-vs-code-extensions.vscode-mlir",
        "eamodio.gitlens",
        "ms-python.black-formatter",
        "ms-python.python"
      ],
      "settings": {
        "[python]": {
          "editor.defaultFormatter": "ms-python.black-formatter"
        },
        "mlir.pdll_compilation_databases": [
          "build/pdll_compile_commands.yml"
        ],
        "mlir.server_path": "build/bin/mlir-tensorrt-lsp-server",
        "files.exclude": {
          "**/.git": true,
          "**/.cache": true,
          "**/.venv*": true
        },
        "files.watcherExclude": {
          "**/.git/objects/**": true,
          "**/.git/subtree-cache/**": true,
          "**/.private*": true,
          "**/.venv*/**": true,
          "**/build/**": true
        },
        "search.exclude": {
          "**/.private*": true,
          "**/.venv*": true,
          "**/build": true
        },
        "python.analysis.include": [
          "integrations/python",
          "integrations/python/internal"
        ],
        "python.analysis.typeCheckingMode": "basic",
        "python.analysis.extraPaths": [
          "build/python_packages/mlir_tensorrt_compiler",
          "build/python_packages/mlir_tensorrt_runtime",
          "build/python_packages/tools"
        ],
        "python.analysis.exclude": [
          "**/build/**",
          "**/.cache.cpm/**",
          "**/*bazel*/**",
          "**/build_tools/**",
          "third_party"
        ]
      }
    }
  },
  "features": {
    "ghcr.io/devcontainers/features/common-utils:2": {
      "installZsh": true,
      "installOhMyZsh": true,
      "configureZshAsDefaultShell": false,
      "upgradePackages": false,
      "username": "nvidia",
      "userUid": "automatic",
      "userGid": "automatic"
    },
    "ghcr.io/devcontainers/features/git:1": {}
  }
}
