NVIDIA
diff --git a/‎.github/workflows/mlir-tensorrt-build-test.yml‎
Lines changed: 1 addition & 0 deletions b/‎.github/workflows/mlir-tensorrt-build-test.yml‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎.github/workflows/mlir-tensorrt-ci.yml‎
Lines changed: 38 additions & 12 deletions b/‎.github/workflows/mlir-tensorrt-ci.yml‎
Lines changed: 38 additions & 12 deletions
diff --git a/‎.github/workflows/mlir-tensorrt-release.yml‎
Lines changed: 152 additions & 0 deletions b/‎.github/workflows/mlir-tensorrt-release.yml‎
Lines changed: 152 additions & 0 deletions
diff --git a/‎.github/workflows/mlir-tensorrt/generate-matrix.py‎
Lines changed: 30 additions & 0 deletions b/‎.github/workflows/mlir-tensorrt/generate-matrix.py‎
Lines changed: 30 additions & 0 deletions
diff --git a/‎mlir-tensorrt/.clang-format-ignore‎
Lines changed: 1 addition & 0 deletions b/‎mlir-tensorrt/.clang-format-ignore‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎mlir-tensorrt/CMakeLists.txt‎
Lines changed: 1 addition & 0 deletions b/‎mlir-tensorrt/CMakeLists.txt‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎mlir-tensorrt/CMakeOptions.cmake‎
Lines changed: 4 additions & 1 deletion b/‎mlir-tensorrt/CMakeOptions.cmake‎
Lines changed: 4 additions & 1 deletion
diff --git a/‎mlir-tensorrt/Version.cmake‎
Lines changed: 8 additions & 0 deletions b/‎mlir-tensorrt/Version.cmake‎
Lines changed: 8 additions & 0 deletions
diff --git a/‎mlir-tensorrt/build_tools/cmake/MTRTCommonFunctions.cmake‎
Lines changed: 2 additions & 0 deletions b/‎mlir-tensorrt/build_tools/cmake/MTRTCommonFunctions.cmake‎
Lines changed: 2 additions & 0 deletions
@@ -51,6 +51,7 @@ jobs:
       options: >-
         --gpus all
         --shm-size=1g
+    timeout-minutes: 120
     steps:
       # Checkout the repository
       - name: Checkout TensorRT-Incubator
 
@@ -7,16 +7,15 @@ on:
     branches:
       - "pull-request/[0-9]+"
       - "main"
-  # Disable the release and nightly CI for now, we will enable them later
-  #   # this is for release CI
-  #   tags:
-  #     # release tag example: v0.4.2
-  #     # release candidate tag example: v0.4.2-rc1
-  #     - v[0-9]+.[0-9]+.[0-9]+-rc[0-9]+
-  # workflow_dispatch:
-  # # this is for nightly CI, it will be automatically triggered by the schedule on main branch only
-  # schedule:
-  #   - cron: '0 0 * * *'  # Runs at 00:00 UTC every day (minute hour day-of-month month-of-year day-of-week)
+    # this is for release CI
+    tags:
+      # release tag example: v0.4.2
+      # release candidate tag example: v0.4.2-rc1
+      - v[0-9]+.[0-9]+.[0-9]+-rc[0-9]+
+  workflow_dispatch:
+  # this is for nightly CI, it will be automatically triggered by the schedule on main branch only
+  schedule:
+    - cron: '0 0 * * *'  # Runs at 00:00 UTC every day (minute hour day-of-month month-of-year day-of-week)
 
 env:
   DEFAULT_IMAGE: ghcr.io/nvidia/tensorrt-incubator/mlir-tensorrt:cuda12.9-ubuntu24.04-0.1
@@ -45,6 +44,12 @@ jobs:
           git config --global --add safe.directory "${GITHUB_WORKSPACE}"
 
           EVENT_NAME="${{ github.event_name }}"
+          REF_TYPE="${{ github.ref_type }}"
+          if [ "${EVENT_NAME}" = "schedule" ] || [ "${EVENT_NAME}" = "workflow_dispatch" ] || [ "${REF_TYPE}" = "tag" ]; then  # each test needs its own [ ]; '||' is not valid inside single brackets
+            echo "github.event_name: ${EVENT_NAME} or github.ref_type: ${REF_TYPE}"
+            echo "has_changes=true" >> "${GITHUB_OUTPUT}"
+            exit 0  # scheduled, manual and tag runs always report changes, skipping the range detection below
+          fi
           DEFAULT_BASE="${{ github.event.repository.default_branch || 'main' }}"
           RANGE=""
           if [ "${EVENT_NAME}" = "push" ]; then
@@ -85,7 +90,7 @@ jobs:
   format-check:
     name: Lint Check
     needs: changes
-    if: ${{ needs.changes.outputs.has_changes == 'true' }}
+    if: ${{ needs.changes.outputs.has_changes == 'true' || github.event_name == 'schedule' || github.ref_type == 'tag' }}
     runs-on: ubuntu-latest
     container:
       image: ghcr.io/nvidia/tensorrt-incubator/mlir-tensorrt:cuda12.9-ubuntu24.04-0.1
@@ -170,7 +175,6 @@ jobs:
     needs:
       - changes
       - format-check
-      - mlir-tensorrt-build-test-x86_64
     if: ${{ needs.changes.outputs.has_changes == 'true' && needs.format-check.outputs.channel != 'release' }}
     uses: ./.github/workflows/mlir-tensorrt-build-test.yml
     with:
@@ -179,6 +183,28 @@ jobs:
       arch: aarch64
       github_runner: linux-arm64-gpu-l4-latest-1
 
+  mlir-tensorrt-wheel-tarball-release-x86_64:
+    name: Release on x86_64
+    needs:
+      - format-check
+    if: ${{ needs.format-check.outputs.channel == 'release' }}
+    uses: ./.github/workflows/mlir-tensorrt-release.yml
+    with:
+      build-matrix: ${{ needs.format-check.outputs.matrix }}
+      arch: x86_64
+      github_runner: linux-amd64-gpu-h100-latest-1
+
+  mlir-tensorrt-wheel-tarball-release-aarch64:
+    name: Release on aarch64
+    needs:
+      - format-check
+    if: ${{ needs.format-check.outputs.channel == 'release' }}
+    uses: ./.github/workflows/mlir-tensorrt-release.yml
+    with:
+      build-matrix: ${{ needs.format-check.outputs.matrix }}
+      arch: aarch64
+      github_runner: linux-arm64-gpu-l4-latest-1
+
 concurrency:
   group: ${{ github.workflow }}-${{ github.event.pull_request.number || github.ref_name }}-mlir-tensorrt
   cancel-in-progress: true
 
@@ -0,0 +1,152 @@
+name: MLIR-TensorRT Release Wheel and Tarball
+
+on:
+  workflow_call:
+    inputs:
+      build-matrix:
+        description: 'Build matrix to utilize'
+        default: ""
+        type: string
+      arch:
+        description: 'Architecture, valid values are "x86_64" or "aarch64"'
+        default: "x86_64"
+        type: string
+      github_runner:
+        description: 'Runner, valid values are "linux-amd64-gpu-h100-latest-1" or "linux-arm64-gpu-l4-latest-1"'
+        default: "linux-amd64-gpu-h100-latest-1"
+        type: string
+
+defaults:
+  run:
+    shell: bash
+
+jobs:
+  mlir-tensorrt-wheel-build:
+    name: ${{ inputs.arch }}-cu${{ matrix.cuda }}-trt${{ matrix.trt }}-wheel-build
+    strategy:
+      fail-fast: false
+      max-parallel: 1
+      matrix: ${{ fromJSON(inputs.build-matrix) }}
+    env:
+      # eg. 10.12 or 10.13
+      DOWNLOAD_TENSORRT_VERSION: ${{ matrix.trt }}
+      LATEST_CUDA_VERSION: ${{ matrix.latest_cuda }}
+      LATEST_TENSORRT_VERSION: ${{ matrix.latest_trt }}
+      ARCH: ${{ inputs.arch }}
+      CCACHE_DIR: ${{ github.workspace }}/mlir-tensorrt/ccache
+      CPM_SOURCE_CACHE: ${{ github.workspace }}/mlir-tensorrt/.cache.cpm
+      CMAKE_PRESET: distribution-wheels
+      CCACHE_KEY: mlir-tensorrt-ccache-v1-${{ inputs.arch }}-distribution-wheels
+      # if exact cache key is not matched, fallback to the restore key to restore the cache
+      CCACHE_RESTORE_KEY: mlir-tensorrt-ccache-v1-${{ inputs.arch }}-
+      CPM_KEY: mlir-tensorrt-cpm-v1
+      CPM_RESTORE_KEY: mlir-tensorrt-cpm-v1
+      WHEELS_DIR: ${{ github.workspace }}/mlir-tensorrt/.wheels/
+    runs-on: ${{ inputs.github_runner }}
+    timeout-minutes: 120
+    container:
+      image: ${{ matrix.docker_image }}
+      options: >-
+        --gpus all
+        --shm-size=1g
+    steps:
+      # Checkout the repository
+      - name: Checkout TensorRT-Incubator
+        uses: actions/checkout@v5
+        with:
+          fetch-depth: 5
+
+      # Create cache folders
+      - name: Create Cache Folders
+        run: |
+          set -euo pipefail
+          set -x
+          mkdir -p ${{ env.CCACHE_DIR }}
+          mkdir -p ${{ env.CPM_SOURCE_CACHE }}
+
+      # Restore cache, if exists.
+      - name: Restore CCache
+        id: restore-ccache
+        uses: actions/cache/restore@v4
+        with:
+          key: ${{ env.CCACHE_KEY }}
+          restore-keys: |
+            ${{ env.CCACHE_RESTORE_KEY }}
+          path: |
+            ${{ env.CCACHE_DIR }}
+
+      - name: Restore CPM cache
+        id: restore-cpm
+        uses: actions/cache/restore@v4
+        with:
+          key: ${{ env.CPM_KEY }}
+          enableCrossOsArchive: true
+          restore-keys: |
+            ${{ env.CPM_RESTORE_KEY }}
+          # exclude only works for the relative path pattern
+          # restore must use the exactly same path defined in the save step, cannot ignore the exclude path
+          path: |
+            mlir-tensorrt/.cache.cpm/*
+            !mlir-tensorrt/.cache.cpm/tensorrt
+            !mlir-tensorrt/.cache.cpm/tensorrt/**
+
+      # Build wheels
+      - name: Build Wheels With CUDA:${{ matrix.cuda }} + TensorRT:${{ matrix.trt }}
+        env:
+          ENABLE_ASAN: "OFF"
+        run: |
+          set -euo pipefail
+          set -x
+          cd mlir-tensorrt
+          export MTRT_TENSORRT_VERSION=${{ matrix.trt }}
+          # TODO: remove this, once patch is in our rockylinux prebuilt image
+          dnf install -yq patch
+          # mlir-tensorrt-tools is not cuda, trt dependent, so we only build it once
+          # mlir-tensorrt-compiler, mlir-tensorrt-runtime is built per cuda, trt version
+          if [[ "${{ matrix.cuda }}" == "${{ env.LATEST_CUDA_VERSION }}" && "${{ matrix.trt }}" == "${{env.LATEST_TENSORRT_VERSION }}" ]]; then
+            ./build_tools/scripts/cicd-build-wheels.sh
+          else
+            PACKAGES="mlir_tensorrt_compiler mlir_tensorrt_runtime" \
+            ./build_tools/scripts/cicd-build-wheels.sh
+          fi
+
+      # Save ccache when cache is not hit or cache was a fallback(cache-matched is not the same as the cache key)
+      - name: Save CCache
+        uses: actions/cache/save@v4
+        if: ${{ steps.restore-ccache.outputs.cache-hit != 'true' || steps.restore-ccache.outputs['cache-matched-key'] != env.CCACHE_KEY }}
+        with:
+          key: ${{ env.CCACHE_KEY }}
+          path: |
+            ${{ env.CCACHE_DIR }}
+
+      # Save cpm cache
+      - name: Save CPM Cache
+        # The CPM cache is shared between x86_64 and aarch64, so only the x86_64 job saves it on a cache miss;
+        # this prevents both architectures from trying to save the same cache key.
+        if: ${{ inputs.arch == 'x86_64' &&
+              (
+                steps.restore-cpm.outputs.cache-hit != 'true' ||
+                steps.restore-cpm.outputs['cache-matched-key'] != env.CPM_KEY
+              )
+            }}
+        uses: actions/cache/save@v4
+        with:
+          key: ${{ env.CPM_KEY }}
+          enableCrossOsArchive: true
+          # exclude only works for the relative path pattern
+          path: |
+            mlir-tensorrt/.cache.cpm/*
+            !mlir-tensorrt/.cache.cpm/tensorrt
+            !mlir-tensorrt/.cache.cpm/tensorrt/**
+
+      # Upload wheels to GitHub Actions artifact
+      - name: Upload Wheels
+        uses: actions/upload-artifact@v4
+        with:
+          name: release-wheels-${{ inputs.arch }}-cu${{ matrix.cuda }}-trt${{ matrix.trt }}
+          path: ${{ env.WHEELS_DIR }}
+          if-no-files-found: error
+
+concurrency:
+  group: ${{ github.workflow }}-${{ github.event.pull_request.number || github.ref_name }}-mlir-tensorrt-release-${{ inputs.arch }}
+  cancel-in-progress: true
@@ -10,12 +10,20 @@
     "release": ["12.9", "13.0"],
 }
 
+LATEST_CUDA_VERSION = "13.0"
+LATEST_TRT_VERSION = "10.13"
+
 TRT_VERSIONS_DICT = {
     "nightly": ["10.12", "10.13"],
     "test": ["10.13"],
     "release": ["10.12", "10.13"],
 }
 
+TRT_VERSIONS_CUDA_MIN_MAX_DICT = {
+    "10.12": {"min_cuda_version": "12.9", "max_cuda_version": "12.9"},
+    "10.13": {"min_cuda_version": "12.9", "max_cuda_version": "13.0"},
+}
+
 CMAKE_PRESET_DICT = {
     "nightly": "github-cicd",
     "test": "github-cicd",
@@ -40,6 +48,10 @@
 }
 
 
+def _version_tuple(version: str) -> tuple[int, ...]:
+    return tuple(int(part) for part in version.split("."))
+
+
 def main(args: list[str]) -> None:
     parser = argparse.ArgumentParser()
     parser.add_argument(
@@ -64,12 +76,30 @@ def main(args: list[str]) -> None:
     matrix_dict = {"include": []}
     for cuda_version in cuda_versions:
         for trt_version in trt_versions:
+            if trt_version not in TRT_VERSIONS_CUDA_MIN_MAX_DICT:
+                raise Exception(
+                    f"TRT version {trt_version} is not in TRT_VERSIONS_CUDA_MIN_MAX_DICT"
+                )
+            min_cuda_version = TRT_VERSIONS_CUDA_MIN_MAX_DICT[trt_version][
+                "min_cuda_version"
+            ]
+            max_cuda_version = TRT_VERSIONS_CUDA_MIN_MAX_DICT[trt_version][
+                "max_cuda_version"
+            ]
+            if not (
+                _version_tuple(min_cuda_version)
+                <= _version_tuple(cuda_version)
+                <= _version_tuple(max_cuda_version)
+            ):
+                continue
             matrix_dict["include"].append(
                 {
                     "cuda": cuda_version,
                     "trt": trt_version,
                     "docker_image": docker_images[cuda_version],
                     "cmake_preset": cmake_preset,
+                    "latest_cuda": LATEST_CUDA_VERSION,
+                    "latest_trt": LATEST_TRT_VERSION,
                 }
             )
     print(json.dumps(matrix_dict))
 
@@ -0,0 +1 @@
+**/*.td
@@ -7,6 +7,7 @@ include(MTRTCMakePolicy NO_POLICY_SCOPE)
 include(CMakeDependentOption)
 include(CMakePrintHelpers)
 include(MTRTCPM)
+include(MTRTCMakeExtras)
 include(MTRTDependencies)
 include(MTRTFeatures)
 include(AddMLIRTensorRT)
 
@@ -39,9 +39,11 @@ mtrt_option(MLIR_TRT_RELATIVE_DEBUG_PATHS
 # whereas the definition of the source groups belonging to those packages
 # are distributed across multiple sub-directories.
 set(MLIR_TRT_ENABLE_PROJECTS_DEFAULT
-  executor tensorrt compiler
+  executor tensorrt
 )
 
+list(APPEND MLIR_TRT_ENABLE_PROJECTS_DEFAULT "compiler")
+
 if(MLIR_TRT_ENABLE_PYTHON)
   list(APPEND MLIR_TRT_ENABLE_PROJECTS_DEFAULT "integrations/python")
 endif()
@@ -74,3 +76,4 @@ if(MLIR_TRT_ENABLE_NCCL)
 else()
   set(MLIR_TRT_NCCL_TARGET "" CACHE INTERNAL "")
 endif()
+
@@ -3,3 +3,11 @@ set(MLIR_TENSORRT_VERSION_MINOR "4")
 set(MLIR_TENSORRT_VERSION_PATCH "3")
 set(MLIR_TENSORRT_VERSION
   "${MLIR_TENSORRT_VERSION_MAJOR}.${MLIR_TENSORRT_VERSION_MINOR}.${MLIR_TENSORRT_VERSION_PATCH}")
+
+# The source release script replaces the empty string with an actual
+# hash, so don't change the default here.
+set(MLIR_TENSORRT_GIT_HASH "")
+
+set(CPACK_PACKAGE_VERSION_MAJOR ${MLIR_TENSORRT_VERSION_MAJOR})
+set(CPACK_PACKAGE_VERSION_MINOR ${MLIR_TENSORRT_VERSION_MINOR})
+set(CPACK_PACKAGE_VERSION_PATCH ${MLIR_TENSORRT_VERSION_PATCH})
@@ -332,6 +332,8 @@ function(mtrt_add_project_library name)
     add_mlir_library(${name} ${lib_type_args} DISABLE_INSTALL EXCLUDE_FROM_LIBMLIR ${ARG_UNPARSED_ARGUMENTS})
   endif()
 
+  mtrt_apply_extra_check_options("${name}")
+
   if(ARG_MLIR_LIBS)
     list(POP_FRONT ARG_MLIR_LIBS VISIBILITY)
     mtrt_target_link_mlir_libraries(${name} ${VISIBILITY} ${ARG_MLIR_LIBS})