From eec8be70d255c8cd340161b7abde5ac233234255 Mon Sep 17 00:00:00 2001 From: James Le Houx Date: Wed, 27 May 2026 13:42:24 +0000 Subject: [PATCH] wheels: use sm_75-virtual PTX so T4 can JIT-compile MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit PTX is forward-compatible only: compute_90 PTX cannot be JIT-compiled for an older GPU, so sm_75 (T4) can't use it. Change to 75-virtual: T4 JITs from compute_75 PTX, A100 uses sm_80 SASS, H100 JITs from compute_75 PTX (forward-compatible). --- .github/workflows/pypi-wheels-gpu.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/pypi-wheels-gpu.yml b/.github/workflows/pypi-wheels-gpu.yml index c9d4322..815bd55 100644 --- a/.github/workflows/pypi-wheels-gpu.yml +++ b/.github/workflows/pypi-wheels-gpu.yml @@ -138,7 +138,7 @@ jobs: -DAMReX_GPU_BACKEND=CUDA '-DAMReX_CUDA_ARCH=80' -DCMAKE_POSITION_INDEPENDENT_CODE=ON - '-DCMAKE_CUDA_ARCHITECTURES=80-real;90-virtual' + '-DCMAKE_CUDA_ARCHITECTURES=80-real;75-virtual' -DCMAKE_CUDA_HOST_COMPILER=/opt/rh/gcc-toolset-13/root/usr/bin/g++ '-DCMAKE_CUDA_FLAGS=-Xfatbin --compress-all' && cmake --build /tmp/amrex/build -j$(nproc) && @@ -175,7 +175,7 @@ jobs: CMAKE_CXX_COMPILER="mpicxx" CMAKE_PREFIX_PATH="/usr/local" CMAKE_GENERATOR="Unix Makefiles" - CMAKE_ARGS="-DGPU_BACKEND=CUDA '-DCMAKE_CUDA_ARCHITECTURES=80-real;90-virtual' -DCMAKE_CUDA_HOST_COMPILER=/opt/rh/gcc-toolset-13/root/usr/bin/g++" + CMAKE_ARGS="-DGPU_BACKEND=CUDA '-DCMAKE_CUDA_ARCHITECTURES=80-real;75-virtual' -DCMAKE_CUDA_HOST_COMPILER=/opt/rh/gcc-toolset-13/root/usr/bin/g++" CUDAFLAGS="-Xfatbin --compress-all" SETUPTOOLS_SCM_PRETEND_VERSION="${{ steps.version.outputs.version }}"