Commit 4020798

'megapak's Fix for SageAttention

1 parent 84998aa · commit 4020798
File tree: 2 files changed (+8, −6 lines)


cu126-megapak/Dockerfile

Lines changed: 4 additions & 3 deletions
@@ -295,11 +295,12 @@ RUN --mount=type=cache,target=/root/.cache/pip \
 RUN --mount=type=cache,target=/root/.cache/pip \
     # Update UV
     pip install -U uv \
-    # SageAttention needs PyTorch to build with
-    && pip install sageattention --no-build-isolation \
     # Nunchaku version needs to sync with PyTorch version
     && pip install \
-        https://github.com/nunchaku-tech/nunchaku/releases/download/v1.0.1/nunchaku-1.0.1+torch2.8-cp312-cp312-linux_x86_64.whl
+        https://github.com/nunchaku-tech/nunchaku/releases/download/v1.0.1/nunchaku-1.0.1+torch2.8-cp312-cp312-linux_x86_64.whl \
+    # SageAttention needs PyTorch to build with
+    && export MAX_JOBS=4 TORCH_CUDA_ARCH_LIST="5.0;6.0;7.0;7.5;8.0;8.6;9.0" \
+    && pip install sageattention --no-build-isolation
 
 # Notes on FlashAttention:
 # <xformers 0.0.32.post2> requires <flash-attn [2.7.1, 2.8.2]>,
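The reordering matters because `pip install sageattention --no-build-isolation` compiles against whatever PyTorch is already present in the environment, while the two exported variables cap compile parallelism and pin which CUDA architectures get built. A minimal sketch of how such variables are conventionally read by a CUDA-extension build (the names and the split-on-";" format follow the common `torch.utils.cpp_extension` convention; that sageattention's build script treats them the same way is an assumption):

```python
import os

# Values from the cu126 Dockerfile fix above.
os.environ["MAX_JOBS"] = "4"
os.environ["TORCH_CUDA_ARCH_LIST"] = "5.0;6.0;7.0;7.5;8.0;8.6;9.0"

# MAX_JOBS limits parallel nvcc/compiler jobs (keeps memory use bounded
# inside the docker build); TORCH_CUDA_ARCH_LIST is a ";"-separated list
# of target SM compute capabilities.
max_jobs = int(os.environ["MAX_JOBS"])
archs = os.environ["TORCH_CUDA_ARCH_LIST"].split(";")
print(max_jobs, archs)
```

Without `TORCH_CUDA_ARCH_LIST`, such builds typically compile only for the architectures detected on the build machine, which is why the image pins the list explicitly.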

cu128-megapak/Dockerfile

Lines changed: 4 additions & 3 deletions
@@ -295,11 +295,12 @@ RUN --mount=type=cache,target=/root/.cache/pip \
 RUN --mount=type=cache,target=/root/.cache/pip \
     # Update UV
     pip install -U uv \
-    # SageAttention needs PyTorch to build with
-    && pip install sageattention --no-build-isolation \
     # Nunchaku version needs to sync with PyTorch version
     && pip install \
-        https://github.com/nunchaku-tech/nunchaku/releases/download/v1.0.1/nunchaku-1.0.1+torch2.8-cp312-cp312-linux_x86_64.whl
+        https://github.com/nunchaku-tech/nunchaku/releases/download/v1.0.1/nunchaku-1.0.1+torch2.8-cp312-cp312-linux_x86_64.whl \
+    # SageAttention needs PyTorch to build with
+    && export MAX_JOBS=4 TORCH_CUDA_ARCH_LIST="7.0;7.5;8.0;8.6;9.0;10.0;12.0" \
+    && pip install sageattention --no-build-isolation
 
 # Notes on FlashAttention:
 # <xformers 0.0.32.post2> requires <flash-attn [2.7.1, 2.8.2]>,
