
Commit 3f9d049

Author: DevakiBolleneni
Commit message: try build flashattention
1 parent: 79da555

File tree: 1 file changed (+1, -1 lines)

pytorch/training/docker/2.9/py3/cu130/Dockerfile.arm64.gpu (1 addition, 1 deletion)

@@ -240,7 +240,7 @@ ENV LD_PRELOAD="/usr/local/lib/libnccl.so"
 ENV NVTE_FRAMEWORK=pytorch
 # Install flash-attn using instructions from https://github.com/Dao-AILab/flash-attention#installation-and-features
 # Set MAX_JOBS=4 to avoid OOM issues in installation process
-RUN MAX_JOBS=8 pip install --no-cache-dir flash-attn==${FLASH_ATTN_VERSION} --no-build-isolation --verbose
+RUN MAX_JOBS=4 pip install --no-cache-dir flash-attn==${FLASH_ATTN_VERSION} --verbose
 # Install TE using instructions from https://docs.nvidia.com/deeplearning/transformer-engine/user-guide/installation.html
 RUN pip install --no-cache-dir git+https://github.com/NVIDIA/TransformerEngine.git@release_v${TE_VERSION} --no-build-isolation
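The functional change is twofold: MAX_JOBS drops from 8 to 4 (bringing the command in line with the comment above it), and --no-build-isolation is removed from the flash-attn install. MAX_JOBS caps the number of parallel compile jobs while flash-attn's CUDA kernels are built from source, so a lower value trades build speed for lower peak memory, which is how it avoids the OOM the comment mentions. PyTorch's extension builder (torch.utils.cpp_extension) honors this environment variable; the helper below is an illustrative sketch of that lookup convention, not torch's actual code:

```python
import os

def max_jobs(default: int) -> int:
    """Return the parallel-build cap, honoring the MAX_JOBS env var.

    Hypothetical helper mirroring the convention used by PyTorch's
    C++/CUDA extension builder, which flash-attn's build relies on:
    if MAX_JOBS is set to an integer, it caps the job count; otherwise
    a default (often the CPU count) is used.
    """
    val = os.environ.get("MAX_JOBS")
    if val is not None and val.isdigit():
        return int(val)
    return default

os.environ["MAX_JOBS"] = "4"          # as in the updated Dockerfile line
print(max_jobs(os.cpu_count() or 1))  # prints 4
```

With MAX_JOBS unset, the builder would fall back to the default, which on a many-core build host is what drives memory use high enough to OOM.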

0 commit comments
