From bdc1d769e899ba842f554baae71dac78ba07ce12 Mon Sep 17 00:00:00 2001
From: Nick
Date: Fri, 26 Dec 2025 12:09:57 +1300
Subject: [PATCH] Set TORCH_CUDA_ARCH_LIST for SageAttention build
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Build runner has no GPU, so specify target architectures explicitly.

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude Opus 4.5
---
Reviewer notes (this region sits outside the commit message):
  * Line structure was restored from a copy in which all newlines had been
    collapsed. The indentation of the RUN continuation lines in the hunk
    context is assumed to be four spaces; if the hunk does not match,
    retry with `git apply --ignore-whitespace` -- TODO confirm against the
    real Dockerfile.
  * The From: and Co-Authored-By: lines carry no e-mail address in this
    copy; `git am` may reject the patch until the author address is
    restored -- TODO confirm.

 Dockerfile | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/Dockerfile b/Dockerfile
index 8b93350..448a955 100644
--- a/Dockerfile
+++ b/Dockerfile
@@ -65,6 +65,8 @@ WORKDIR /tmp
 ENV EXT_PARALLEL=4
 ENV NVCC_APPEND_FLAGS="--threads 8"
 ENV MAX_JOBS=32
+# Target RunPod GPU architectures: A100(8.0), RTX 30xx(8.6), RTX 40xx(8.9), H100(9.0)
+ENV TORCH_CUDA_ARCH_LIST="8.0;8.6;8.9;9.0"
 RUN git clone https://github.com/thu-ml/SageAttention.git && \
     cd SageAttention && \
     pip install --no-build-isolation . && \