diff --git a/Dockerfile b/Dockerfile
index 4a01b13..f407de0 100644
--- a/Dockerfile
+++ b/Dockerfile
@@ -62,9 +62,9 @@ RUN pip install -r /tmp/requirements.txt && rm -rf /root/.cache/pip
 
 # Compile SageAttention 2.2 from source with no build isolation
 WORKDIR /tmp
-ENV EXT_PARALLEL=4
-ENV NVCC_APPEND_FLAGS="--threads 8"
-ENV MAX_JOBS=32
+ENV EXT_PARALLEL=2
+ENV NVCC_APPEND_FLAGS="--threads 2"
+ENV MAX_JOBS=4
 # Target RunPod GPU architectures: H100/H200(9.0), RTX 5090/Blackwell(10.0)
 ENV TORCH_CUDA_ARCH_LIST="9.0;10.0"
 RUN git clone https://github.com/thu-ml/SageAttention.git && \