From 8be830f035c8b4c481ba8445305c2832d4402913 Mon Sep 17 00:00:00 2001
From: hailin
Date: Wed, 17 Sep 2025 17:23:53 +0800
Subject: [PATCH] Dockerfile: add nvidia-nvshmem-cu12 to FlashInfer build deps

Install the "nvidia-nvshmem-cu12" pip package together with the other
build-time dependencies (numpy, requests, build, cuda-python, pynvml)
in the RUN step that executes `python3 -m flashinfer.aot` and then
builds the FlashInfer wheel with `python3 -m build --no-isolation`.
---
Notes (this section is ignored by `git am`):

 * Presumably the AOT pre-compilation step needs NVSHMEM to be present;
   the patch itself does not say so. TODO: confirm and record the reason.
 * The package is added without a version constraint; consider pinning
   it once a known-good version has been verified.
 * The non-English comment inside the hunk is a context line and must
   match the target Dockerfile byte-for-byte, so it is left untouched.
 * The indentation of the RUN continuation lines below is assumed to be
   four spaces; verify it against the Dockerfile, or apply with
   `git apply --ignore-whitespace` if the hunk is rejected.

 Dockerfile | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/Dockerfile b/Dockerfile
index 53f3e6bc1..ad0dec3da 100644
--- a/Dockerfile
+++ b/Dockerfile
@@ -77,7 +77,7 @@ WORKDIR /opt/flashinfer
 ENV FLASHINFER_CUDA_ARCH_LIST="7.5 8.0 8.6 8.9 9.0a"
 
 # 先做 AOT 预编译,再直接打 wheel(不隔离,使用同一份自编 torch)
-RUN python3 -m pip install --no-cache-dir numpy requests build "cuda-python>=12.0,<13" pynvml && \
+RUN python3 -m pip install --no-cache-dir numpy requests build "cuda-python>=12.0,<13" "nvidia-nvshmem-cu12" pynvml && \
     python3 -m flashinfer.aot && \
     python3 -m build --no-isolation --wheel && \
     ls -lh dist/