This commit is contained in:
hailin 2025-09-17 17:23:53 +08:00
parent d6123b49e6
commit 8be830f035
1 changed file with 1 addition and 1 deletion

View File

@@ -77,7 +77,7 @@ WORKDIR /opt/flashinfer
ENV FLASHINFER_CUDA_ARCH_LIST="7.5 8.0 8.6 8.9 9.0a" ENV FLASHINFER_CUDA_ARCH_LIST="7.5 8.0 8.6 8.9 9.0a"
# 先做 AOT 预编译,再直接打 wheel(不隔离,使用同一份自编 torch) # 先做 AOT 预编译,再直接打 wheel(不隔离,使用同一份自编 torch)
RUN python3 -m pip install --no-cache-dir numpy requests build "cuda-python>=12.0,<13" pynvml && \ RUN python3 -m pip install --no-cache-dir numpy requests build "cuda-python>=12.0,<13" "nvidia-nvshmem-cu12" pynvml && \
python3 -m flashinfer.aot && \ python3 -m flashinfer.aot && \
python3 -m build --no-isolation --wheel && \ python3 -m build --no-isolation --wheel && \
ls -lh dist/ ls -lh dist/