This commit is contained in:
hailin 2025-09-19 14:51:11 +08:00
parent f51605ad62
commit 662f4e8815
1 changed files with 3 additions and 2 deletions

View File

@ -82,7 +82,7 @@ RUN python3 -m pip install --no-cache-dir numpy requests build "cuda-python>=12.
python3 -m build --no-isolation --wheel && \ python3 -m build --no-isolation --wheel && \
ls -lh dist/ ls -lh dist/
COPY ./sglang /sgl/sglang
# # ── 🔄 下载 sgl-kernel与 sglang 同步)─────────────────────────────────────── # # ── 🔄 下载 sgl-kernel与 sglang 同步)───────────────────────────────────────
# RUN pip download --only-binary=:all: --no-deps sgl-kernel==0.3.9.post2 -d /tmp/sgl_kernel_wheels # RUN pip download --only-binary=:all: --no-deps sgl-kernel==0.3.9.post2 -d /tmp/sgl_kernel_wheels
@ -103,6 +103,7 @@ RUN bash -lc '\
/usr/local/cuda/bin/ptxas --version \ /usr/local/cuda/bin/ptxas --version \
' '
# 限制构建并行;避免 ptxas 多线程崩溃 # 限制构建并行;避免 ptxas 多线程崩溃
ENV CMAKE_BUILD_PARALLEL_LEVEL=8 ENV CMAKE_BUILD_PARALLEL_LEVEL=8
ENV SGL_KERNEL_COMPILE_THREADS=1 ENV SGL_KERNEL_COMPILE_THREADS=1
@ -136,7 +137,7 @@ RUN pip download --only-binary=:all: --no-deps vllm==0.9.1 -d /tmp/vllm_wheels
# ── 编译你本地 sglang 源码并打 wheel ─────────────────────────────────────── # ── 编译你本地 sglang 源码并打 wheel ───────────────────────────────────────
COPY ./sglang /sgl/sglang # COPY ./sglang /sgl/sglang
# WORKDIR /sgl/sglang/python # WORKDIR /sgl/sglang/python
# RUN python3 -m pip install ".[srt,openai]" --no-build-isolation && \ # RUN python3 -m pip install ".[srt,openai]" --no-build-isolation && \
# python3 -m pip wheel ".[srt,openai]" --no-deps -w /tmp/sg_wheels # python3 -m pip wheel ".[srt,openai]" --no-deps -w /tmp/sg_wheels