From 17a102de0bbd6920bf6e3b94b85e0c9156c36414 Mon Sep 17 00:00:00 2001 From: hailin Date: Fri, 4 Jul 2025 08:41:46 +0800 Subject: [PATCH] . --- Dockerfile | 8 +------- 1 file changed, 1 insertion(+), 7 deletions(-) diff --git a/Dockerfile b/Dockerfile index e3241c2..df60a5f 100644 --- a/Dockerfile +++ b/Dockerfile @@ -82,11 +82,6 @@ RUN pip install . && \ WORKDIR /opt RUN pip download --only-binary=:all: --no-deps vllm==0.9.1 -d /tmp/vllm_wheels -# 编译安装compressed_tensors -RUN git clone https://github.com/vllm-project/compressed-tensors.git && \ - cd compressed-tensors && \ - pip install . && \ - python3 -m pip wheel . --no-deps -w /tmp/compressed_tensors_wheels # ── 编译你本地 sglang 源码并打 wheel ─────────────────────────────────────── COPY ./sglang /sgl/sglang @@ -102,14 +97,13 @@ RUN mkdir -p /wheels && \ cp /opt/flashinfer/dist/flashinfer_python-*.whl /wheels/ && \ cp /tmp/vllm_wheels/vllm-*.whl /wheels/ && \ cp /tmp/sg_wheels/sglang-*.whl /wheels/ && \ - cp /tmp/compressed_tensors/compressed_tensors*.whl /wheels/ && \ pip wheel filelock typing-extensions sympy fsspec jinja2 networkx -w /wheels # ── ✅ 再打包 runtime 阶段必需依赖 ──────────────────────────────────────────── RUN pip wheel \ pydantic orjson psutil pyzmq pynvml \ transformers==4.52.0 uvicorn fastapi IPython aiohttp \ - setproctitle uvloop sentencepiece triton pillow cachetools msgspec blake3 cloudpickle \ + setproctitle uvloop sentencepiece triton pillow cachetools msgspec blake3 cloudpickle compressed-tensors \ -w /wheels ###############################################################################