From 29de4e141101a199a1062ddb81945321f5b351fd Mon Sep 17 00:00:00 2001 From: hailin Date: Sun, 14 Sep 2025 19:12:27 +0800 Subject: [PATCH] . --- Dockerfile | 2 +- Dockerfile.llm_lora_external => Dockerfile.tmp | 2 +- supervisord.conf | 2 +- 3 files changed, 3 insertions(+), 3 deletions(-) rename Dockerfile.llm_lora_external => Dockerfile.tmp (99%) diff --git a/Dockerfile b/Dockerfile index cd7006e..3c621ad 100644 --- a/Dockerfile +++ b/Dockerfile @@ -172,7 +172,7 @@ RUN chmod +x /tini ENTRYPOINT ["/tini", "--"] # ---- 拷贝模型(路径可换) ---- -COPY ./Alibaba/Qwen3-30B-A3B /root/.cradle/Alibaba/Qwen3-30B-A3B +# COPY ./Alibaba/Qwen3-30B-A3B /root/.cradle/Alibaba/Qwen3-30B-A3B HEALTHCHECK --interval=30s --timeout=2s --start-period=300s --retries=5 CMD curl -fs http://localhost:30000/health || exit 1 diff --git a/Dockerfile.llm_lora_external b/Dockerfile.tmp similarity index 99% rename from Dockerfile.llm_lora_external rename to Dockerfile.tmp index 3c621ad..cd7006e 100644 --- a/Dockerfile.llm_lora_external +++ b/Dockerfile.tmp @@ -172,7 +172,7 @@ RUN chmod +x /tini ENTRYPOINT ["/tini", "--"] # ---- 拷贝模型(路径可换) ---- -# COPY ./Alibaba/Qwen3-30B-A3B /root/.cradle/Alibaba/Qwen3-30B-A3B +COPY ./Alibaba/Qwen3-30B-A3B /root/.cradle/Alibaba/Qwen3-30B-A3B HEALTHCHECK --interval=30s --timeout=2s --start-period=300s --retries=5 CMD curl -fs http://localhost:30000/health || exit 1 diff --git a/supervisord.conf b/supervisord.conf index c494666..eee4c52 100644 --- a/supervisord.conf +++ b/supervisord.conf @@ -5,7 +5,7 @@ logfile_maxbytes=0 loglevel=info [program:sglang] -command=python3 -m sglang.launch_server --host 0.0.0.0 --port 30000 --model-path /root/.cradle/external/llm/ --lora-paths q3=/root/.cradle/external/lora/q3 --tp 4 --api-key token-abc123 --enable-metrics +command=python3 -m sglang.launch_server --host 0.0.0.0 --port 30000 --model-path /root/.cradle/external/llm/ --lora-paths q3=/root/.cradle/external/lora/q3 --disable-radix-cache --tp 4 --api-key token-abc123 --enable-metrics autostart=true autorestart=true stdout_logfile=/dev/stdout