This commit is contained in:
parent
c5e4ef4a6d
commit
a2a93c7c4c
|
|
@ -160,7 +160,7 @@ RUN chmod +x /tini
|
||||||
ENTRYPOINT ["/tini", "--"]
|
ENTRYPOINT ["/tini", "--"]
|
||||||
|
|
||||||
# ---- 拷贝模型(路径可换) ----
|
# ---- 拷贝模型(路径可换) ----
|
||||||
COPY ./Alibaba/Qwen3-32B /root/.cradle/Alibaba/Qwen3-32B
|
COPY ./Alibaba/Qwen3-14B /root/.cradle/Alibaba/Qwen3-14B
|
||||||
|
|
||||||
HEALTHCHECK --interval=30s --timeout=2s --start-period=300s --retries=5 CMD curl -fs http://localhost:30000/health || exit 1
|
HEALTHCHECK --interval=30s --timeout=2s --start-period=300s --retries=5 CMD curl -fs http://localhost:30000/health || exit 1
|
||||||
|
|
||||||
|
|
@ -171,7 +171,7 @@ EXPOSE 30000
|
||||||
CMD ["python3", "-m", "sglang.launch_server", \
|
CMD ["python3", "-m", "sglang.launch_server", \
|
||||||
"--host", "0.0.0.0", \
|
"--host", "0.0.0.0", \
|
||||||
"--port", "30000", \
|
"--port", "30000", \
|
||||||
"--model-path", "/root/.cradle/Alibaba/Qwen3-32B/", \
|
"--model-path", "/root/.cradle/Alibaba/Qwen3-14B/", \
|
||||||
"--tp", "4", \
|
"--tp", "2", \
|
||||||
"--api-key", "token-abc123", \
|
"--api-key", "token-abc123", \
|
||||||
"--enable-metrics"]
|
"--enable-metrics"]
|
||||||
|
|
@ -160,7 +160,7 @@ RUN chmod +x /tini
|
||||||
ENTRYPOINT ["/tini", "--"]
|
ENTRYPOINT ["/tini", "--"]
|
||||||
|
|
||||||
# ---- 拷贝模型(路径可换) ----
|
# ---- 拷贝模型(路径可换) ----
|
||||||
COPY ./Alibaba/Qwen3-14B /root/.cradle/Alibaba/Qwen3-14B
|
COPY ./Alibaba/Qwen3-32B /root/.cradle/Alibaba/Qwen3-32B
|
||||||
|
|
||||||
HEALTHCHECK --interval=30s --timeout=2s --start-period=300s --retries=5 CMD curl -fs http://localhost:30000/health || exit 1
|
HEALTHCHECK --interval=30s --timeout=2s --start-period=300s --retries=5 CMD curl -fs http://localhost:30000/health || exit 1
|
||||||
|
|
||||||
|
|
@ -171,7 +171,7 @@ EXPOSE 30000
|
||||||
CMD ["python3", "-m", "sglang.launch_server", \
|
CMD ["python3", "-m", "sglang.launch_server", \
|
||||||
"--host", "0.0.0.0", \
|
"--host", "0.0.0.0", \
|
||||||
"--port", "30000", \
|
"--port", "30000", \
|
||||||
"--model-path", "/root/.cradle/Alibaba/Qwen3-14B/", \
|
"--model-path", "/root/.cradle/Alibaba/Qwen3-32B/", \
|
||||||
"--tp", "1", \
|
"--tp", "4", \
|
||||||
"--api-key", "token-abc123", \
|
"--api-key", "token-abc123", \
|
||||||
"--enable-metrics"]
|
"--enable-metrics"]
|
||||||
Loading…
Reference in New Issue