This commit is contained in:
hailin 2025-08-05 17:05:14 +08:00
parent 61962c074b
commit 0b75bf040e
1 changed files with 10 additions and 9 deletions

View File

@@ -212,13 +212,6 @@ class EmbeddingRequest(BaseModel):
model: str = "text-embedding-bge-m3" model: str = "text-embedding-bge-m3"
def _encode(texts: List[str]):
"""
单次请求
1. 子进程跑 GPU 推理成功返回
2. 若子进程 OOM / CUDA Error 同一次请求 fallback CPU
绝不改全局状态其他并发请求不受影响
"""
# ③ -------- _encode() 里 worker 调用 -------- # ③ -------- _encode() 里 worker 调用 --------
def _worker(t, q): def _worker(t, q):
try: try:
@@ -228,6 +221,14 @@ def _encode(texts: List[str]):
except Exception as e: except Exception as e:
q.put(("err", str(e))) q.put(("err", str(e)))
def _encode(texts: List[str]):
"""
单次请求
1. 子进程跑 GPU 推理成功返回
2. 若子进程 OOM / CUDA Error 同一次请求 fallback CPU
绝不改全局状态其他并发请求不受影响
"""
q = mp.Queue() q = mp.Queue()
p = mp.Process(target=_worker, args=(texts, q)) p = mp.Process(target=_worker, args=(texts, q))
p.start() p.start()