This commit is contained in:
hailin 2025-08-05 17:01:05 +08:00
parent 9e0c85b93a
commit 61962c074b
1 changed file with 21 additions and 16 deletions

View File

@@ -179,9 +179,7 @@ tokenizer = AutoTokenizer.from_pretrained(MODEL_PATH)
app = FastAPI()
logger.info("Using SAFE_MIN_FREE_MB = %d MB", SAFE_MIN_FREE_MB)
# ② -------- FastAPI 启动预热 --------
@app.on_event("startup")
def warm_up():
def _warm_worker(t, q):
try:
_ = model.encode(t, return_dense=True, num_processes=1)
@@ -189,6 +187,11 @@ def warm_up():
except Exception as e:
q.put(str(e))
# ② -------- FastAPI 启动预热 --------
@app.on_event("startup")
def warm_up():
logger.info("Warm-up on %s", DEVICE)
try:
texts = ["warmup"]
q = mp.Queue()
p = mp.Process(target=_warm_worker, args=(texts, q))
@@ -199,6 +202,8 @@ def warm_up():
logger.info("Warm-up complete.")
else:
logger.warning("Warm-up failed or timed out.")
except Exception as e:
logger.warning("Warm-up exception: %s", e)