diff --git a/gradio_ui.py b/gradio_ui.py
index 90d0cc0..c746740 100644
--- a/gradio_ui.py
+++ b/gradio_ui.py
@@ -3,13 +3,12 @@ import gradio as gr
 import subprocess
 
 def run_eval(inputs, native, other, outputs, api_url, api_token):
-    timestamp = time.strftime("%Y%m%d-%H%M%S")  # 生成当前时间戳作为 model 名
-
+    timestamp = time.strftime("%Y%m%d-%H%M%S")
     command = [
         "evalscope", "perf",
         "--url", api_url.strip(),
         "--api", "openai",
-        "--model", timestamp,  # ✅ 使用时间戳作为 --model
+        "--model", timestamp,
         "--dataset", "openqa",
         "--max-tokens", "1024",
         "--min-tokens", "1024",
@@ -19,16 +18,23 @@ def run_eval(inputs, native, other, outputs, api_url, api_token):
         "--api-key", api_token.strip(),
     ]
 
-    yield f"[Eval Started @ {timestamp}]\n"
+    full_output = f"[Eval Started @ {timestamp}]\n"
+    yield full_output
     try:
         process = subprocess.Popen(command, stdout=subprocess.PIPE, stderr=subprocess.STDOUT, text=True, bufsize=1)
         for line in process.stdout:
-            yield line
+            full_output += line
+            yield full_output  # ✅ yield the full accumulated output on every update
         process.stdout.close()
         process.wait()
     except Exception as e:
-        yield f"[Error] {str(e)}\n"
-    yield "[Eval Finished]\n"
+        full_output += f"[Error] {str(e)}\n"
+        yield full_output
+    full_output += "[Eval Finished]\n"
+    yield full_output
+
+
+
 def enforce_input_exclusive_and_toggle_fields(selected):
     group1 = {"API Models", "Local Models"}
     group2 = {"Benchmarks", "Custom Datasets"}