# Listing metadata: 51 lines, 1.6 KiB, Python
import gradio as gr


def run_eval(inputs, native, other, outputs):
    """Build the text summary displayed when the run button is clicked.

    The function does not launch any evaluation itself; it only echoes the
    four selections back between ``[Eval Started]`` and ``[Eval Finished]``
    markers.

    Args:
        inputs: Selected input sources.
        native: Selected native modules.
        other: Selected external backends.
        outputs: Selected output forms.

    Returns:
        A multi-line string that starts with a newline, lists each selection
        on its own labelled line, and ends with ``[Eval Finished]`` (no
        trailing newline).
    """
    # Each value is interpolated with its default string form, so a list
    # selection is rendered like ``['API Models']``.
    # Only the lines that interpolate a value need the ``f`` prefix.
    result = (
        "\n[Eval Started]\n"
        f"Inputs: {inputs}\n"
        f"Native Modules: {native}\n"
        f"Other Backends: {other}\n"
        f"Outputs: {outputs}\n"
        "[Eval Finished]"
    )
    return result


# Declarative UI: four checkbox groups feed `run_eval`, whose returned text is
# shown in a textbox.
# NOTE(review): the nesting below was reconstructed from a listing whose
# indentation had been lost — confirm that both columns belong to the same
# row and that the button/textbox sit directly under the Blocks root.
with gr.Blocks(title="EvalScope 全功能界面") as demo:
    # Input source selection.
    with gr.Group():
        with gr.Row():
            input_choices = gr.CheckboxGroup(
                label="选择输入源",
                choices=["API Models", "Local Models", "Benchmarks", "Custom Datasets"],
            )

    # Native modules and external backends, one column each.
    with gr.Row():
        with gr.Column():
            with gr.Group():
                native_choices = gr.CheckboxGroup(
                    label="启用本地模块",
                    choices=["Model Adapter", "Data Adapter", "Evaluator", "Perf Monitor"],
                )

        with gr.Column():
            with gr.Group():
                other_choices = gr.CheckboxGroup(
                    label="启用外部后端",
                    choices=["OpenCompass", "VLMEvalKit", "RAGAS", "MTEB/CMTEB"],
                )

    # Output form selection.
    with gr.Group():
        with gr.Row():
            output_choices = gr.CheckboxGroup(
                label="输出形式",
                choices=["Evaluation Report", "Gradio", "WandB", "Swanlab"],
            )

    run_button = gr.Button("Run Evaluation")
    output_text = gr.Textbox(label="执行结果", lines=10)

    # The order of `inputs` matches run_eval's positional parameters
    # (inputs, native, other, outputs).
    run_button.click(
        run_eval,
        inputs=[input_choices, native_choices, other_choices, output_choices],
        outputs=output_text,
    )


if __name__ == '__main__':
    # Start the web server only when the file is run as a script, not when it
    # is imported. The host "0.0.0.0" and port 7900 are passed straight to
    # Gradio; binding to 0.0.0.0 normally makes the app reachable from other
    # machines on the network, so confirm that exposure is intended.
    demo.launch(server_name="0.0.0.0", server_port=7900)