import gradio as gr


def run_eval(inputs, native, other, outputs) -> str:
    """Build a plain-text summary of the selections made in the UI.

    No evaluation is actually performed here; the function only formats
    the four arguments into a multi-line report framed by start/finish
    markers.

    Args:
        inputs: Value of the input-source selector.
        native: Value of the native-module selector.
        other: Value of the external-backend selector.
        outputs: Value of the output-format selector.

    Returns:
        The report text. It begins with a newline so the first marker
        appears on its own line.
    """
    report_lines = [
        "",  # leading empty entry yields the initial "\n" after joining
        "[Eval Started]",
        f"Inputs: {inputs}",
        f"Native Modules: {native}",
        f"Other Backends: {other}",
        f"Outputs: {outputs}",
        "[Eval Finished]",
    ]
    return "\n".join(report_lines)


with gr.Blocks(title="EvalScope 全功能界面") as demo:
    # Top section: input-source selection.
    with gr.Group(), gr.Row():
        input_choices = gr.CheckboxGroup(
            label="选择输入源",
            choices=["API Models", "Local Models", "Benchmarks", "Custom Datasets"],
        )

    # Middle section: two side-by-side columns (native modules / backends).
    with gr.Row():
        with gr.Column(), gr.Group():
            native_choices = gr.CheckboxGroup(
                label="启用本地模块",
                choices=["Model Adapter", "Data Adapter", "Evaluator", "Perf Monitor"],
            )
        with gr.Column(), gr.Group():
            other_choices = gr.CheckboxGroup(
                label="启用外部后端",
                choices=["OpenCompass", "VLMEvalKit", "RAGAS", "MTEB/CMTEB"],
            )

    # Bottom section: output-format selection.
    with gr.Group(), gr.Row():
        output_choices = gr.CheckboxGroup(
            label="输出形式",
            choices=["Evaluation Report", "Gradio", "WandB", "Swanlab"],
        )

    run_button = gr.Button("Run Evaluation")
    output_text = gr.Textbox(label="执行结果", lines=10)

    # Clicking the button sends the four selector values to run_eval and
    # shows the returned text in the result box.
    run_button.click(
        run_eval,
        inputs=[input_choices, native_choices, other_choices, output_choices],
        outputs=output_text,
    )


if __name__ == "__main__":
    demo.launch(server_name="0.0.0.0", server_port=7900)