diff --git a/gradio_ui.py b/gradio_ui.py index ace9790..a864421 100644 --- a/gradio_ui.py +++ b/gradio_ui.py @@ -26,9 +26,9 @@ should_stop = False # ---------------- 可选数据集 ---------------- EVAL_DATASETS = [ - "arc", "bbh", "ceval", "cmmlu", "competition_math", "gsm8k", - "hellaswag", "humaneval", "mmlu", "mmlu_pro", "race", - "trivia_qa", "truthful_qa" + "arc", "bbh", "ifeval", "ceval", "cmmlu", "competition_math", "gsm8k", + "hellaswag", "humaneval", "mmlu", "mmlu_redux", "mmlu_pro", "race", + "trivia_qa", "truthful_qa", "tool_bench" ] PERF_DATASETS = [ "openqa", "flickr8k", "longalpaca",