# For vllm script, with -t option (tensor parallel size). # bash ./run-lm-eval-gsm-vllm-baseline.sh -m neuralmagic/Mixtral-8x7B-Instruct-v0.1-FP8 -b "auto" -l 250 -f 5 -t 4 model_name: "neuralmagic/Mixtral-8x7B-Instruct-v0.1-FP8" tasks: - name: "gsm8k" metrics: - name: "exact_match,strict-match" value: 0.624 - name: "exact_match,flexible-extract" value: 0.624 limit: 250 num_fewshot: 5