diff --git a/tests/evals/gsm8k/configs/Qwen3.5-0.8B.yaml b/tests/evals/gsm8k/configs/Qwen3.5-0.8B.yaml new file mode 100644 index 000000000000..217d269f3177 --- /dev/null +++ b/tests/evals/gsm8k/configs/Qwen3.5-0.8B.yaml @@ -0,0 +1,5 @@ +model_name: "Qwen/Qwen3.5-0.8B" +accuracy_threshold: 0.375 +num_questions: 1319 +num_fewshot: 5 +server_args: "--enforce-eager --max-model-len 4096" diff --git a/tests/evals/gsm8k/configs/models-small.txt b/tests/evals/gsm8k/configs/models-small.txt index a6a2f6c64f5f..e836c0d02601 100644 --- a/tests/evals/gsm8k/configs/models-small.txt +++ b/tests/evals/gsm8k/configs/models-small.txt @@ -4,4 +4,5 @@ Llama-3-8B-Instruct-nonuniform-CT.yaml Qwen2.5-VL-3B-Instruct-FP8-dynamic.yaml Qwen1.5-MoE-W4A16-CT.yaml DeepSeek-V2-Lite-Instruct-FP8.yaml -Qwen3-30B-A3B-MXFP4A16.yaml \ No newline at end of file +Qwen3-30B-A3B-MXFP4A16.yaml +Qwen3.5-0.8B.yaml