diff --git a/.buildkite/test-pipeline.yaml b/.buildkite/test-pipeline.yaml index d11a43377548..5198f888c976 100644 --- a/.buildkite/test-pipeline.yaml +++ b/.buildkite/test-pipeline.yaml @@ -867,7 +867,7 @@ steps: - pytest -s -v tests/quantization/test_blackwell_moe.py - label: Blackwell LM Eval Small Models - timeout_in_minutes: 75 + timeout_in_minutes: 120 gpu: b200 optional: true # run on nightlies source_file_dependencies: diff --git a/tests/evals/gsm8k/configs/Qwen3-30B-A3B-NVFP4.yaml b/tests/evals/gsm8k/configs/Qwen3-30B-A3B-NVFP4.yaml new file mode 100644 index 000000000000..6b7bdd1e65bb --- /dev/null +++ b/tests/evals/gsm8k/configs/Qwen3-30B-A3B-NVFP4.yaml @@ -0,0 +1,6 @@ +model_name: "nvidia/Qwen3-30B-A3B-FP4" +accuracy_threshold: 0.89 +num_questions: 1319 +num_fewshot: 5 +max_model_len: 4096 + diff --git a/tests/evals/gsm8k/configs/models-blackwell.txt b/tests/evals/gsm8k/configs/models-blackwell.txt index e577645d60d6..3c9b1084de7b 100644 --- a/tests/evals/gsm8k/configs/models-blackwell.txt +++ b/tests/evals/gsm8k/configs/models-blackwell.txt @@ -2,3 +2,4 @@ Qwen3-0.6B-FP8.yaml Qwen2.5-VL-3B-Instruct-FP8-dynamic.yaml Qwen1.5-MoE-W4A16-CT.yaml DeepSeek-V2-Lite-Instruct-FP8.yaml +Qwen3-30B-A3B-NVFP4.yaml