From 4c79f1faf1726db8aed08df1dbe23a5265b13c31 Mon Sep 17 00:00:00 2001
From: Qubitium
Date: Mon, 27 Oct 2025 08:14:23 +0000
Subject: [PATCH] update scores

---
 tests/models/test_qwen2_5.py | 10 +++-------
 1 file changed, 3 insertions(+), 7 deletions(-)

diff --git a/tests/models/test_qwen2_5.py b/tests/models/test_qwen2_5.py
index e2ef3c0b8..ae194898c 100644
--- a/tests/models/test_qwen2_5.py
+++ b/tests/models/test_qwen2_5.py
@@ -19,17 +19,13 @@ class TestQwen2_5(ModelTest):
     EVAL_BATCH_SIZE = 64
     EVAL_TASKS = {
         EVAL.LM_EVAL.ARC_CHALLENGE: {
-            "chat_template": True,
-            "acc": {"value": 0.2892, "floor_pct": 0.04},
-            "acc_norm": {"value": 0.3302, "floor_pct": 0.04},
+            "acc": {"value": 0.2910, "floor_pct": 0.04},
+            "acc_norm": {"value": 0.3268, "floor_pct": 0.04},
         },
         EVAL.LM_EVAL.MMLU_STEM: {
-            "acc": {"value": 0.4351, "floor_pct": 0.04},
+            "acc": {"value": 0.3819, "floor_pct": 0.04},
         },
     }
-    #TRUST_REMOTE_CODE = False
-    #APPLY_CHAT_TEMPLATE = True
-    #EVAL_BATCH_SIZE = 6
 
     def test_qwen2_5(self):
         self.quant_lm_eval()