diff --git a/test/test_cuda/test_gguf.py b/test/test_cuda/test_gguf.py index 50bb23aa6..2272651ab 100644 --- a/test/test_cuda/test_gguf.py +++ b/test/test_cuda/test_gguf.py @@ -252,7 +252,7 @@ def test_llama_4(self): ) self.assertAlmostEqual(file_size, 58093.62, delta=1.0) file_size = os.path.getsize(os.path.join(quantized_model_path, "mmproj-model.gguf")) / 1024**2 - self.assertAlmostEqual(file_size, 3323.52, delta=1.0) + self.assertAlmostEqual(file_size, 3326.18, delta=5.0) shutil.rmtree(quantized_model_path, ignore_errors=True)