From 40b6d3cf0e4751299080c1d63a859c48c1f670b9 Mon Sep 17 00:00:00 2001
From: Anupam Kumar
Date: Tue, 10 Mar 2026 14:22:21 +0530
Subject: [PATCH] fix: adjust inference params to limit small input repetition

Signed-off-by: Anupam Kumar
---
 config.json | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/config.json b/config.json
index ac5e1f9..d82d550 100644
--- a/config.json
+++ b/config.json
@@ -18,6 +18,8 @@
     "max_batch_size": 8192,
     "sampling_temperature": 0.0001,
     "disable_unk": true,
-    "max_decoding_length": 10000
+    "max_decoding_length": 10000,
+    "repetition_penalty": 1.3,
+    "patience": 1.5
   }
 }