diff --git a/lightllm/server/router/model_infer/mode_backend/chunked_prefill/impl.py b/lightllm/server/router/model_infer/mode_backend/chunked_prefill/impl.py index 35e68136d..2c3cfaf11 100644 --- a/lightllm/server/router/model_infer/mode_backend/chunked_prefill/impl.py +++ b/lightllm/server/router/model_infer/mode_backend/chunked_prefill/impl.py @@ -46,6 +46,8 @@ def __init__(self) -> None: else: self.prefill = self.prefill_normal self.decode = self.decode_normal + + self.classed_req_strict_prefill = False return def infer_loop(self): diff --git a/lightllm/server/router/model_infer/mode_backend/dp_backend/impl.py b/lightllm/server/router/model_infer/mode_backend/dp_backend/impl.py index 8d47d1057..633102571 100644 --- a/lightllm/server/router/model_infer/mode_backend/dp_backend/impl.py +++ b/lightllm/server/router/model_infer/mode_backend/dp_backend/impl.py @@ -58,6 +58,8 @@ def __init__(self) -> None: self.decode = self.decode_overlap else: self.decode = self.decode_normal + + self.classed_req_strict_prefill = False return def infer_loop(self):