From 452ea11b76888dc75c24861c490fc2fb3ef25cde Mon Sep 17 00:00:00 2001
From: freeliuzc
Date: Thu, 11 Sep 2025 21:02:43 +0800
Subject: [PATCH 1/2] support rl reshard

---
 fastdeploy/config.py              | 1 +
 fastdeploy/multimodal/registry.py | 1 +
 fastdeploy/rl/rollout_config.py   | 2 ++
 3 files changed, 4 insertions(+)

diff --git a/fastdeploy/config.py b/fastdeploy/config.py
index ce794435e4b..4beaffc2c92 100644
--- a/fastdeploy/config.py
+++ b/fastdeploy/config.py
@@ -134,6 +134,7 @@ def __init__(
         self.lm_head_fp32: bool = False
         self.model_format = "auto"
         self.partial_rotary_factor: float = 1.0
+        self.num_nextn_predict_layers = 0
         for key, value in args.items():
             if hasattr(self, key) and value != "None":
                 setattr(self, key, value)
diff --git a/fastdeploy/multimodal/registry.py b/fastdeploy/multimodal/registry.py
index ab6c701ddc7..452ef84d713 100644
--- a/fastdeploy/multimodal/registry.py
+++ b/fastdeploy/multimodal/registry.py
@@ -24,6 +24,7 @@ class MultimodalRegistry:
         "Ernie4_5_VLMoeForConditionalGeneration",
         "Ernie5MoeForCausalLM",
         "Qwen2_5_VLForConditionalGeneration",
+        "Ernie5UnifyForCausalLM",
     }
 
     @classmethod
diff --git a/fastdeploy/rl/rollout_config.py b/fastdeploy/rl/rollout_config.py
index d72f4271450..8ec36055cc0 100644
--- a/fastdeploy/rl/rollout_config.py
+++ b/fastdeploy/rl/rollout_config.py
@@ -63,6 +63,7 @@ def __init__(
         local_rank: int = 0,
         moba_attention_config: str = None,
         data_parallel_size: int = 1,
+        num_nextn_predict_layers: int = 0,
     ):
         # Required parameters
         self.model = model_name_or_path
@@ -109,6 +110,7 @@ def __init__(
         self.early_stop_config = early_stop_config
         self.ips = None
         self.moba_attention_config = moba_attention_config
+        self.num_nextn_predict_layers = num_nextn_predict_layers
 
     def __str__(self):
         return "\n".join(f"{k}: {v}" for k, v in self.__dict__.items())

From 88ff1000861afb459fb824ab515fc927d9b172ef Mon Sep 17 00:00:00 2001
From: freeliuzc
Date: Fri, 12 Sep 2025 17:02:18 +0800
Subject: [PATCH 2/2] modify model name

---
 fastdeploy/multimodal/registry.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/fastdeploy/multimodal/registry.py b/fastdeploy/multimodal/registry.py
index 452ef84d713..f014ba55532 100644
--- a/fastdeploy/multimodal/registry.py
+++ b/fastdeploy/multimodal/registry.py
@@ -24,7 +24,7 @@ class MultimodalRegistry:
         "Ernie4_5_VLMoeForConditionalGeneration",
         "Ernie5MoeForCausalLM",
         "Qwen2_5_VLForConditionalGeneration",
-        "Ernie5UnifyForCausalLM",
+        "Ernie5ForCausalLM",
     }
 
     @classmethod