vllm-project · DarkLight1337 · Sep 30, 2025 · Sep 29, 2025 · Sep 29, 2025
@@ -2467,7 +2467,7 @@ def propose_draft_token_ids(sampled_token_ids):
             effective_drafter_max_model_len = (
                 self.speculative_config.draft_model_config.max_model_len)
         input_fits_in_drafter = spec_decode_common_attn_metadata and (
-            spec_decode_common_attn_metadata.seq_lens.max() +
+            spec_decode_common_attn_metadata.max_seq_len +
             self.speculative_config.num_speculative_tokens
             <= effective_drafter_max_model_len)
         if use_padded_batch_for_eagle and input_fits_in_drafter: