Skip to content

Commit 5b8c30d

Browse files
authored
[Spec Decode, BugFix] Propagate norm_before_fc from Eagle3 speculator (vllm-project#38111)
Signed-off-by: Shubhra Pandit <shubhra.pandit@gmail.com>
1 parent d39b8da commit 5b8c30d

File tree

1 file changed

+2
-0
lines changed
  • vllm/transformers_utils/configs/speculators

1 file changed

+2
-0
lines changed

vllm/transformers_utils/configs/speculators/algos.py

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -22,6 +22,7 @@ def update_eagle3(config_dict: dict, pre_trained_config: dict) -> None:
22 22
- draft_vocab_size: Size of the draft model's vocabulary
23 23
- target_hidden_size: Hidden size of the target model
24 24
- norm_before_residual: Whether to apply norm before residual connection
25 +
- norm_before_fc: Whether to apply RMSNorm before the fc projection
25 26
- eagle_aux_hidden_state_layer_ids: List of layer indices from the base
26 27
model to use as auxiliary inputs for the Eagle3 drafter. These layers
27 28
provide intermediate hidden states that help the drafter make better
@@ -34,6 +35,7 @@ def update_eagle3(config_dict: dict, pre_trained_config: dict) -> None:
34 35
pre_trained_config["norm_before_residual"] = config_dict.get(
35 36
"norm_before_residual", True
36 37
)
38 +
pre_trained_config["norm_before_fc"] = config_dict.get("norm_before_fc", False)
37 39
pre_trained_config["architectures"] = ["Eagle3LlamaForCausalLM"]
38 40
if config_dict.get("eagle_aux_hidden_state_layer_ids"):
39 41
pre_trained_config["eagle_aux_hidden_state_layer_ids"] = config_dict[

0 commit comments

Comments
 (0)