Skip to content

Commit ef192de

Browse files
lc5211 authored and The tunix Authors committed
[Tunix] Default degenerate_group_masking to false.
PiperOrigin-RevId: 926128256
1 parent 43cb3bd commit ef192de

1 file changed

Lines changed: 1 addition & 1 deletion

File tree

tunix/rl/agentic/agentic_grpo_learner.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -107,7 +107,7 @@ class GRPOConfig(agentic_rl_learner.AgenticRLConfig):
107 107   epsilon_high: float | None = None # 0.28 from DAPO.
108 108   off_policy_steps: int = 0
109 109   degenerate_group_masking: bool = (
110     - True # Whether to mask out degenerate groups with all-0 advantages.
    110 + False # Whether to mask out degenerate groups with all-0 advantages.
111 111   )
112 112   use_rollout_logps: bool = True
113 113   # Truncated importance-sampling (TIS) correction for the residual mismatch
# Truncated importance-sampling (TIS) correction for the residual mismatch

0 commit comments

Comments (0)