We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent e511d0f, commit ad6e4dc. Copy full SHA for ad6e4dc
prompting/rewards/exact_match.py
@@ -121,8 +121,6 @@ async def reward(
121
122
elif check_idx == eos_idx and completion_length < max_tokens:
123
if eos_token and eos_token not in verification_logits:
124
- # TODO: Make top_k equal to top_logprobs.
125
- # Do not set full penalty since top_k > top_logprobs.
126
penalty = NO_EOS_PENALTY
127
raise ValueError("Partial completion")
128
0 commit comments