Skip to content

Commit 862f9ef

Browse files
committed
chore: update
1 parent b8dbbfe commit 862f9ef

File tree

2 files changed

+8
-3
lines changed

2 files changed

+8
-3
lines changed

examples/aime_eval.py

Lines changed: 7 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -65,7 +65,12 @@ def _create_sglang_factory(model_id: str | None, sglang_base_url: str) -> ModelF
6565

6666
tokenizer = AutoTokenizer.from_pretrained(model_id, trust_remote_code=True)
6767
client = SGLangClient(base_url)
68-
return sglang_model_factory(model_id=model_id, tokenizer=tokenizer, client=client)
68+
return sglang_model_factory(
69+
model_id=model_id,
70+
tokenizer=tokenizer,
71+
client=client,
72+
sampling_params={"max_new_tokens": 16384, "temperature": 0.7, "top_p": 0.95, "top_k": 20},
73+
)
6974

7075

7176
def _create_bedrock_factory(model_id: str | None) -> ModelFactory:
@@ -131,7 +136,7 @@ async def run_eval(
131136
reward_fn = MathRewardFunction()
132137

133138
async def env_factory(_):
134-
env = SimpleMathEnv(model_factory=model_factory, reward_fn=reward_fn)
139+
env = SimpleMathEnv(model_factory=model_factory, reward_fn=reward_fn, verbose=False)
135140
env.get_tools = lambda: []
136141
return env
137142

examples/math_env.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -77,7 +77,7 @@ def _create_sglang_factory(model_id: str | None, sglang_base_url: str) -> ModelF
7777
def _create_bedrock_factory(model_id: str | None) -> ModelFactory:
7878
import boto3
7979

80-
model_id = model_id or "us.anthropic.claude-sonnet-4-20250514"
80+
model_id = model_id or "us.anthropic.claude-sonnet-4-20250514-v1:0"
8181
click.echo(f"Using Bedrock model: {model_id}")
8282
return bedrock_model_factory(model_id=model_id, boto_session=boto3.Session())
8383

0 commit comments

Comments
 (0)