forked from yuzhTHU/MySRAgent
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathbench_sr_agent.sh
More file actions
executable file
·34 lines (29 loc) · 983 Bytes
/
bench_sr_agent.sh
File metadata and controls
executable file
·34 lines (29 loc) · 983 Bytes
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
#!/usr/bin/env bash
#
# Runs bench_sr_agent.py four times on the same problem list, each time with
# a different LLM model served through the "openrouter" provider.
#
# Usage: ./bench_sr_agent.sh
#
# Both ./venv and bench_sr_agent.py are resolved relative to the current
# working directory, so start the script from the directory containing them.
#
# The runs are independent of each other: a failing run is reported on stderr
# and the remaining runs are still executed. The final status is non-zero if
# the environment could not be activated or if any run failed.
#
# No `exit` and no `set` options are used on purpose, so the file behaves the
# same whether it is executed or sourced into an existing shell.

#######################################
# Activates the conda environment stored in ./venv.
# Outputs:   error messages on stderr
# Returns:   0 on success, 1 if conda is unavailable or activation fails
#######################################
activate_env() {
  local hook

  if ! command -v conda >/dev/null 2>&1; then
    printf 'error: conda not found; cannot activate ./venv\n' >&2
    return 1
  fi

  # `conda activate` is a shell function that only exists once conda's shell
  # hook has been evaluated; a non-interactive script does not get it for
  # free. The hook is captured first so that a failure is not masked by eval.
  if ! hook=$(conda shell.bash hook); then
    printf 'error: "conda shell.bash hook" failed\n' >&2
    return 1
  fi
  eval "$hook"

  if ! conda activate ./venv; then
    printf 'error: could not activate conda environment ./venv\n' >&2
    return 1
  fi
}

#######################################
# Runs one benchmark with the options shared by every run.
# Arguments: $1 - flag used to pass the experiment name
#            $2 - experiment name
#            $3 - value passed to -R
#            $4 - value passed to --llm-model
# Outputs:   a warning on stderr if the run fails
# Returns:   0 on success, 1 if bench_sr_agent.py exits non-zero
#######################################
run_bench() {
  local name_flag=$1
  local exp_name=$2
  local r_value=$3
  local model=$4

  if ! python bench_sr_agent.py \
    --problem_names MatSci2 MatSci19 CRK28 BPG1 PO6 \
    "$name_flag" "$exp_name" \
    --no-skip-existing \
    -L 20 -K 2 -R "$r_value" -C 2 \
    --llm-provider openrouter \
    --llm-model "$model"; then
    printf 'warn: benchmark run "%s" (model %s) failed\n' \
      "$exp_name" "$model" >&2
    return 1
  fi
}

#######################################
# Activates the environment, then performs every benchmark run in order.
# Returns:   0 if everything succeeded, 1 otherwise
#######################################
main() {
  local status=0

  # Without the environment the runs would use an arbitrary python, so stop.
  activate_env || return 1

  # NOTE(review): this run passes --exp_name while the three below pass
  # --name. Both spellings are kept exactly as they were; confirm which one
  # bench_sr_agent.py accepts and unify them.
  run_bench --exp_name guanren_tests 5 \
    qwen/qwen3.5-flash-02-23 || status=1
  run_bench --name guanren_tests_gpt-5.5 1 \
    openai/gpt-5.5 || status=1
  run_bench --name guanren_tests_qwen3.6-plus 1 \
    qwen/qwen3.6-plus || status=1
  run_bench --name guanren_tests_deepseek-v4-pro 1 \
    deepseek/deepseek-v4-pro || status=1

  return "$status"
}

main "$@"