Skip to content

Commit 284f17b

Browse files
committed
config
1 parent 1cf585f commit 284f17b

24 files changed

+72
-72
lines changed

scripts/partial_rollout/deepseek/dapo/run-deepseek-r1-distill-qwen-1.5B-dapo-partial.sh

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -95,7 +95,7 @@ ROLLOUT_ARGS=(
9595
EVAL_ARGS=(
9696
--eval-interval 10
9797
--eval-prompt-data aime ${DATA_DIR}/aime-2024/aime-2024.jsonl
98-
--n-samples-per-eval-prompt 4
98+
--n-samples-per-eval-prompt 16
9999
--eval-max-response-len 16384
100100
--eval-top-p 0.7
101101
)
@@ -138,7 +138,7 @@ OPTIMIZER_ARGS=(
138138

139139
WANDB_ARGS=(
140140
--use-wandb
141-
--wandb-project 4B-amd
141+
--wandb-project APRIL
142142
--wandb-group dapo-deepseek-r1-distill-qwen-1.5B-dapo-partial
143143
--wandb-key ${WANDB_API_KEY}
144144
)
@@ -151,7 +151,7 @@ WANDB_ARGS=(
151151
# )
152152
SGLANG_ARGS=(
153153
--rollout-num-gpus-per-engine 2
154-
--sglang-mem-fraction-static 0.4
154+
--sglang-mem-fraction-static 0.6
155155
)
156156
####################
157157

scripts/partial_rollout/deepseek/dapo/run-deepseek-r1-distill-qwen-1.5B-dapo.sh

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -95,7 +95,7 @@ ROLLOUT_ARGS=(
9595
EVAL_ARGS=(
9696
--eval-interval 10
9797
--eval-prompt-data aime ${DATA_DIR}/aime-2024/aime-2024.jsonl
98-
--n-samples-per-eval-prompt 4
98+
--n-samples-per-eval-prompt 16
9999
--eval-max-response-len 16384
100100
--eval-top-p 0.7
101101
)
@@ -138,7 +138,7 @@ OPTIMIZER_ARGS=(
138138

139139
WANDB_ARGS=(
140140
--use-wandb
141-
--wandb-project 4B-amd
141+
--wandb-project APRIL
142142
--wandb-group dapo-deepseek-r1-distill-qwen-1.5B-dapo
143143
--wandb-key ${WANDB_API_KEY}
144144
)
@@ -151,7 +151,7 @@ WANDB_ARGS=(
151151
# )
152152
SGLANG_ARGS=(
153153
--rollout-num-gpus-per-engine 2
154-
--sglang-mem-fraction-static 0.4
154+
--sglang-mem-fraction-static 0.6
155155
)
156156
####################
157157

scripts/partial_rollout/deepseek/dapo/run-deepseek-r1-distill-qwen-1.5B-deepscaler-partial.sh

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -95,7 +95,7 @@ ROLLOUT_ARGS=(
9595
EVAL_ARGS=(
9696
--eval-interval 10
9797
--eval-prompt-data aime ${DATA_DIR}/aime-2024/aime-2024.jsonl
98-
--n-samples-per-eval-prompt 4
98+
--n-samples-per-eval-prompt 16
9999
--eval-max-response-len 16384
100100
--eval-top-p 0.7
101101
)
@@ -138,7 +138,7 @@ OPTIMIZER_ARGS=(
138138

139139
WANDB_ARGS=(
140140
--use-wandb
141-
--wandb-project 4B-amd
141+
--wandb-project APRIL
142142
--wandb-group deepscaler-deepseek-r1-distill-qwen-1.5B-dapo-partial
143143
--wandb-key ${WANDB_API_KEY}
144144
)
@@ -151,7 +151,7 @@ WANDB_ARGS=(
151151
# )
152152
SGLANG_ARGS=(
153153
--rollout-num-gpus-per-engine 2
154-
--sglang-mem-fraction-static 0.4
154+
--sglang-mem-fraction-static 0.6
155155
)
156156
####################
157157

scripts/partial_rollout/deepseek/dapo/run-deepseek-r1-distill-qwen-1.5B-deepscaler.sh

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -95,7 +95,7 @@ ROLLOUT_ARGS=(
9595
EVAL_ARGS=(
9696
--eval-interval 10
9797
--eval-prompt-data aime ${DATA_DIR}/aime-2024/aime-2024.jsonl
98-
--n-samples-per-eval-prompt 4
98+
--n-samples-per-eval-prompt 16
9999
--eval-max-response-len 16384
100100
--eval-top-p 0.7
101101
)
@@ -138,7 +138,7 @@ OPTIMIZER_ARGS=(
138138

139139
WANDB_ARGS=(
140140
--use-wandb
141-
--wandb-project 4B-amd
141+
--wandb-project APRIL
142142
--wandb-group deepscaler-deepseek-r1-distill-qwen-1.5B-dapo
143143
--wandb-key ${WANDB_API_KEY}
144144
)
@@ -151,7 +151,7 @@ WANDB_ARGS=(
151151
# )
152152
SGLANG_ARGS=(
153153
--rollout-num-gpus-per-engine 2
154-
--sglang-mem-fraction-static 0.4
154+
--sglang-mem-fraction-static 0.6
155155
)
156156
####################
157157

scripts/partial_rollout/deepseek/grpo/run-deepseek-r1-distill-qwen-1.5B-dapo-partial.sh

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -94,7 +94,7 @@ ROLLOUT_ARGS=(
9494
EVAL_ARGS=(
9595
--eval-interval 10
9696
--eval-prompt-data aime ${DATA_DIR}/aime-2024/aime-2024.jsonl
97-
--n-samples-per-eval-prompt 4
97+
--n-samples-per-eval-prompt 16
9898
--eval-max-response-len 16384
9999
--eval-top-p 0.7
100100
)
@@ -137,7 +137,7 @@ OPTIMIZER_ARGS=(
137137

138138
WANDB_ARGS=(
139139
--use-wandb
140-
--wandb-project 4B-amd
140+
--wandb-project APRIL
141141
--wandb-group dapo-deepseek-r1-distill-qwen-1.5B-grpo-partial
142142
--wandb-key ${WANDB_API_KEY}
143143
)
@@ -150,7 +150,7 @@ WANDB_ARGS=(
150150
# )
151151
SGLANG_ARGS=(
152152
--rollout-num-gpus-per-engine 2
153-
--sglang-mem-fraction-static 0.4
153+
--sglang-mem-fraction-static 0.6
154154
)
155155
####################
156156

scripts/partial_rollout/deepseek/grpo/run-deepseek-r1-distill-qwen-1.5B-dapo.sh

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -94,7 +94,7 @@ ROLLOUT_ARGS=(
9494
EVAL_ARGS=(
9595
--eval-interval 10
9696
--eval-prompt-data aime ${DATA_DIR}/aime-2024/aime-2024.jsonl
97-
--n-samples-per-eval-prompt 4
97+
--n-samples-per-eval-prompt 16
9898
--eval-max-response-len 16384
9999
--eval-top-p 0.7
100100
)
@@ -137,7 +137,7 @@ OPTIMIZER_ARGS=(
137137

138138
WANDB_ARGS=(
139139
--use-wandb
140-
--wandb-project 4B-amd
140+
--wandb-project APRIL
141141
--wandb-group dapo-deepseek-r1-distill-qwen-1.5B-grpo
142142
--wandb-key ${WANDB_API_KEY}
143143
)
@@ -150,7 +150,7 @@ WANDB_ARGS=(
150150
# )
151151
SGLANG_ARGS=(
152152
--rollout-num-gpus-per-engine 2
153-
--sglang-mem-fraction-static 0.4
153+
--sglang-mem-fraction-static 0.6
154154
)
155155
####################
156156

scripts/partial_rollout/deepseek/grpo/run-deepseek-r1-distill-qwen-1.5B-deepscaler-partial.sh

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -94,7 +94,7 @@ ROLLOUT_ARGS=(
9494
EVAL_ARGS=(
9595
--eval-interval 10
9696
--eval-prompt-data aime ${DATA_DIR}/aime-2024/aime-2024.jsonl
97-
--n-samples-per-eval-prompt 4
97+
--n-samples-per-eval-prompt 16
9898
--eval-max-response-len 16384
9999
--eval-top-p 0.7
100100
)
@@ -137,7 +137,7 @@ OPTIMIZER_ARGS=(
137137

138138
WANDB_ARGS=(
139139
--use-wandb
140-
--wandb-project 4B-amd
140+
--wandb-project APRIL
141141
--wandb-group deepscaler-deepseek-r1-distill-qwen-1.5B-grpo-partial
142142
--wandb-key ${WANDB_API_KEY}
143143
)
@@ -150,7 +150,7 @@ WANDB_ARGS=(
150150
# )
151151
SGLANG_ARGS=(
152152
--rollout-num-gpus-per-engine 2
153-
--sglang-mem-fraction-static 0.4
153+
--sglang-mem-fraction-static 0.6
154154
)
155155
####################
156156

scripts/partial_rollout/deepseek/grpo/run-deepseek-r1-distill-qwen-1.5B-deepscaler.sh

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -94,7 +94,7 @@ ROLLOUT_ARGS=(
9494
EVAL_ARGS=(
9595
--eval-interval 10
9696
--eval-prompt-data aime ${DATA_DIR}/aime-2024/aime-2024.jsonl
97-
--n-samples-per-eval-prompt 4
97+
--n-samples-per-eval-prompt 16
9898
--eval-max-response-len 16384
9999
--eval-top-p 0.7
100100
)
@@ -137,7 +137,7 @@ OPTIMIZER_ARGS=(
137137

138138
WANDB_ARGS=(
139139
--use-wandb
140-
--wandb-project 4B-amd
140+
--wandb-project APRIL
141141
--wandb-group deepscaler-deepseek-r1-distill-qwen-1.5B-grpo
142142
--wandb-key ${WANDB_API_KEY}
143143
)
@@ -150,7 +150,7 @@ WANDB_ARGS=(
150150
# )
151151
SGLANG_ARGS=(
152152
--rollout-num-gpus-per-engine 2
153-
--sglang-mem-fraction-static 0.4
153+
--sglang-mem-fraction-static 0.6
154154
)
155155
####################
156156

scripts/partial_rollout/deepseek/gspo/run-deepseek-r1-distill-qwen-1.5B-dapo-partial.sh

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -94,7 +94,7 @@ ROLLOUT_ARGS=(
9494
EVAL_ARGS=(
9595
--eval-interval 10
9696
--eval-prompt-data aime ${DATA_DIR}/aime-2024/aime-2024.jsonl
97-
--n-samples-per-eval-prompt 4
97+
--n-samples-per-eval-prompt 16
9898
--eval-max-response-len 16384
9999
--eval-top-p 0.7
100100
)
@@ -137,7 +137,7 @@ OPTIMIZER_ARGS=(
137137

138138
WANDB_ARGS=(
139139
--use-wandb
140-
--wandb-project 4B-amd
140+
--wandb-project APRIL
141141
--wandb-group dapo-deepseek-r1-distill-qwen-1.5B-gspo-partial
142142
--wandb-key ${WANDB_API_KEY}
143143
)
@@ -150,7 +150,7 @@ WANDB_ARGS=(
150150
# )
151151
SGLANG_ARGS=(
152152
--rollout-num-gpus-per-engine 2
153-
--sglang-mem-fraction-static 0.4
153+
--sglang-mem-fraction-static 0.6
154154
)
155155
####################
156156

scripts/partial_rollout/deepseek/gspo/run-deepseek-r1-distill-qwen-1.5B-dapo.sh

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -94,7 +94,7 @@ ROLLOUT_ARGS=(
9494
EVAL_ARGS=(
9595
--eval-interval 10
9696
--eval-prompt-data aime ${DATA_DIR}/aime-2024/aime-2024.jsonl
97-
--n-samples-per-eval-prompt 4
97+
--n-samples-per-eval-prompt 16
9898
--eval-max-response-len 16384
9999
--eval-top-p 0.7
100100
)
@@ -137,7 +137,7 @@ OPTIMIZER_ARGS=(
137137

138138
WANDB_ARGS=(
139139
--use-wandb
140-
--wandb-project 4B-amd
140+
--wandb-project APRIL
141141
--wandb-group dapo-deepseek-r1-distill-qwen-1.5B-gspo
142142
--wandb-key ${WANDB_API_KEY}
143143
)
@@ -150,7 +150,7 @@ WANDB_ARGS=(
150150
# )
151151
SGLANG_ARGS=(
152152
--rollout-num-gpus-per-engine 2
153-
--sglang-mem-fraction-static 0.4
153+
--sglang-mem-fraction-static 0.6
154154
)
155155
####################
156156

0 commit comments

Comments
 (0)