Skip to content

Commit d31133c

Browse files
committed
Make the run really long to avoid triggering a finished run, like in finetuning
1 parent a7bda6f commit d31133c

1 file changed

Lines changed: 6 additions & 0 deletions

File tree

olmoearth_pretrain/internal/full_eval_sweep.py

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -515,6 +515,10 @@ def _get_pooling_type_str(pooling_type: str) -> str:
515515

516516

517517
LAUNCH_OVERRIDES = "--launch.priority=high --launch.num_gpus=1 --launch.task_name=eval"
518+
# Override the max duration so that the last step of the checkpoint can be evaluated
519+
MAX_DURATION_OVERRIDE = (
520+
"--trainer.max_duration.value=10000000 --trainer.max_duration.unit=steps"
521+
)
518522

519523

520524
def _get_env_prefix(args: argparse.Namespace, module_path: str) -> str:
@@ -989,6 +993,8 @@ def build_commands(args: argparse.Namespace, extra_cli: list[str]) -> list[str]:
989993
commands_to_run_new.append(cmd)
990994
commands_to_run = commands_to_run_new
991995

996+
commands_to_run = [f"{cmd} {MAX_DURATION_OVERRIDE}" for cmd in commands_to_run]
997+
992998
# Filter out skipped tasks if task-skip-names is provided
993999
if args.task_skip_names:
9941000
skip_names = [name.strip() for name in args.task_skip_names.split(",")]

0 commit comments

Comments
 (0)