@@ -14,9 +14,12 @@ dashboard_info:
1414# Base configuration
1515recipe_subdir : amplify_accelerate_te_fp8  # directory under recipes/ that the script changes into
1616branch : jwilber/add-wandb-recipe-amplify  # checked out only when commit_sha is empty and this is not "main"
17+ commit_sha : ""  # optional pin; when non-empty the script checks out this commit instead of the branch
1718train_cmnd : train  # basename of the training script; the script runs it as <train_cmnd>.py via torchrun
1819
1920wandb_init_args :  # each value below is forwarded to the training command as a wandb_init_args.* override
21+ project : "amplify_accelerate_te_fp8"
22+ group : "recipes_model_convergence"
2023 mode : "online" # need online to collect logs; if offline, must manually sync after run
2124
2225stop_after_n_steps : 10  # NOTE(review): the torchrun invocation in the script no longer passes this override — confirm whether it is still consumed elsewhere
@@ -33,14 +36,20 @@ products:
3336
3437script : |  # clone the repo, check out the requested revision, install requirements, launch training
3538 git clone https://github.com/NVIDIA/bionemo-framework.git
36- if [ "${branch}" != "main" ]; then
37- cd bionemo-framework
39+ cd bionemo-framework
40+ if [ -n "${commit_sha}" ]; then  # a non-empty commit pin takes precedence over the branch
41+ echo "Checking out commit: ${commit_sha}"
42+ git checkout "${commit_sha}"
43+ elif [ "${branch}" != "main" ]; then  # otherwise switch only when the branch is not main
44+ echo "Checking out branch: ${branch}"
3845 git checkout "${branch}"
39- cd ..
4046 fi
47+ cd ..
4148 cd bionemo-framework/recipes/${recipe_subdir}
4249 pip install -r requirements.txt
4350 torchrun ${train_cmnd}.py \
4451 --config-name ${config}.yaml \
45- stop_after_n_steps=${stop_after_n_steps} \
46- trainer.report_to=${trainer.report_to}
52+ trainer.report_to=${trainer.report_to} \
53+ wandb_init_args.mode=${wandb_init_args.mode} \
54+ wandb_init_args.project=${wandb_init_args.project} \
55+ +wandb_init_args.group=${wandb_init_args.group}
0 commit comments