Skip to content

Commit 3c85d03

Browse files
authored
Merge pull request #695 from NVIDIA/am/bug-4641151
Fix CLI arg for kvbench
2 parents 8291948 + 64ebd40 commit 3c85d03

File tree

3 files changed

+4
-4
lines changed

3 files changed

+4
-4
lines changed

src/cloudai/workloads/nixl_kvbench/slurm_command_gen_strategy.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -69,6 +69,6 @@ def gen_kvbench_command(self) -> list[str]:
69  69    for k, v in self.test_run.test.test_definition.cmd_args_dict.items():
70  70    command.append(f"--{k} {v}")
71  71
72      - command.append("--etcd-endpoints http://$NIXL_ETCD_ENDPOINTS")
    72  + command.append("--etcd_endpoints http://$NIXL_ETCD_ENDPOINTS")
73  73
74  74    return command

tests/ref_data/nixl-kvbench.sbatch

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -22,7 +22,7 @@ timeout 60 bash -c "until curl -s $NIXL_ETCD_ENDPOINTS/health > /dev/null 2>&1;
22  22    echo "ETCD ($NIXL_ETCD_ENDPOINTS) was unreachable after 60 seconds";
23  23    exit 1
24  24    }
25      - srun --export=ALL --mpi=pmix --container-image=url.com/docker:tag --container-mounts=__OUTPUT_DIR__/output:/cloudai_run_results,__OUTPUT_DIR__/install:/cloudai_install,__OUTPUT_DIR__/output --overlap --relative=0 --ntasks-per-node=1 --ntasks=1 -N1 bash -c "source __OUTPUT_DIR__/output/env_vars.sh; path/to/python path/to/kvbench_script.sh profile --backend UCX --etcd-endpoints http://$NIXL_ETCD_ENDPOINTS" &
    25  + srun --export=ALL --mpi=pmix --container-image=url.com/docker:tag --container-mounts=__OUTPUT_DIR__/output:/cloudai_run_results,__OUTPUT_DIR__/install:/cloudai_install,__OUTPUT_DIR__/output --overlap --relative=0 --ntasks-per-node=1 --ntasks=1 -N1 bash -c "source __OUTPUT_DIR__/output/env_vars.sh; path/to/python path/to/kvbench_script.sh profile --backend UCX --etcd_endpoints http://$NIXL_ETCD_ENDPOINTS" &
26  26    sleep 15
27      - srun --export=ALL --mpi=pmix --container-image=url.com/docker:tag --container-mounts=__OUTPUT_DIR__/output:/cloudai_run_results,__OUTPUT_DIR__/install:/cloudai_install,__OUTPUT_DIR__/output --overlap --relative=1 --ntasks-per-node=1 --ntasks=1 -N1 bash -c "source __OUTPUT_DIR__/output/env_vars.sh; path/to/python path/to/kvbench_script.sh profile --backend UCX --etcd-endpoints http://$NIXL_ETCD_ENDPOINTS"
    27  + srun --export=ALL --mpi=pmix --container-image=url.com/docker:tag --container-mounts=__OUTPUT_DIR__/output:/cloudai_run_results,__OUTPUT_DIR__/install:/cloudai_install,__OUTPUT_DIR__/output --overlap --relative=1 --ntasks-per-node=1 --ntasks=1 -N1 bash -c "source __OUTPUT_DIR__/output/env_vars.sh; path/to/python path/to/kvbench_script.sh profile --backend UCX --etcd_endpoints http://$NIXL_ETCD_ENDPOINTS"
28  28    kill -9 $etcd_pid

tests/slurm_command_gen_strategy/test_nixl_kvbench_command_gen.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -70,5 +70,5 @@ def test_gen_kvbench_ucx(kvbench_tr: TestRun, slurm_system: SlurmSystem):
70  70    "--model_config ./cfg.yaml",
71  71    "--source src",
72  72    "--op_type READ",
73      - "--etcd-endpoints http://$NIXL_ETCD_ENDPOINTS",
    73  + "--etcd_endpoints http://$NIXL_ETCD_ENDPOINTS",
74  74    ]

0 commit comments

Comments
 (0)