Skip to content

Commit 6242824

Browse files
committed
Use generic model path and container aliases for cluster portability
Replace cluster-specific paths with generic alias names that are resolved via srtslurm.yaml model_paths and containers mappings, as per upstream convention.
1 parent 493b0ee commit 6242824

29 files changed

Lines changed: 58 additions & 58 deletions

recipes/kimi2.5/trtllm_dynamo/disagg/gb200Nvfp4/ISL1K_OSL1K/MTP/ctx1dep4_gen1dep16_batch32_eplb0_mtp3.yaml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -6,8 +6,8 @@ name: "kimi_k25_nvfp4_ISL1K_OSL1K_ctx1dep4_gen1dep16_batch32_eplb0_mtp3"
66
# concurrency: 666
77

88
model:
9-
path: "/mnt/lustre01/models/kimi-k2.5-nvfp4"
10-
container: "/mnt/lustre01/users/slurm-shared/yeswanthk/squashs/tensorrtllm-runtime-1.1.0-dev.2.sqsh"
9+
path: "kimi-k2.5-nvfp4"
10+
container: "tensorrtllm-runtime:1.1.0-dev.2"
1111
precision: "fp4"
1212

1313
resources:

recipes/kimi2.5/trtllm_dynamo/disagg/gb200Nvfp4/ISL1K_OSL1K/MTP/ctx1dep4_gen1dep32_batch16_eplb0_mtp3.yaml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -6,8 +6,8 @@ name: "kimi_k25_nvfp4_ISL1K_OSL1K_ctx1dep4_gen1dep32_batch16_eplb0_mtp3"
66
# concurrency: 666
77

88
model:
9-
path: "/mnt/lustre01/models/kimi-k2.5-nvfp4"
10-
container: "/mnt/lustre01/users/slurm-shared/yeswanthk/squashs/tensorrtllm-runtime-1.1.0-dev.2.sqsh"
9+
path: "kimi-k2.5-nvfp4"
10+
container: "tensorrtllm-runtime:1.1.0-dev.2"
1111
precision: "fp4"
1212

1313
resources:

recipes/kimi2.5/trtllm_dynamo/disagg/gb200Nvfp4/ISL1K_OSL1K/MTP/ctx1dep4_gen1dep8_batch512_eplb0_mtp1.yaml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -6,8 +6,8 @@ name: "kimi_k25_nvfp4_ISL1K_OSL1K_ctx1dep4_gen1dep8_batch512_eplb0_mtp1"
66
# concurrency: 4301
77

88
model:
9-
path: "/mnt/lustre01/models/kimi-k2.5-nvfp4"
10-
container: "/mnt/lustre01/users/slurm-shared/yeswanthk/squashs/tensorrtllm-runtime-1.1.0-dev.2.sqsh"
9+
path: "kimi-k2.5-nvfp4"
10+
container: "tensorrtllm-runtime:1.1.0-dev.2"
1111
precision: "fp4"
1212

1313
resources:

recipes/kimi2.5/trtllm_dynamo/disagg/gb200Nvfp4/ISL1K_OSL1K/MTP/ctx1dep4_gen4tep8_batch64_allconc_eplb0_mtp3.yaml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -6,8 +6,8 @@ name: "kimi_k25_nvfp4_ISL1K_OSL1K_ctx1dep4_gen4tep8_batch64_allconc_eplb0_mtp3"
66
# Covers all gen4tep8 concurrencies: 8, 48, 92, 192, 336
77

88
model:
9-
path: "/mnt/lustre01/models/kimi-k2.5-nvfp4"
10-
container: "/mnt/lustre01/users/slurm-shared/yeswanthk/squashs/tensorrtllm-runtime-1.1.0-dev.2.sqsh"
9+
path: "kimi-k2.5-nvfp4"
10+
container: "tensorrtllm-runtime:1.1.0-dev.2"
1111
precision: "fp4"
1212

1313
resources:

recipes/kimi2.5/trtllm_dynamo/disagg/gb200Nvfp4/ISL1K_OSL1K/MTP/ctx1dep4_gen5tep4_batch2_allconc_eplb0_mtp3.yaml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -6,8 +6,8 @@ name: "kimi_k25_nvfp4_ISL1K_OSL1K_ctx1dep4_gen5tep4_batch2_allconc_eplb0_mtp3"
66
# Covers all gen5tep4 concurrencies: 10, 15
77

88
model:
9-
path: "/mnt/lustre01/models/kimi-k2.5-nvfp4"
10-
container: "/mnt/lustre01/users/slurm-shared/yeswanthk/squashs/tensorrtllm-runtime-1.1.0-dev.2.sqsh"
9+
path: "kimi-k2.5-nvfp4"
10+
container: "tensorrtllm-runtime:1.1.0-dev.2"
1111
precision: "fp4"
1212

1313
resources:

recipes/kimi2.5/trtllm_dynamo/disagg/gb200Nvfp4/ISL1K_OSL1K/MTP/ctx2dep4_gen1dep16_batch128_eplb0_mtp1.yaml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -6,8 +6,8 @@ name: "kimi_k25_nvfp4_ISL1K_OSL1K_ctx2dep4_gen1dep16_batch128_eplb0_mtp1"
66
# concurrency: 2253
77

88
model:
9-
path: "/mnt/lustre01/models/kimi-k2.5-nvfp4"
10-
container: "/mnt/lustre01/users/slurm-shared/yeswanthk/squashs/tensorrtllm-runtime-1.1.0-dev.2.sqsh"
9+
path: "kimi-k2.5-nvfp4"
10+
container: "tensorrtllm-runtime:1.1.0-dev.2"
1111
precision: "fp4"
1212

1313
resources:

recipes/kimi2.5/trtllm_dynamo/disagg/gb200Nvfp4/ISL1K_OSL1K/MTP/ctx2dep4_gen1dep32_batch64_eplb0_mtp1.yaml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -6,8 +6,8 @@ name: "kimi_k25_nvfp4_ISL1K_OSL1K_ctx2dep4_gen1dep32_batch64_eplb0_mtp1"
66
# concurrency: 2253
77

88
model:
9-
path: "/mnt/lustre01/models/kimi-k2.5-nvfp4"
10-
container: "/mnt/lustre01/users/slurm-shared/yeswanthk/squashs/tensorrtllm-runtime-1.1.0-dev.2.sqsh"
9+
path: "kimi-k2.5-nvfp4"
10+
container: "tensorrtllm-runtime:1.1.0-dev.2"
1111
precision: "fp4"
1212

1313
resources:

recipes/kimi2.5/trtllm_dynamo/disagg/gb200Nvfp4/ISL1K_OSL1K/MTP/ctx2dep4_gen3dep8_batch256_eplb0_mtp1.yaml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -6,8 +6,8 @@ name: "kimi_k25_nvfp4_ISL1K_OSL1K_ctx2dep4_gen3dep8_batch256_eplb0_mtp1"
66
# concurrency: 6759
77

88
model:
9-
path: "/mnt/lustre01/models/kimi-k2.5-nvfp4"
10-
container: "/mnt/lustre01/users/slurm-shared/yeswanthk/squashs/tensorrtllm-runtime-1.1.0-dev.2.sqsh"
9+
path: "kimi-k2.5-nvfp4"
10+
container: "tensorrtllm-runtime:1.1.0-dev.2"
1111
precision: "fp4"
1212

1313
resources:

recipes/kimi2.5/trtllm_dynamo/disagg/gb200Nvfp4/ISL1K_OSL1K/STP/ctx1dep4_gen1dep16_batch32_eplb0_mtp0.yaml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -6,8 +6,8 @@ name: "kimi_k25_nvfp4_ISL1K_OSL1K_ctx1dep4_gen1dep16_batch32_eplb0_mtp0"
66
# concurrency: 666
77

88
model:
9-
path: "/mnt/lustre01/models/kimi-k2.5-nvfp4"
10-
container: "/mnt/lustre01/users/slurm-shared/yeswanthk/squashs/tensorrtllm-runtime-1.1.0-dev.2.sqsh"
9+
path: "kimi-k2.5-nvfp4"
10+
container: "tensorrtllm-runtime:1.1.0-dev.2"
1111
precision: "fp4"
1212

1313
resources:

recipes/kimi2.5/trtllm_dynamo/disagg/gb200Nvfp4/ISL1K_OSL1K/STP/ctx1dep4_gen1dep32_batch64_eplb0_mtp0.yaml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -6,8 +6,8 @@ name: "kimi_k25_nvfp4_ISL1K_OSL1K_ctx1dep4_gen1dep32_batch64_eplb0_mtp0"
66
# concurrency: 2253
77

88
model:
9-
path: "/mnt/lustre01/models/kimi-k2.5-nvfp4"
10-
container: "/mnt/lustre01/users/slurm-shared/yeswanthk/squashs/tensorrtllm-runtime-1.1.0-dev.2.sqsh"
9+
path: "kimi-k2.5-nvfp4"
10+
container: "tensorrtllm-runtime:1.1.0-dev.2"
1111
precision: "fp4"
1212

1313
resources:

0 commit comments

Comments
 (0)