Skip to content

Commit 4ef6523

Browse files
committed
add deepseek v4 attempt
1 parent 7fe37d4 commit 4ef6523

2 files changed

Lines changed: 35 additions & 0 deletions

File tree

Lines changed: 17 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,17 @@
#!/bin/bash
# Launches DeepSeek-V4-Pro-Base: 1.6T parameters, fp8 block-quantised.
# Tensor parallelism of 32 spread over 8 nodes (32 GH200s).
# Needs an sglang build with DeepseekV4ForCausalLM support and
# transformers >= 4.57.1.

# Flags forwarded to the serving framework. They are collected in an array
# for readability and later collapsed into ONE space-separated string,
# because --framework-args takes a single argument.
sglang_flags=(
  --model-path /capstor/store/cscs/swissai/infra01/hf_models/models/deepseek-ai/DeepSeek-V4-Pro-Base
  # Suffix the served name with the invoking user.
  --served-model-name "deepseek-ai/DeepSeek-V4-Pro-Base-$(whoami)"
  --tp-size 32
  --host 0.0.0.0
  --trust-remote-code
  --mem-fraction-static 0.85
  --enable-metrics
)

# Options for the `sml advanced` launcher itself.
launch_opts=(
  --firecrest-system clariden
  --partition normal
  --slurm-nodes-per-replica 8
  --slurm-time 3:00:00
  --serving-framework sglang
  # Relative path: resolved against the current working directory.
  --slurm-environment src/swiss_ai_model_launch/assets/envs/sglang.toml
  # "${arr[*]}" joins the elements with the first character of IFS (a space).
  --framework-args "${sglang_flags[*]}"
)

sml advanced "${launch_opts[@]}"
Lines changed: 18 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,18 @@
#!/bin/bash
# Launches the post-trained DeepSeek-V4-Pro, MXFP4-quantised (~806 GB on disk).
# 4 nodes with TP16, mirroring the V3.1 density.
# Needs an sglang build with MXFP4 dequant kernels and
# DeepseekV4ForCausalLM support, plus transformers >= 4.57.1.

# Flags forwarded to the serving framework. They are collected in an array
# for readability and later collapsed into ONE space-separated string,
# because --framework-args takes a single argument.
sglang_flags=(
  --model-path /capstor/store/cscs/swissai/infra01/hf_models/models/deepseek-ai/DeepSeek-V4-Pro
  # Suffix the served name with the invoking user.
  --served-model-name "deepseek-ai/DeepSeek-V4-Pro-$(whoami)"
  --tp-size 16
  --host 0.0.0.0
  --trust-remote-code
  --mem-fraction-static 0.85
  --enable-metrics
)

# Options for the `sml advanced` launcher itself.
launch_opts=(
  --firecrest-system clariden
  --partition normal
  --slurm-nodes-per-replica 4
  --serving-framework sglang
  --slurm-time 3:00:00
  # Relative path: resolved against the current working directory.
  --slurm-environment src/swiss_ai_model_launch/assets/envs/sglang.toml
  # "${arr[*]}" joins the elements with the first character of IFS (a space).
  --framework-args "${sglang_flags[*]}"
)

sml advanced "${launch_opts[@]}"

0 commit comments

Comments
 (0)