File tree Expand file tree Collapse file tree
#!/bin/bash
# Launch DeepSeek-V4-Pro-Base on the `clariden` FirecREST system via
# `sml advanced`, using sglang as the serving framework.
# (Per the diff header this script lives under examples/clariden/cli/deepseek-ai.)
#
# 1.6T params, fp8 block-quantised. 8 nodes x TP32 (32 GH200s).
# Requires sglang with DeepseekV4ForCausalLM support and transformers >= 4.57.1.

# Arguments forwarded verbatim to the serving framework. Kept as an array so
# each flag sits on its own line without backslash continuations inside a
# quoted string.
sglang_args=(
  --model-path /capstor/store/cscs/swissai/infra01/hf_models/models/deepseek-ai/DeepSeek-V4-Pro-Base
  # The served name is suffixed with the invoking user's login name.
  --served-model-name "deepseek-ai/DeepSeek-V4-Pro-Base-$(whoami)"
  # Tensor-parallel size; matches the "8 nodes x TP32" note above.
  --tp-size 32
  --host 0.0.0.0
  --trust-remote-code
  --mem-fraction-static 0.85
  --enable-metrics
)

# `sml` receives the framework arguments as ONE string. "${sglang_args[*]}"
# joins the array with single spaces (default IFS). The leading space is kept
# from the original string.
# NOTE(review): presumably the leading space stops the `sml` option parser from
# treating a value that starts with "--" as a flag - confirm before removing.
framework_args=" ${sglang_args[*]}"

# NOTE(review): --slurm-environment is a relative path; presumably this script
# is meant to be run from the repository root - confirm.
sml advanced \
  --firecrest-system clariden \
  --partition normal \
  --slurm-nodes-per-replica 8 \
  --slurm-time 3:00:00 \
  --serving-framework sglang \
  --slurm-environment src/swiss_ai_model_launch/assets/envs/sglang.toml \
  --framework-args "${framework_args}"
#!/bin/bash
# Launch DeepSeek-V4-Pro on the `clariden` FirecREST system via
# `sml advanced`, using sglang as the serving framework.
#
# Post-trained DeepSeek-V4-Pro, MXFP4-quantised (~806 GB on disk).
# 4 nodes x TP16 mirrors V3.1 density. Requires sglang with MXFP4 dequant
# kernels and DeepseekV4ForCausalLM support; transformers >= 4.57.1.

# Arguments forwarded verbatim to the serving framework. Kept as an array so
# each flag sits on its own line without backslash continuations inside a
# quoted string.
sglang_args=(
  --model-path /capstor/store/cscs/swissai/infra01/hf_models/models/deepseek-ai/DeepSeek-V4-Pro
  # The served name is suffixed with the invoking user's login name.
  --served-model-name "deepseek-ai/DeepSeek-V4-Pro-$(whoami)"
  # Tensor-parallel size; matches the "4 nodes x TP16" note above.
  --tp-size 16
  --host 0.0.0.0
  --trust-remote-code
  --mem-fraction-static 0.85
  --enable-metrics
)

# `sml` receives the framework arguments as ONE string. "${sglang_args[*]}"
# joins the array with single spaces (default IFS). The leading space is kept
# from the original string.
# NOTE(review): presumably the leading space stops the `sml` option parser from
# treating a value that starts with "--" as a flag - confirm before removing.
framework_args=" ${sglang_args[*]}"

# NOTE(review): --slurm-environment is a relative path; presumably this script
# is meant to be run from the repository root - confirm.
sml advanced \
  --firecrest-system clariden \
  --partition normal \
  --slurm-nodes-per-replica 4 \
  --serving-framework sglang \
  --slurm-time 3:00:00 \
  --slurm-environment src/swiss_ai_model_launch/assets/envs/sglang.toml \
  --framework-args "${framework_args}"
You can’t perform that action at this time.
0 commit comments