Skip to content

Commit 36635d0

Browse files
author
pensieve-intern
committed
[OMNIML-4527] hidden_state_dump_support — pensieve-intern agent draft
1 parent 7a11fb2 commit 36635d0

1 file changed

Lines changed: 33 additions & 0 deletions

File tree

Lines changed: 33 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,33 @@
1+
# Hidden-state dump launcher for qwen3-v0344a-eagle3 (EAGLE3 step2).
2+
#
3+
# Standalone task extracted from the monolithic hf_offline_eagle3 pipeline.
4+
# Writes hidden states to /scratchspace/offline_hidden_states for step3.
5+
#
6+
# Usage:
7+
# uv run slurm.py --yaml examples/Qwen/qwen3-v0344a-eagle3/step2_hidden.yaml --dry-run
8+
9+
# Job identifier for this launcher file.
job_name: qwen3-v0344a-eagle3_EAGLE3_hidden_dump
10+
# NOTE(review): leading indentation is not visible in this view; the keys that
# follow are presumably nested under `pipeline` — confirm against the raw file.
pipeline:
11+
allow_to_fail: false
12+
skip: false
13+
# No value is given, so YAML reads this key as null (not an empty string).
note:
14+
15+
# Named values that other entries in this file refer to with the
# <<global_vars.NAME>> placeholder form.
global_vars:
16+
hf_model: /hf-local/Qwen/qwen3-v0344a-eagle3
17+
18+
# task_0 pairs a script with its arguments, environment entries, and Slurm
# settings. NOTE(review): nesting is presumed; indentation is not visible here.
task_0:
19+
script: common/eagle3/dump_offline_data.sh
20+
# Each list entry holds a flag and its value together in one string.
args:
21+
- --input-data /scratchspace/data
22+
# Same directory the file header names as the hand-off location for step3.
- --output-dir /scratchspace/offline_hidden_states
23+
- --max-seq-len 8192
24+
# --tp and --moe-ep are both 8, equal to gpus_per_node and ntasks_per_node below.
- --tp 8
25+
- --moe-ep 8
26+
environment:
27+
# Placeholder that names global_vars.hf_model; presumably substituted by the
# launcher before the script runs — TODO confirm.
- HF_MODEL_CKPT: <<global_vars.hf_model>>
28+
slurm_config:
29+
# NOTE(review): `_factory_` looks like a launcher-specific key selecting how
# this section is built — confirm its meaning against the launcher.
_factory_: "slurm_factory"
30+
# One node with 8 tasks and 8 GPUs.
nodes: 1
31+
ntasks_per_node: 8
32+
gpus_per_node: 8
33+
# Container image reference, pinned to the 1.2.0 tag.
container: nvcr.io/nvidia/tensorrt-llm/release:1.2.0

0 commit comments

Comments
 (0)