Skip to content

Commit 7ac2a68

Browse files
author
pensieve-intern
committed
[OMNIML-4600] hidden_state_dump_support — pensieve-intern agent draft
1 parent 7a11fb2 commit 7ac2a68

1 file changed

Lines changed: 33 additions & 0 deletions

File tree

Lines changed: 33 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,33 @@
1+
# Step 2 hidden-state dump for qwen3-v0350a-eagle3 (EAGLE3 offline pipeline).
2+
#
3+
# Standalone task that dumps hidden states from the target model.
4+
# Output goes to /scratchspace/offline_hidden_states for consumption by step 3.
5+
#
6+
# Usage:
7+
# uv run slurm.py --yaml examples/Qwen/qwen3-v0350a-eagle3/step2_hidden.yaml --dry-run
8+
9+
# NOTE(review): in this view every key sits at column 0, so the intended
# nesting of the keys below cannot be confirmed from here.
job_name: qwen3-v0350a-eagle3_EAGLE3_hidden_dump
10+
pipeline:
11+
allow_to_fail: false
12+
skip: false
13+
# NOTE(review): a bare `note:` loads as null in YAML, not as an empty string;
# confirm the consumer accepts null, or write the intended value explicitly.
note:
14+
15+
# Named values referenced elsewhere in this file with the <<global_vars.NAME>>
# placeholder syntax (used for HF_MODEL_CKPT below).
global_vars:
16+
# NOTE(review): the header says hidden states are dumped from the target
# model, but this path ends in "-eagle3" - confirm it points at the target
# checkpoint rather than a draft model.
hf_model: /hf-local/Qwen/qwen3-v0350a-eagle3
17+
18+
# The only task defined in this file: one script plus its arguments,
# environment and Slurm settings.
task_0:
19+
script: common/eagle3/dump_offline_data.sh
20+
# Each list item is a single string holding a flag and its value.
args:
21+
- --input-data /scratchspace/data
22+
# Same directory the header names as the input for step 3.
- --output-dir /scratchspace/offline_hidden_states
23+
- --max-seq-len 8192
24+
# NOTE(review): --tp and --moe-ep are both 8, equal to ntasks_per_node and
# gpus_per_node below; presumably these must be changed together - TODO confirm.
- --tp 8
25+
- --moe-ep 8
26+
environment:
27+
# The value is an unquoted <<...>> placeholder that YAML loads as a plain
# string; presumably the launcher substitutes global_vars.hf_model - verify.
- HF_MODEL_CKPT: <<global_vars.hf_model>>
28+
slurm_config:
29+
_factory_: "slurm_factory"
30+
# One node with 8 tasks and 8 GPUs.
nodes: 1
31+
ntasks_per_node: 8
32+
gpus_per_node: 8
33+
# Container image pinned to the 1.2.0 release tag.
container: nvcr.io/nvidia/tensorrt-llm/release:1.2.0

0 commit comments

Comments
 (0)