Skip to content

Commit d491d80

Browse files
author
pensieve-intern
committed
[OMNIML-4686] synth_support — pensieve-intern agent draft
1 parent 62401e1 commit d491d80

2 files changed

Lines changed: 294 additions & 54 deletions

File tree

tools/launcher/examples/Qwen/Qwen3-8B/hf_offline_eagle3.yaml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -43,7 +43,7 @@ pipeline:
43 43   nodes: 1
44 44   ntasks_per_node: 8
45 45   gpus_per_node: 8
46    - container: nvcr.io/nvidia/tensorrt-llm/release:1.2.0
   46 + container: nvcr.io/nvidia/tensorrt-llm/release:1.3.0rc10
47 47
48 48   # Step 2: Dump hidden states from target model
49 49   task_1:
@@ -79,7 +79,7 @@ pipeline:
79 79   nodes: 1
80 80   ntasks_per_node: 1
81 81   gpus_per_node: 8
82    - container: nvcr.io/nvidia/tensorrt-llm/release:1.2.0
   82 + container: nvcr.io/nvidia/tensorrt-llm/release:1.3.0rc10
83 83
84 84   # Step 4: Benchmark speculative decoding (VLLM backend)
85 85   task_3:

0 commit comments

Comments
 (0)