We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 62401e1, commit d491d80 (copy full SHA for d491d80)
2 files changed
tools/launcher/examples/Qwen/Qwen3-8B/hf_offline_eagle3.yaml
@@ -43,7 +43,7 @@ pipeline:
43
nodes: 1
44
ntasks_per_node: 8
45
gpus_per_node: 8
46
- container: nvcr.io/nvidia/tensorrt-llm/release:1.2.0
+ container: nvcr.io/nvidia/tensorrt-llm/release:1.3.0rc10
47
48
# Step 2: Dump hidden states from target model
49
task_1:
@@ -79,7 +79,7 @@ pipeline:
79
80
ntasks_per_node: 1
81
82
83
84
# Step 4: Benchmark speculative decoding (VLLM backend)
85
task_3:
0 commit comments