File tree Expand file tree Collapse file tree 5 files changed +32
-63
lines changed
Expand file tree Collapse file tree 5 files changed +32
-63
lines changed File renamed without changes.
Original file line number Diff line number Diff line change 1+ name = "vllm"
2+ description = "vllm"
3+ test_template_name = "AIDynamo"
4+
5+ [cmd_args]
6+ docker_image_url = "nvcr.io/nvidia/ai-dynamo/vllm-runtime:0.6.1.post1"
7+
8+ [cmd_args.dynamo]
9+ backend = "vllm"
10+
11+ [cmd_args.genai_perf]
12+ endpoint = "v1/chat/completions"
13+ endpoint-type = "chat"
14+ extra-inputs = 'min_tokens:10'
15+ output-tokens-mean = 500
16+ output-tokens-stddev = 0
17+ random-seed = 123
18+ request-count = 20
19+ synthetic-input-tokens-mean = 3000
20+ synthetic-input-tokens-stddev = 0
21+ warmup-request-count = 10
22+ concurrency = 1
23+ extra-args = "--streaming -- -v --async"
24+
25+ [extra_env_vars]
26+ UCX_LOG_LEVEL = "warn"
27+ UCX_TLS = "cuda_copy,rc_x"
28+ DYNAMO_NODELIST = "$(scontrol show hostname $SLURM_JOB_NODELIST | tr -s '\\n' ',')"
Original file line number Diff line number Diff line change 11name = "vllm_k8s"
22
33[[Tests]]
4- id = "Tests.1"
4+ id = "dynamo.vllm"
55test_name = "vllm"
66
77 [Tests.cmd_args]
8- docker_image_url = "gitlab-master.nvidia.com#dl/ai-dynamo/dynamo:e82bc4ec960111b369260e1758072c93227b66bf-32414403-vllm-amd64"
8+ docker_image_url = "nvcr.io/nvidia/ai-dynamo/vllm-runtime:0.6.1.post1"
99 dynamo_graph_path = "conf/staging/ai_dynamo/test/agg.yaml"
1010 [Tests.cmd_args.dynamo]
1111 [Tests.cmd_args.dynamo.prefill_worker]
Load Diff This file was deleted.
Original file line number Diff line number Diff line change @@ -52,5 +52,5 @@ Run CloudAI to deploy AI Dynamo worker nodes according to your spec and run ``ge
5252.. code-block:: bash
5353
5454 uv run cloudai run --system-config <k8s system toml> \
55- --tests-dir conf/staging/ai_dynamo/test \
56- --test-scenario conf/staging/ai_dynamo/test_scenario/vllm_k8s.toml
55+ --tests-dir conf/experimental/ai_dynamo/test \
56+ --test-scenario conf/experimental/ai_dynamo/test_scenario/vllm_k8s.toml
You can’t perform that action at this time.
0 commit comments