Skip to content

Commit 366b647

Browse files
committed
Cleanup tomls
1 parent b50d484 commit 366b647

File tree

5 files changed

+32
-63
lines changed

5 files changed

+32
-63
lines changed
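conf/experimental/ai_dynamo/test/vllm.toml (new file; path not shown on the page — inferred from the deleted conf/staging/ai_dynamo/test/vllm.toml and the updated --tests-dir in the docs)

Lines changed: 28 additions & 0 deletions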
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,28 @@
1+
name = "vllm"
2+
description = "vllm"
3+
test_template_name = "AIDynamo"
4+
5+
[cmd_args]
6+
docker_image_url = "nvcr.io/nvidia/ai-dynamo/vllm-runtime:0.6.1.post1"
7+
8+
[cmd_args.dynamo]
9+
backend = "vllm"
10+
11+
[cmd_args.genai_perf]
12+
endpoint = "v1/chat/completions"
13+
endpoint-type = "chat"
14+
extra-inputs = 'min_tokens:10'
15+
output-tokens-mean = 500
16+
output-tokens-stddev = 0
17+
random-seed = 123
18+
request-count = 20
19+
synthetic-input-tokens-mean = 3000
20+
synthetic-input-tokens-stddev = 0
21+
warmup-request-count = 10
22+
concurrency = 1
23+
extra-args = "--streaming -- -v --async"
24+
25+
[extra_env_vars]
26+
UCX_LOG_LEVEL = "warn"
27+
UCX_TLS = "cuda_copy,rc_x"
28+
DYNAMO_NODELIST = "$(scontrol show hostname $SLURM_JOB_NODELIST | tr -s '\\n' ',')"

conf/staging/ai_dynamo/test_scenario/vllm_k8s.toml renamed to conf/experimental/ai_dynamo/test_scenario/vllm_k8s.toml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,11 +1,11 @@
11
name = "vllm_k8s"
22

33
[[Tests]]
4-
id = "Tests.1"
4+
id = "dynamo.vllm"
55
test_name = "vllm"
66

77
[Tests.cmd_args]
8-
docker_image_url = "gitlab-master.nvidia.com#dl/ai-dynamo/dynamo:e82bc4ec960111b369260e1758072c93227b66bf-32414403-vllm-amd64"
8+
docker_image_url = "nvcr.io/nvidia/ai-dynamo/vllm-runtime:0.6.1.post1"
99
dynamo_graph_path = "conf/staging/ai_dynamo/test/agg.yaml"
1010
[Tests.cmd_args.dynamo]
1111
[Tests.cmd_args.dynamo.prefill_worker]

conf/staging/ai_dynamo/test/vllm.toml

Lines changed: 0 additions & 59 deletions
This file was deleted.

doc/workloads/ai_dynamo.rst

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -52,5 +52,5 @@ Run CloudAI to deploy AI Dynamo worker nodes according to your spec and run ``ge
5252
.. code-block:: bash
5353
5454
uv run cloudai run --system-config <k8s system toml> \
55-
--tests-dir conf/staging/ai_dynamo/test \
56-
--test-scenario conf/staging/ai_dynamo/test_scenario/vllm_k8s.toml
55+
--tests-dir conf/experimental/ai_dynamo/test \
56+
--test-scenario conf/experimental/ai_dynamo/test_scenario/vllm_k8s.toml

0 commit comments

Comments
 (0)