Skip to content

Commit 7f48566

Browse files
2 parents 576634b + 0f21594 commit 7f48566

4 files changed

Lines changed: 572 additions & 149 deletions

File tree

.github/workflows/test_cli_cuda_vllm.yaml

Lines changed: 0 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -38,10 +38,6 @@ jobs:
3838
runs-on:
3939
group: aws-g5-4xlarge-plus
4040

41-
container:
42-
image: vllm/vllm-openai:latest
43-
options: --ipc host --gpus all --entrypoint /bin/bash
44-
4541
steps:
4642
- name: Checkout
4743
uses: actions/checkout@v4
@@ -71,10 +67,6 @@ jobs:
7167
runs-on:
7268
group: aws-g5-12xlarge-plus
7369

74-
container:
75-
image: vllm/vllm-openai:latest
76-
options: --ipc host --gpus all --entrypoint /bin/bash
77-
7870
steps:
7971
- name: Checkout
8072
uses: actions/checkout@v4

Makefile

Lines changed: 16 additions & 20 deletions
Original file line number | Diff line number | Diff line change
@@ -292,21 +292,19 @@ test-cli-cuda-py-txi:
292292
uv sync --dev --extra py-txi
293293
FORCE_SEQUENTIAL=1 uv run pytest tests/test_cli.py -s -k "cli and cuda and (tgi or tei or txi)"
294294

295+
test-cli-cuda-vllm-single:
296+
uv sync --dev --extra vllm
297+
FORCE_SEQUENTIAL=1 uv run pytest tests/test_cli.py -s -k "cli and cuda and vllm and not (tp or pp)"
298+
299+
test-cli-cuda-vllm-multi:
300+
uv sync --dev --extra vllm
301+
FORCE_SEQUENTIAL=1 uv run pytest tests/test_cli.py -s -k "cli and cuda and vllm and (tp or pp)"
302+
295303
test-cli-cuda-onnxruntime:
296304
uv sync --dev --extra onnxruntime-gpu
297305
uv run pytest tests/test_cli.py -s -k "cli and cuda and onnxruntime"
298306

299307
#### non-uv compatible
300-
test-cli-cuda-vllm-single:
301-
pip install uv --upgrade
302-
UV_SYSTEM_PYTHON=1 uv pip install -e .[dev,vllm]
303-
FORCE_SEQUENTIAL=1 pytest tests/test_cli.py -s -k "cli and cuda and vllm and not (tp or pp)"
304-
305-
test-cli-cuda-vllm-multi:
306-
pip install uv --upgrade
307-
UV_SYSTEM_PYTHON=1 uv pip install -e .[dev,vllm]
308-
FORCE_SEQUENTIAL=1 pytest tests/test_cli.py -s -k "cli and cuda and vllm and (tp or pp)"
309-
310308
test-cli-cuda-tensorrt-llm-single:
311309
UV_SYSTEM_PYTHON=1 uv pip install -e .[dev,tensorrt-llm]
312310
FORCE_SEQUENTIAL=1 pytest tests/test_cli.py -s -k "cli and cuda and tensorrt_llm and not (tp or pp)"
@@ -328,21 +326,19 @@ test-cli-cuda-py-txi-examples:
328326
uv sync --dev --extra py-txi
329327
FORCE_SEQUENTIAL=1 uv run pytest tests/test_examples.py -s -k "cli and cuda and (tgi or tei or txi)"
330328

329+
test-cli-cuda-vllm-single-examples:
330+
uv sync --dev --extra vllm
331+
FORCE_SEQUENTIAL=1 uv run pytest tests/test_examples.py -s -k "cli and cuda and vllm and not (tp or pp)"
332+
333+
test-cli-cuda-vllm-multi-examples:
334+
uv sync --dev --extra vllm
335+
FORCE_SEQUENTIAL=1 uv run pytest tests/test_examples.py -s -k "cli and cuda and vllm and (tp or pp)"
336+
331337
test-cli-cuda-onnxruntime-examples:
332338
uv sync --dev --extra onnxruntime-gpu
333339
uv run pytest tests/test_examples.py -s -k "cli and cuda and onnxruntime"
334340

335341
#### non-uv compatible
336-
test-cli-cuda-vllm-single-examples:
337-
pip install uv --upgrade
338-
UV_SYSTEM_PYTHON=1 uv pip install -e .[dev,vllm]
339-
FORCE_SEQUENTIAL=1 pytest tests/test_examples.py -s -k "cli and cuda and vllm and not (tp or pp)"
340-
341-
test-cli-cuda-vllm-multi-examples:
342-
pip install uv --upgrade
343-
UV_SYSTEM_PYTHON=1 uv pip install -e .[dev,vllm]
344-
FORCE_SEQUENTIAL=1 pytest tests/test_examples.py -s -k "cli and cuda and vllm and (tp or pp)"
345-
346342
test-cli-cuda-tensorrt-llm-single-examples:
347343
pip install uv --upgrade
348344
UV_SYSTEM_PYTHON=1 uv pip install -e .[dev,tensorrt-llm]

pyproject.toml

Lines changed: 1 addition & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -100,11 +100,9 @@ onnxruntime-gpu = ["optimum[onnxruntime-gpu]>=1.27.0"]
100100
tensorrt-llm = [
101101
"huggingface-hub<0.26.0; extra != 'openvino' and extra != 'onnxruntime' and extra != 'onnxruntime-gpu' and extra != 'ipex' and extra != 'vllm' and extra != 'llama-cpp' and extra != 'py-txi'",
102102
]
103-
vllm = [
104-
"vllm; extra != 'openvino' and extra != 'onnxruntime' and extra != 'onnxruntime-gpu' and extra != 'ipex' and extra != 'tensorrt-llm' and extra != 'llama-cpp' and extra != 'py-txi'",
105-
]
106103
llama-cpp = ["llama-cpp-python"]
107104
py-txi = ["py-txi"]
105+
vllm = ["vllm"]
108106
# optional dependencies
109107
sentence-transformers = ["sentence-transformers"]
110108
gptqmodel = ["gptqmodel", "optimum"]

0 commit comments

Comments (0)