Skip to content

Commit 10bdded

Browse files
Hardcoded Triton Runtime Image in Triton testsuite (#853)
* Hardcoded triton image
* fixed ns name
* [pre-commit.ci] auto fixes from pre-commit.com hooks (for more information, see https://pre-commit.ci)
* Update TRITON_IMAGE version to 24.10-py3
* Changed image version
* added smoke marker

---------

Co-authored-by: pre-commit-ci[bot] <66853113+pre-commit-ci[bot]@users.noreply.github.com>
1 parent a681def commit 10bdded

File tree

4 files changed

+10 -3 lines changed

4 files changed

+10 -3 lines changed

tests/conftest.py

Lines changed: 4 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -312,10 +312,12 @@ def mlserver_runtime_image(pytestconfig: pytest.Config) -> str | None:
312312

313313

314314
@pytest.fixture(scope="session")
315-
def triton_runtime_image(pytestconfig: pytest.Config) -> str | None:
315+
def triton_runtime_image(pytestconfig: pytest.Config) -> str:
316+
from tests.model_serving.model_runtime.triton.constant import TRITON_IMAGE
317+
316318
runtime_image = pytestconfig.option.triton_runtime_image
317319
if not runtime_image:
318-
return None
320+
return TRITON_IMAGE
319321
return runtime_image
320322

321323

tests/model_serving/model_runtime/triton/basic_model_deployment/test_pytorch_model.py

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -31,6 +31,7 @@
3131
)
3232

3333

34+
@pytest.mark.sanity
3435
@pytest.mark.parametrize(
3536
("protocol", "model_namespace", "s3_models_storage_uri", "triton_serving_runtime", "triton_inference_service"),
3637
[

tests/model_serving/model_runtime/triton/constant.py

Lines changed: 4 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -30,6 +30,10 @@
3030
TRITON_REST_PORT: int = 8080
3131
TRITON_GRPC_PORT: int = 9000
3232

33+
34+
TRITON_IMAGE: str = "nvcr.io/nvidia/tritonserver:24.10-py3"
35+
36+
3337
MODEL_PATH_PREFIX_KERAS: str = "triton_resnet/model_repository"
3438
MODEL_PATH_PREFIX: str = "triton/model_repository"
3539
MODEL_PATH_PREFIX_DALI: str = "triton_gpu/model_repository"

tests/model_serving/model_runtime/vllm/basic_model_deployment/test_granite_2b_instruct_preview_4k_r240917a.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -15,7 +15,7 @@
1515
"model_namespace, s3_models_storage_uri, serving_runtime, vllm_inference_service",
1616
[
1717
pytest.param(
18-
{"name": "granite-serverless-raw"},
18+
{"name": "granite-raw"},
1919
{"model-dir": "granite-2b-instruct-preview-4k-r240917a"},
2020
{"deployment_type": KServeDeploymentType.RAW_DEPLOYMENT},
2121
{

0 commit comments

Comments
 (0)