Skip to content

Commit a2595fd

Browse files
authored
Allow creating a Ray cluster with reduced dependencies (#125)
* add verl as dependency
* lazy import
1 parent a0252c1 commit a2595fd

File tree

2 files changed

+15
-3
lines changed

2 files changed

+15
-3
lines changed

matrix/app_server/deploy_utils.py

Lines changed: 4 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -416,9 +416,6 @@ def get_yaml_for_deployment(
416416
):
417417
"""deploy helper function.
418418
Return modified applications and yaml for deployment"""
419-
from vllm.engine.arg_utils import AsyncEngineArgs
420-
421-
from matrix.app_server.llm.ray_serve_vllm import BaseDeployment
422419

423420
temp_dir = cluster_info.temp_dir
424421
cache_dir = setup_native_cache_dirs()
@@ -463,6 +460,10 @@ def get_yaml_for_deployment(
463460
app["max_replica"] = app["min_replica"]
464461

465462
if app_type in ["llm", "sglang_llm", "fastgen"]:
463+
from vllm.engine.arg_utils import AsyncEngineArgs
464+
465+
from matrix.app_server.llm.ray_serve_vllm import BaseDeployment
466+
466467
unknown = {
467468
k: v
468469
for k, v in app.items()

pyproject.toml

Lines changed: 11 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -162,6 +162,17 @@ classifiers=[
162162
"iopath",
163163
"jsonlines",
164164
]
165+
ray = [
166+
"submitit>=1.5.2",
167+
"ray[default,serve]>=2.48.0",
168+
"boto3",
169+
"google-genai>=1.13.0",
170+
"datasketch",
171+
"s3fs",
172+
"datasets",
173+
"iopath",
174+
"jsonlines",
175+
]
165176
# For video processing
166177
vision = [
167178
"submitit>=1.5.2",

0 commit comments

Comments
 (0)