Skip to content

Commit ec69c25

Browse files
author
YourUsername
committed
fix served_model_name (report it as model_name in app metadata when set; wrap each served name in a BaseModelPath)
1 parent 41cbb43 commit ec69c25

File tree

2 files changed

+6
-2
lines changed

2 files changed

+6
-2
lines changed

matrix/app_server/app_api.py

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -341,6 +341,7 @@ def get_app_metadata(
341341

342342
prefix = app["route_prefix"].strip("/") # type: ignore
343343
model = app["args"].get("model") # type: ignore
344+
served_model_name = app["args"].get("served_model_name") # type: ignore
344345
deployment_name = app["deployments"][0]["name"] # type: ignore
345346
use_grpc = "GrpcDeployment" in deployment_name
346347

@@ -368,7 +369,7 @@ def get_app_metadata(
368369
"http_port": http_port,
369370
"grpc_port": grpc_port,
370371
"route_prefix": prefix,
371-
"model_name": model,
372+
"model_name": served_model_name if served_model_name else model,
372373
"deployment_name": deployment_name,
373374
"use_grpc": use_grpc,
374375
"endpoint_template": endpoint_template,

matrix/app_server/llm/ray_serve_vllm.py

Lines changed: 4 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -209,7 +209,10 @@ def create_openai(
209209
"response_role": self.response_role,
210210
}
211211
if self.engine_args.served_model_name is not None:
212-
base_model_paths = self.engine_args.served_model_name
212+
base_model_paths = [
213+
BaseModelPath(name=name, model_path=self.engine_args.model)
214+
for name in self.engine_args.served_model_name
215+
]
213216
else:
214217
if has_base_model_path:
215218
base_model_paths = [

0 commit comments

Comments
 (0)