44
55from __future__ import annotations
66
7- from collections .abc import Mapping
87from datetime import datetime
98from decimal import Decimal
109from typing import Any
6160 "AccessTokenOrder" ,
6261 "ActivateDeploymentInput" ,
6362 "ActivateRevisionInput" ,
64- "AddRevisionGQLInputDTO" ,
6563 "AddRevisionInput" ,
6664 "AdminSearchDeploymentsInput" ,
6765 "AdminSearchRevisionsInput" ,
6866 "AutoScalingRuleFilter" ,
6967 "AutoScalingRuleOrder" ,
7068 "BlueGreenConfigInput" ,
7169 "ClusterConfigInput" ,
72- "CreateRevisionInputDTO" ,
70+ "CreateRevisionInput" ,
7371 "CreateAccessTokenInput" ,
7472 "CreateAutoScalingRuleInput" ,
7573 "CreateDeploymentInput" ,
10199 "ResourceSlotEntryInput" ,
102100 "ResourceSlotInput" ,
103101 "RevisionFilter" ,
104- "RevisionInput" ,
105102 "RevisionOrder" ,
106103 "ReplaceDeploymentOptionsGQLInput" ,
107104 "ReplaceDeploymentOptionsInput" ,
@@ -257,9 +254,6 @@ class ModelRuntimeConfigInput(BaseRequestModel):
257254 " RuntimeVariant resolver service before invoking internal flows."
258255 ),
259256 )
260- inference_runtime_config : dict [str , Any ] | None = Field (
261- default = None , description = "Framework-specific inference runtime configuration"
262- )
263257 environ : EnvironmentVariablesInput | None = Field (
264258 default = None , description = "Environment variables for the service"
265259 )
@@ -295,10 +289,9 @@ class ExtraVFolderMountInput(BaseRequestModel):
295289 )
296290
297291
298- class CreateRevisionInputDTO (BaseRequestModel ):
292+ class CreateRevisionInput (BaseRequestModel ):
299293 """Input for a deployment revision (nested structure matching GQL CreateRevisionInput)."""
300294
301- name : str | None = Field (default = None , description = "Revision name" )
302295 revision_preset_id : DeploymentPresetID | None = Field (
303296 default = None ,
304297 description = "DeploymentRevisionPreset ID. When specified, preset values are used as defaults and can be overridden by explicitly provided fields." ,
@@ -330,19 +323,24 @@ class AddRevisionOptions(BaseRequestModel):
330323 )
331324
332325
333- class AddRevisionGQLInputDTO (BaseRequestModel ):
326+ class AddRevisionInput (BaseRequestModel ):
334327 """Input for adding a revision. Used by both GQL and REST v2 APIs."""
335328
336- name : str | None = Field (default = None , description = "Revision name" )
337329 revision_preset_id : DeploymentPresetID | None = Field (
338330 default = None ,
339331 description = "DeploymentRevisionPreset ID. When specified, preset values are used as defaults and can be overridden by explicitly provided fields." ,
340332 )
341333 deployment_id : UUID = Field (description = "Deployment ID" )
342- cluster_config : ClusterConfigInput = Field (description = "Cluster configuration" )
343- resource_config : ResourceConfigInput = Field (description = "Resource configuration" )
344- image : ImageInput = Field (description = "Container image" )
345- model_runtime_config : ModelRuntimeConfigInput = Field (description = "Runtime configuration" )
334+ cluster_config : ClusterConfigInput | None = Field (
335+ default = None , description = "Cluster configuration"
336+ )
337+ resource_config : ResourceConfigInput | None = Field (
338+ default = None , description = "Resource configuration"
339+ )
340+ image : ImageInput | None = Field (default = None , description = "Container image" )
341+ model_runtime_config : ModelRuntimeConfigInput | None = Field (
342+ default = None , description = "Runtime configuration"
343+ )
346344 model_mount_config : ModelMountConfigInput = Field (description = "Model mount configuration" )
347345 model_definition : ModelDefinitionInput | None = Field (
348346 default = None ,
@@ -447,40 +445,6 @@ class DeploymentStrategyInput(BaseRequestModel):
447445 )
448446
449447
450- class RevisionInput (BaseRequestModel ):
451- """Input for a deployment revision."""
452-
453- name : str | None = Field (default = None , description = "Revision name" )
454- revision_preset_id : DeploymentPresetID | None = Field (
455- default = None ,
456- description = "DeploymentRevisionPreset ID. When specified, preset values are used as defaults and can be overridden by explicitly provided fields." ,
457- )
458- image_id : UUID = Field (description = "Container image ID" )
459- cluster_mode : ClusterMode = Field (description = "Cluster mode for the revision" )
460- cluster_size : int = Field (default = 1 , ge = 1 , description = "Number of nodes in the cluster" )
461- resource_slots : Mapping [str , Any ] = Field (description = "Resource slot requirements" )
462- resource_opts : Mapping [str , Any ] | None = Field (
463- default = None , description = "Optional resource options"
464- )
465- runtime_variant_id : RuntimeVariantID = Field (description = "Runtime variant ID (UUID)" )
466- inference_runtime_config : dict [str , Any ] | None = Field (
467- default = None , description = "Framework-specific inference runtime configuration"
468- )
469- model_vfolder_id : VFolderUUID = Field (description = "Model VFolder ID" )
470- model_mount_destination : str = Field (
471- default = "/models" , description = "Mount destination for model vfolder"
472- )
473- model_definition_path : str = Field (description = "Path to model definition file" )
474- model_definition : ModelDefinitionInput | None = Field (
475- default = None ,
476- description = "Model definition to override the default values generated by the server" ,
477- )
478- extra_mounts : list [ExtraVFolderMountInput ] | None = Field (
479- default = None , description = "Additional vfolder mounts"
480- )
481- environ : Mapping [str , str ] | None = Field (default = None , description = "Environment variables" )
482-
483-
484448class CreateDeploymentInput (BaseRequestModel ):
485449 """Input for creating a deployment."""
486450
@@ -492,7 +456,7 @@ class CreateDeploymentInput(BaseRequestModel):
492456 description = "Deployment strategy configuration"
493457 )
494458 replica_count : int = Field (ge = 0 , description = "Number of replicas" )
495- initial_revision : CreateRevisionInputDTO | None = Field (
459+ initial_revision : CreateRevisionInput | None = Field (
496460 default = None ,
497461 description = "Initial revision configuration. If omitted, deployment is created without a revision and must be added later via add_revision." ,
498462 )
@@ -546,13 +510,6 @@ class ScaleDeploymentInput(BaseRequestModel):
546510 replicas : int = Field (ge = 0 , description = "Target replica count" )
547511
548512
549- class AddRevisionInput (BaseRequestModel ):
550- """Input for adding a revision to a deployment."""
551-
552- deployment_id : UUID = Field (description = "Deployment ID" )
553- revision : RevisionInput = Field (description = "Revision configuration" )
554-
555-
556513# ---------------------------------------------------------------------------
557514# Filter types
558515# ---------------------------------------------------------------------------
0 commit comments