NVIDIA · visheshtanksale · May 30, 2025 · May 30, 2025 · May 30, 2025 · May 30, 2025
@@ -127,7 +127,7 @@ type ModelSpec struct {
 	Profiles []string `json:"profiles,omitempty"`
 	// Precision is the precision for model quantization
 	Precision string `json:"precision,omitempty"`
-	// Engine is the backend engine (tensort_llm, vllm)
+	// Engine is the backend engine (tensorrt_llm, vllm)
 	Engine string `json:"engine,omitempty"`
 	// TensorParallelism is the minimum GPUs required for the model computations
 	TensorParallelism string `json:"tensorParallelism,omitempty"`

@@ -344,7 +344,7 @@ spec:
                               GPUs
                             type: boolean
                           engine:
-                            description: Engine is the backend engine (tensort_llm,
+                            description: Engine is the backend engine (tensorrt_llm,
                               vllm)
                             type: string
                           gpus:

@@ -344,7 +344,7 @@ spec:
                               GPUs
                             type: boolean
                           engine:
-                            description: Engine is the backend engine (tensort_llm,
+                            description: Engine is the backend engine (tensorrt_llm,
                               vllm)
                             type: string
                           gpus:

@@ -344,7 +344,7 @@ spec:
                               GPUs
                             type: boolean
                           engine:
-                            description: Engine is the backend engine (tensort_llm,
+                            description: Engine is the backend engine (tensorrt_llm,
                               vllm)
                             type: string
                           gpus:

@@ -80,10 +80,22 @@ func (manifest NIMManifest) MatchProfiles(modelSpec appsv1alpha1.ModelSpec, disc
 
 		// Determine backend type
 		backend := profile.Tags["llm_engine"]
+
+		// Use "model_type" if "llm_engine" is empty for non LLM models
+		if backend == "" {
+			backend = profile.Tags["model_type"]
+		}
+
+		// Fallback to deprecated "backend" tag for non LLM Models
 		if backend == "" {
 			backend = profile.Tags["backend"]
 		}
 
+		// modespec.Engine value can be "tensorrt_llm". If backend tag is "triton", convert it to "tensorrt".
+		if backend == "triton" {
+			backend = "tensorrt"
+		}
+
 		if modelSpec.Engine != "" && !strings.Contains(backend, strings.TrimSuffix(modelSpec.Engine, "_llm")) {
 			continue
 		}