fix typo on inferenceservice-config (kserve#4244)

spolti · web-flow · commit b4ddbd8c3604 · 2025-04-04T14:18:26.000+05:30
Signed-off-by: Filippe Spolti <fspolti@redhat.com>
Signed-off-by: Spolti <fspolti@redhat.com>
diff --git a/charts/kserve-resources/templates/configmap.yaml b/charts/kserve-resources/templates/configmap.yaml
@@ -42,7 +42,69 @@ data:
                 "defaultImageVersion": "latest"
             }
         }
+    # ====================================== ISVC CONFIGURATION ======================================
+    # Example - setting custom annotation
+     inferenceService: |-
+       {
+         "serviceAnnotationDisallowedList": [
+            "my.custom.annotation/1"
+         ],
+         "serviceLabelDisallowedList": [
+            "my.custom.label.1"
+         ]
+       }
+    # Example - setting custom annotation
+    inferenceService: |-
+      {
+        # ServiceAnnotationDisallowedList is a list of annotations that are not allowed to be propagated to Knative
+        # revisions, which prevents the reconciliation loop from being triggered if the annotations
+        # configured here are used.
+        # Default values are:
+        #  "autoscaling.knative.dev/min-scale",
+        #  "autoscaling.knative.dev/max-scale",
+        #  "internal.serving.kserve.io/storage-initializer-sourceuri",
+        #  "kubectl.kubernetes.io/last-applied-configuration"
+        # Any new value will be appended to the list.
+        "serviceAnnotationDisallowedList": [
+          "my.custom.annotation/1"
+        ],
+        # ServiceLabelDisallowedList is a list of labels that are not allowed to be propagated to Knative revisions,
+        # which prevents the reconciliation loop from being triggered if the labels configured here are used.
+        "serviceLabelDisallowedList": [
+          "my.custom.label.1"
+        ]
+      }
+    # Example - setting custom resource
+    inferenceService: |-
+      {
+        "resource": {
+          "cpuLimit": "1",
+          "memoryLimit": "2Gi",
+          "cpuRequest": "1",
+          "memoryRequest": "2Gi"
+        }
+      }
+    # Example - setting custom resource
+    inferenceService: |-
+      {
+        # resource contains the default resource configuration for the inference service.
+        # You can override this configuration by specifying the resources in the inference service yaml.
+        # If you want to leave the resource unbounded (limits and requests), you can set the value to null or ""
+        # or just remove the specific field from the config.
+        "resource": {
+           # cpuLimit is the limits.cpu to set for the inference service.
+           "cpuLimit": "1",
+
+           # memoryLimit is the limits.memory to set for the inference service.
+           "memoryLimit": "2Gi",
+
+           # cpuRequest is the requests.cpu to set for the inference service.
+           "cpuRequest": "1",
 
+           # memoryRequest is the requests.memory to set for the inference service.
+           "memoryRequest": "2Gi"
+        }
+      }
      # ====================================== STORAGE INITIALIZER CONFIGURATION ======================================
      # Example
      storageInitializer: |-
@@ -629,3 +691,10 @@ data:
         "memoryRequest": "{{ .Values.kserve.inferenceservice.resources.requests.memory }}"
       }
     }
+
+  opentelemetryCollector: |-
+    {
+      "scrapeInterval": "5s",
+      "metricReceiverEndpoint": "keda-otel-scaler.keda.svc:4317",
+      "metricScalerEndpoint": "keda-otel-scaler.keda.svc:4318"
+    }
diff --git a/config/configmap/inferenceservice.yaml b/config/configmap/inferenceservice.yaml
@@ -42,17 +42,17 @@ data:
            }
        }
     # ====================================== ISVC CONFIGURATION ======================================
-    # Example   
+    # Example - setting custom annotation  
      inferenceService: |-
-      {
-        "serviceAnnotationDisallowedList": [
-          "my.custom.annotation/1"  
-        ],
-        "serviceLabelDisallowedList": [
-          "my.custom.label.1"  
-        ]
+       {
+         "serviceAnnotationDisallowedList": [
+            "my.custom.annotation/1"  
+         ],
+         "serviceLabelDisallowedList": [
+            "my.custom.label.1"  
+         ]
        }
-    # Example of isvc configuration
+    # Example - setting custom annotation
     inferenceService: |-
       {
         # ServiceAnnotationDisallowedList is a list of annotations that are not allowed to be propagated to Knative 
@@ -72,7 +72,38 @@ data:
         "serviceLabelDisallowedList": [
           "my.custom.label.1"  
         ]
-      }  
+      } 
+    # Example - setting custom resource
+    inferenceService: |-
+      {
+        "resource": {
+          "cpuLimit": "1",
+          "memoryLimit": "2Gi",
+          "cpuRequest": "1",
+          "memoryRequest": "2Gi"
+        }
+      }
+    # Example - setting custom resource
+    inferenceService: |-
+      {
+        # resource contains the default resource configuration for the inference service.
+        # You can override this configuration by specifying the resources in the inference service yaml.
+        # If you want to leave the resource unbounded (limits and requests), you can set the value to null or ""
+        # or just remove the specific field from the config.
+        "resource": {
+           # cpuLimit is the limits.cpu to set for the inference service.
+           "cpuLimit": "1",
+    
+           # memoryLimit is the limits.memory to set for the inference service.
+           "memoryLimit": "2Gi",
+    
+           # cpuRequest is the requests.cpu to set for the inference service.
+           "cpuRequest": "1",
+    
+           # memoryRequest is the requests.memory to set for the inference service.
+           "memoryRequest": "2Gi"
+        }
+      }
     # ====================================== MultiNode CONFIGURATION ======================================
     # Example   
     multiNode: |-
@@ -566,38 +597,6 @@ data:
          # This is to disable localmodel pv and pvc management for namespaces without isvcs
          "disableVolumeManagement": false
        }
-      
-     # ====================================== LOCALMODEL CONFIGURATION ======================================
-     # Example
-     inferenceservice: |-
-       {
-         "resource": {
-             "cpuLimit": "1",
-             "memoryLimit": "2Gi",
-             "cpuRequest": "1",
-             "memoryRequest": "2Gi"
-           }
-       }
-      inferenceservice: |-
-        {
-          # resource contains the default resource configuration for the inference service.
-          # you can override this configuration by specifying the resources in the inference service yaml.
-          # If you want to unbound the resource (limits and requests), you can set the value to null or "" 
-          # or just remove the specific field from the config.
-          "resource": {
-              # cpuLimit is the limits.cpu to set for the inference service.
-              "cpuLimit": "1",
-              
-              # memoryLimit is the limits.memory to set for the inference service.
-              "memoryLimit": "2Gi",
-              
-              # cpuRequest is the requests.cpu to set for the inference service.
-              "cpuRequest": "1",
-              
-              # memoryRequest is the requests.memory to set for the inference service.
-              "memoryRequest": "2Gi"
-            }
-        }
 
   explainers: |-
     {