Commits (50)
e035171
add NPU env var
ajagadi1 Sep 26, 2025
90a85d8
added npu and cpu pipelines
ajagadi1 Sep 28, 2025
1fc8534
added npu and cpu pipelines for all apps
ajagadi1 Sep 28, 2025
22f844d
updated worker safety docs
ajagadi1 Sep 29, 2025
27dc24b
updated weld porosity docs
ajagadi1 Sep 29, 2025
e4ff787
update weld docs
ajagadi1 Sep 29, 2025
47e4ca9
updated docs for pcb
ajagadi1 Sep 29, 2025
ab05537
added cpu, gpu and npu pipelines for smart parking
ajagadi1 Oct 7, 2025
6930be0
updated docs for smart parking
ajagadi1 Oct 7, 2025
4cff8c9
updated smart parking pipelines
ajagadi1 Oct 7, 2025
58a1bbc
added gpu pipeline for loitering detection
ajagadi1 Oct 7, 2025
91687f6
Merge branch 'main' of https://github.com/open-edge-platform/edge-ai-…
ajagadi1 Oct 8, 2025
1e1b837
Update config.json to use the correct device for NPU pipelines (#771)
sairampillai Oct 9, 2025
a487baf
[Metro AI Suite] Update smart parking with yolov11s model (#814)
ajagadi1 Oct 15, 2025
83c618a
updated model paths (#817)
ajagadi1 Oct 16, 2025
dd584c9
Update loitering detection model from FP32 to FP16 (#822)
ajagadi1 Oct 16, 2025
984f982
Loitering detection: add cpu gpu and npu docs (#844)
ajagadi1 Oct 23, 2025
841842d
Add benchmarking mode for loitering-detection
sairampillai Oct 23, 2025
21c462d
Add benchmarking mode for smart-parking
sairampillai Oct 23, 2025
9f9cfe9
removing duplicated overlay on the final frame (#864)
deepaks2 Oct 24, 2025
9bc6eae
Merge branch 'magic9-manufacturing-metro-vision-apps' into sairampill…
deepaks2 Oct 24, 2025
70fcb46
Update benchmark script for looped video and benchmark payload
sairampillai Oct 24, 2025
66c032e
Add npu payload
sairampillai Oct 24, 2025
c7cf541
Update benchmarking logic inline with WSF
sairampillai Oct 27, 2025
7ade5f4
Merge main
sairampillai Oct 27, 2025
0801351
Merge branch 'main' of https://github.com/open-edge-platform/edge-ai-…
sairampillai Oct 27, 2025
7c2cfc7
Fix failing CI for docs
sairampillai Oct 27, 2025
9e8153a
Fix another CI and merge conflict reversal
sairampillai Oct 27, 2025
2760560
Merge branch 'main' into sairampillai/metro-m9-benchmarking
sairampillai Oct 27, 2025
92f10f4
Merge branch 'main' into sairampillai/metro-m9-benchmarking
sairampillai Oct 28, 2025
867d3bd
Update docs
sairampillai Oct 28, 2025
8f88005
Update how-to-use-cpu-for-inference.md to fix CI
sairampillai Oct 28, 2025
f4e8bf1
Remove benchmarking pipelines
sairampillai Oct 29, 2025
7bab047
Merge branch 'sairampillai/metro-m9-benchmarking' of https://github.c…
sairampillai Oct 29, 2025
9141720
Update and refactor payload files
sairampillai Oct 29, 2025
56f632b
Update benchmark script to take in refactored payload file and pipeline
sairampillai Oct 29, 2025
1a1b1d0
Update documentation
sairampillai Oct 29, 2025
928d5ac
Merge branch 'main' into sairampillai/metro-m9-benchmarking
sairampillai Oct 29, 2025
be1a0a5
Merge branch 'main' into sairampillai/metro-m9-benchmarking
sairampillai Oct 29, 2025
a60bf38
Merge branch 'main' into sairampillai/metro-m9-benchmarking
sairampillai Oct 30, 2025
c2c26bb
Update default pipeline parameters
deepaks2 Oct 31, 2025
ca062c9
Update smart-parking default pipeline parameters
deepaks2 Oct 31, 2025
d219dff
Update docs
deepaks2 Oct 31, 2025
119c0b6
Merge branch 'main' into sairampillai/metro-m9-benchmarking
sairampillai Oct 31, 2025
cee51f9
Merge branch 'main' into sairampillai/metro-m9-benchmarking
sairampillai Oct 31, 2025
de7797c
Add device group rules for gpu support
tejaswinijayashanker943 Oct 31, 2025
aadb4c7
Add GPU pipelines
tejaswinijayashanker943 Oct 31, 2025
d07a9d0
Update sample scripts for smart-intersection
tejaswinijayashanker943 Oct 31, 2025
2f489b8
Merge branch 'sairampillai/metro-m9-benchmarking' into sairam/metro-s…
sairampillai Oct 31, 2025
28855dd
Merge branch 'main' into sairam/metro-smart-intersection-gpu
sairampillai Nov 4, 2025
486 changes: 486 additions & 0 deletions metro-ai-suite/metro-vision-ai-app-recipe/benchmark_start.sh

Large diffs are not rendered by default.

@@ -164,8 +164,16 @@ services:
      - scenescape
    privileged: true
    entrypoint: ["./run.sh"]
    group_add:
      - "109"
      - "110"
      - "992"
    device_cgroup_rules:
      - 'c 189:* rmw'
      - 'c 209:* rmw'
      - 'a 189:* rwm'
    devices:
      - "/dev/dri:/dev/dri"
      - "/dev:/dev"
    depends_on:
      - broker
      - ntpserver
@@ -0,0 +1,80 @@
[
    {
        "pipeline": "object_tracking_cpu",
        "payload":{
            "source": {
                "uri": "file:///home/pipeline-server/videos/VIRAT_S_000101_looped.mp4",
                "type": "uri"
            },
            "destination": {
                "metadata": {
                    "type": "mqtt",
                    "topic": "object_tracking_$x",
                    "publish_frame":false
                },
                "frame": {
                    "type": "webrtc",
                    "peer-id": "object_tracking_$x"
                }
            },
            "parameters": {
                "detection-properties": {
                    "model": "/home/pipeline-server/models/intel/pedestrian-and-vehicle-detector-adas-0001/FP16/pedestrian-and-vehicle-detector-adas-0001.xml",
                    "device": "CPU"
                }
            }
        }
    },
    {
        "pipeline": "object_tracking_gpu",
        "payload":{
            "source": {
                "uri": "file:///home/pipeline-server/videos/VIRAT_S_000101_looped.mp4",
                "type": "uri"
            },
            "destination": {
                "metadata": {
                    "type": "mqtt",
                    "topic": "object_tracking_$x",
                    "publish_frame":false
                },
                "frame": {
                    "type": "webrtc",
                    "peer-id": "object_tracking_$x"
                }
            },
            "parameters": {
                "detection-properties": {
                    "model": "/home/pipeline-server/models/intel/pedestrian-and-vehicle-detector-adas-0001/FP16/pedestrian-and-vehicle-detector-adas-0001.xml",
                    "device": "GPU"
                }
            }
        }
    },
    {
        "pipeline": "object_tracking_npu",
        "payload":{
            "source": {
                "uri": "file:///home/pipeline-server/videos/VIRAT_S_000101_looped.mp4",
                "type": "uri"
            },
            "destination": {
                "metadata": {
                    "type": "mqtt",
                    "topic": "object_tracking_$x",
                    "publish_frame":false
                },
                "frame": {
                    "type": "webrtc",
                    "peer-id": "object_tracking_$x"
                }
            },
            "parameters": {
                "detection-properties": {
                    "model": "/home/pipeline-server/models/intel/pedestrian-and-vehicle-detector-adas-0001/FP16/pedestrian-and-vehicle-detector-adas-0001.xml",
                    "device": "NPU"
                }
            }
        }
    }
]
@@ -0,0 +1,140 @@
# How to Benchmark Performance

This document provides instructions on how to run performance benchmarks for the Vision AI applications using the provided benchmarking script. The script determines the maximum number of concurrent video streams a system can process (the stream density) while maintaining a target performance level.

## Prerequisites

- The `edge-ai-suites` repository must be cloned to your system.

## Step 1: Understand the Benchmarking Script

The core of the benchmarking process is the `benchmark_start.sh` script, located in the `metro-vision-ai-app-recipe/` directory. This script automates starting video streams, monitoring their performance in frames per second (FPS), and calculating key performance indicators (KPIs) to find the maximum sustainable stream density.

### Stream Density Logic

The script uses a binary search algorithm to efficiently find the optimal stream count within a given range (`lower_bound` and `upper_bound`). Here is a summary of the logic from the `benchmark_start.sh` script:

1. **Initialization:** The script starts with a lower bound (`lns`) and an upper bound (`uns`) for the number of streams. The current number of streams to test (`ns`) is initialized to the lower bound. A variable (`tns`) tracks the highest successful stream count found so far.

2. **Binary Search Loop:** The script iterates until the range between the lower and upper bounds is 1, and both bounds have been tested. In each iteration:
* It runs a workload with the current number of streams (`ns`).
* It measures the `throughput min` (the lowest FPS achieved among all streams) and compares it to the `target_fps`.

3. **Adjusting the Range:**
* **If Performance Target is NOT Met** (`throughput min` < `target_fps`): The current stream count (`ns`) is too high. It becomes the new upper bound (`uns = ns`). The next stream count to test is calculated as the midpoint between the old lower bound and this new upper bound.
* **If Performance Target is Met** (`throughput min` >= `target_fps`): The system can handle this workload. The current stream count (`ns`) becomes the new lower bound (`lns = ns`), and the highest successful stream count (`tns`) is updated. The next stream count to test is calculated as the midpoint between this new lower bound and the old upper bound.

4. **Convergence:** This process of testing midpoints and narrowing the search range continues until the loop condition is met. The final value of `tns` represents the highest number of streams that successfully met the performance target, which is reported as the final stream density.
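
The following is a simplified sketch of this search loop, assuming a hypothetical `run_workload` helper that launches the requested number of streams and returns the measured `throughput min`. It is illustrative only and omits details such as ensuring both bounds get tested, which the real script handles:

```bash
# Illustrative sketch only -- not the actual benchmark_start.sh internals.
lns=1; uns=16; target_fps=15   # lower bound, upper bound, target FPS
tns=0                          # highest stream count that met the target
ns=$lns                        # stream count to test next
while true; do
    min_fps=$(run_workload "$ns")   # hypothetical: start $ns streams, return min FPS
    if (( $(echo "$min_fps < $target_fps" | bc -l) )); then
        uns=$ns                     # target missed: ns becomes the new upper bound
    else
        lns=$ns; tns=$ns            # target met: record success, raise the lower bound
    fi
    (( uns - lns <= 1 )) && break   # bounds are adjacent: search has converged
    ns=$(( (lns + uns) / 2 ))       # test the midpoint next
done
echo "stream density: $tns"
```

For example, with `-l 1 -u 16`, a run where 8 streams meet the target but 12 do not would test 10 next, then 9, converging in a handful of iterations instead of sixteen.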

### Average FPS Calculation

During each test run, the script logs the `avg_fps` of every active pipeline instance at regular intervals. At the end of the run, an `awk` script processes these logs to calculate several KPIs from the FPS samples collected for each stream:

- **Percentile Throughput:** A specific percentile (e.g., the 90th) of the FPS values, used to discount outliers.
- **Average Throughput:** The mean FPS across all streams.
- **Median Throughput:** The median FPS value.
- **Cumulative Throughput:** The sum of the FPS from all streams.
- **Min Throughput:** The lowest (worst-case) FPS achieved among all streams. This value is critical for the stream density calculation.
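
As a rough illustration of how such KPIs can be computed, the snippet below derives them with `awk` from a file containing one average-FPS value per stream. The file name, input format, and percentile choice here are assumptions for the sketch, not the script's actual internals:

```bash
# Illustrative sketch: one FPS value per line in fps_samples.txt.
sort -n fps_samples.txt | awk '
{ v[NR] = $1; sum += $1 }
END {
    n = NR
    printf "throughput cumulative: %.2f\n", sum
    printf "throughput average: %.2f\n", sum / n
    # Median: middle value, or the mean of the two middle values.
    med = (n % 2) ? v[(n + 1) / 2] : (v[n / 2] + v[n / 2 + 1]) / 2
    printf "throughput median: %.2f\n", med
    # 90th percentile by the nearest-rank method.
    idx = int(0.9 * n); if (idx < 1) idx = 1
    printf "throughput 90th percentile: %.2f\n", v[idx]
    # Input is sorted ascending, so the first value is the minimum.
    printf "throughput min: %.2f\n", v[1]
}'
```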

## Step 2: Prepare for Benchmarking

1. **Set Up and Start the Application:** Before running the benchmark, you must set up and start the desired application (e.g., Loitering Detection). This ensures all services, including the DL Streamer Pipeline Server, are running and available. For setup instructions, please refer to the `get-started.md` guide located in the specific application's documentation folder (e.g., `loitering-detection/docs/user-guide/`).

2. **Navigate to Script Directory:** Open a terminal and navigate to the `metro-vision-ai-app-recipe` directory.

   ```bash
   cd edge-ai-suites/metro-ai-suite/metro-vision-ai-app-recipe/
   ```

3. **Stop Existing Pipelines:** Ensure no other pipelines are running before you start the benchmark. You can stop any running pipelines with the `sample_stop.sh` script.

   ```bash
   ./sample_stop.sh
   ```

## Step 3: Run the Benchmark

The `benchmark_start.sh` script requires a pipeline name and stream count boundaries to run. The available pipelines are defined in the `benchmark_app_payload.json` file located within each application's directory (e.g., `loitering-detection/`).

<details>
<summary>Example Payload with Detection Parameters</summary>

The `benchmark_app_payload.json` file contains an array of pipeline configurations. Each configuration specifies the pipeline name and a payload with parameters for source, destination, and AI models. The script uses the pipeline name to select the corresponding payload for benchmarking.
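
For instance, the payload that corresponds to a given pipeline name could be pulled out manually with a `jq` one-liner like the following. This is a sketch only; it assumes `jq` is installed and that the command is run from the application's directory:

```bash
# Hypothetical: print the payload for one pipeline from the payload array.
jq '.[] | select(.pipeline == "object_tracking_cpu") | .payload' benchmark_app_payload.json
```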

Here is an example of a GPU pipeline configuration whose `detection-properties` include additional tuning parameters (inference interval, batch size, number of inference requests, and so on):

```json
{
    "pipeline": "object_tracking_gpu",
    "payload": {
        "source": {
            "uri": "file:///home/pipeline-server/videos/VIRAT_S_000101_looped.mp4",
            "type": "uri"
        },
        "destination": {
            "metadata": {
                "type": "mqtt",
                "topic": "object_tracking_$x",
                "publish_frame": false
            },
            "frame": {
                "type": "webrtc",
                "peer-id": "object_tracking_$x"
            }
        },
        "parameters": {
            "detection-properties": {
                "model": "/home/pipeline-server/models/intel/pedestrian-and-vehicle-detector-adas-0001/FP16/pedestrian-and-vehicle-detector-adas-0001.xml",
                "device": "GPU",
                "inference-interval": 3,
                "inference-region": 0,
                "batch-size": 8,
                "nireq": 2,
                "ie-config": "NUM_STREAMS=2",
                "pre-process-backend": "va-surface-sharing",
                "threshold": 0.7
            }
        }
    }
}
```
</details>

### Example: Running Stream Density Benchmark for Loitering Detection

This example will find the maximum number of loitering detection streams that can run on the CPU while maintaining at least 15 FPS.

1. Execute the `benchmark_start.sh` script, providing the desired pipeline name (`object_tracking_cpu` in this case). Here, we test a range of 1 to 16 streams.

   ```bash
   # Usage: ./benchmark_start.sh -p <pipeline_name> -l <lower_bound> -u <upper_bound> -t <target_fps>

   ./benchmark_start.sh -p object_tracking_cpu -l 1 -u 16 -t 15
   ```

2. The script will output its progress as it tests different stream counts. The final output will show the optimal stream density found.

   ```text
   ✅ FINAL RESULT: Stream-Density Benchmark Completed!
   stream density: 8
   ======================================================

   KPIs for the optimal configuration (8 streams):
   throughput #1: 29.98
   throughput #2: 29.98
   ...
   throughput #8: 29.98
   throughput median: 29.98
   throughput average: 29.98
   throughput stdev: 0
   throughput cumulative: 239.84
   throughput min: 29.98
   ```

## Step 4: Stop the Benchmark

After the benchmark is complete, or if you need to stop it manually, use the `sample_stop.sh` script. This will delete all running pipeline instances.

```bash
./sample_stop.sh
```
@@ -1,15 +1,14 @@
# How to use CPU for inference

## CPU specific element properties

DL Streamer inference elements also provide properties such as `device=CPU` and `pre-process-backend=opencv` to run inference and pre-processing on the CPU. See the DL Streamer [docs](https://dlstreamer.github.io/dev_guide/model_preparation.html#model-pre-and-post-processing) for more details.
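
As a minimal, standalone illustration of these properties (not one of the application's shipped pipelines; the file paths are placeholders), a DL Streamer launch on the CPU could look like:

```sh
# Illustrative only: CPU inference with OpenCV pre-processing.
gst-launch-1.0 filesrc location=/path/to/video.mp4 ! decodebin ! \
  gvadetect model=/path/to/model.xml device=CPU pre-process-backend=opencv ! \
  gvafpscounter ! fakesink
```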

## Tutorial on how to use CPU specific pipelines
### Tutorial on how to use CPU specific pipelines

The pipeline `object_tracking_cpu` in [pipeline-server-config](../../src/dlstreamer-pipeline-server/config.json) contains CPU-specific elements and uses the CPU backend for inference. Start the pipeline as follows:

```sh
./sample_start.sh cpu
```

Go to grafana as explained in [get-started](./get-started.md) to view the dashboard.
Go to grafana as explained in [get-started](./get-started.md) to view the dashboard.
@@ -20,6 +20,7 @@ By utilizing cutting-edge technologies and pre-trained deep learning models, thi
how-to-customize-application
how-to-deploy-with-helm
how-to-deploy-with-edge-orchestrator
how-to-benchmark
how-to-view-telemetry-data
how-to-use-gpu-for-inference
how-to-use-cpu-for-inference
@@ -60,4 +60,4 @@
}
]
}
}
}
@@ -5,7 +5,7 @@
"name": "object_tracking_cpu",
"source": "gstreamer",
"queue_maxsize": 50,
"pipeline": "{auto_source} name=source ! decodebin force-sw-decoders=true ! gvaattachroi roi=0,200,300,400 ! gvadetect inference-region=1 model=/home/pipeline-server/models/intel/pedestrian-and-vehicle-detector-adas-0001/FP16/pedestrian-and-vehicle-detector-adas-0001.xml model_proc=/home/pipeline-server/models/intel/pedestrian-and-vehicle-detector-adas-0001/pedestrian-and-vehicle-detector-adas-0001.json device=CPU pre-process-backend=opencv model-instance-id=inst0 name=detection ! queue ! gvatrack tracking-type=short-term-imageless ! queue ! gvametaconvert add-empty-results=true name=metaconvert ! queue ! gvafpscounter ! appsink name=destination",
"pipeline": "{auto_source} name=source ! decodebin force-sw-decoders=true ! gvaattachroi roi=0,200,300,400 ! gvadetect inference-region=1 model=/home/pipeline-server/models/intel/pedestrian-and-vehicle-detector-adas-0001/FP16/pedestrian-and-vehicle-detector-adas-0001.xml model_proc=/home/pipeline-server/models/intel/pedestrian-and-vehicle-detector-adas-0001/pedestrian-and-vehicle-detector-adas-0001.json device=CPU pre-process-backend=opencv model-instance-id=inst0 inference-interval=3 threshold=0.7 name=detection ! queue ! gvatrack tracking-type=short-term-imageless ! queue ! gvametaconvert add-empty-results=true name=metaconvert ! queue ! gvafpscounter ! appsink name=destination",
"description": "Object detection with yolov8",
"parameters": {
"type": "object",
@@ -18,13 +18,14 @@
}
}
},

"auto_start": false
},
{
"name": "object_tracking_gpu",
"source": "gstreamer",
"queue_maxsize": 50,
"pipeline": "{auto_source} name=source ! parsebin ! vah264dec ! vapostproc ! video/x-raw(memory:VAMemory) ! gvaattachroi roi=0,200,300,400 ! gvadetect inference-region=1 model=/home/pipeline-server/models/intel/pedestrian-and-vehicle-detector-adas-0001/FP16/pedestrian-and-vehicle-detector-adas-0001.xml model_proc=/home/pipeline-server/models/intel/pedestrian-and-vehicle-detector-adas-0001/pedestrian-and-vehicle-detector-adas-0001.json device=GPU pre-process-backend=va-surface-sharing model-instance-id=instgpu0 name=detection ! queue ! gvatrack tracking-type=short-term-imageless ! queue ! gvametaconvert add-empty-results=true name=metaconvert ! queue ! gvafpscounter ! appsink name=destination",
"pipeline": "{auto_source} name=source ! parsebin ! vah264dec ! vapostproc ! video/x-raw(memory:VAMemory) ! gvaattachroi roi=0,200,300,400 ! gvadetect inference-region=1 inference-interval=3 batch-size=8 nireq=2 ie-config=\"NUM_STREAMS=2\" threshold=0.7 model=/home/pipeline-server/models/intel/pedestrian-and-vehicle-detector-adas-0001/FP16/pedestrian-and-vehicle-detector-adas-0001.xml model_proc=/home/pipeline-server/models/intel/pedestrian-and-vehicle-detector-adas-0001/pedestrian-and-vehicle-detector-adas-0001.json device=GPU pre-process-backend=va-surface-sharing model-instance-id=instgpu0 name=detection ! queue ! gvatrack tracking-type=short-term-imageless ! queue ! gvametaconvert add-empty-results=true name=metaconvert ! queue ! gvafpscounter ! appsink name=destination",
"description": "Object detection with yolov8",
"parameters": {
"type": "object",
@@ -43,7 +44,7 @@
"name": "object_tracking_npu",
"source": "gstreamer",
"queue_maxsize": 50,
"pipeline": "{auto_source} name=source ! parsebin ! vah264dec ! vapostproc ! video/x-raw(memory:VAMemory) ! gvaattachroi roi=0,200,300,400 ! gvadetect inference-region=1 model=/home/pipeline-server/models/intel/pedestrian-and-vehicle-detector-adas-0001/FP16/pedestrian-and-vehicle-detector-adas-0001.xml model_proc=/home/pipeline-server/models/intel/pedestrian-and-vehicle-detector-adas-0001/pedestrian-and-vehicle-detector-adas-0001.json device=NPU pre-process-backend=va model-instance-id=instnpu0 name=detection ! queue ! gvatrack tracking-type=short-term-imageless ! queue ! gvametaconvert add-empty-results=true name=metaconvert ! queue ! gvafpscounter ! appsink name=destination",
"pipeline": "{auto_source} name=source ! parsebin ! vah264dec ! vapostproc ! video/x-raw(memory:VAMemory) ! gvaattachroi roi=0,200,300,400 ! gvadetect inference-region=1 inference-interval=3 batch-size=1 nireq=4 threshold=0.7 model=/home/pipeline-server/models/intel/pedestrian-and-vehicle-detector-adas-0001/FP16/pedestrian-and-vehicle-detector-adas-0001.xml model_proc=/home/pipeline-server/models/intel/pedestrian-and-vehicle-detector-adas-0001/pedestrian-and-vehicle-detector-adas-0001.json device=NPU pre-process-backend=va model-instance-id=instnpu0 name=detection ! queue ! gvatrack tracking-type=short-term-imageless ! queue ! gvametaconvert add-empty-results=true name=metaconvert ! queue ! gvafpscounter ! appsink name=destination",
"description": "Object detection with yolov8",
"parameters": {
"type": "object",