albumentations-team
diff --git a/README.md b/README.md
Lines changed: 46 additions & 12 deletions
diff --git a/benchmark/cli.py b/benchmark/cli.py
Lines changed: 38 additions & 1 deletion
diff --git a/benchmark/runner.py b/benchmark/runner.py
Lines changed: 18 additions & 0 deletions
@@ -46,10 +46,6 @@ This benchmark suite measures the throughput and performance characteristics of
 
 The image benchmarks compare the performance of various libraries on standard image transformations. All benchmarks are run on a single CPU thread to ensure consistent and comparable results.
 
-[**Detailed Image Benchmark Results**](docs/images/README.md)
-
-![Image Speedup Analysis](docs/images/images_speedup_analysis.webp)
-
 <!-- IMAGE_BENCHMARK_TABLE_START -->
 | Transform            | albumentationsx 2.0.18 [img/s]   | kornia 0.8.2 [img/s]   | torchvision 0.25.0 [img/s]   | Speedup (albx/fastest other)   |
 |:---------------------|:---------------------------------|:-----------------------|:-----------------------------|:-------------------------------|
@@ -105,13 +101,55 @@ The image benchmarks compare the performance of various libraries on standard im
 | VerticalFlip         | **27128 ± 1197**                 | 2387 ± 58              | 26928 ± 4799                 | 1.01x                          |
 <!-- IMAGE_BENCHMARK_TABLE_END -->
 
-### Video Benchmarks
+### Multi-Channel Image Benchmarks (9ch)
 
-The video benchmarks compare CPU-based processing (AlbumentationsX) with GPU-accelerated processing (Kornia) for video transformations. The benchmarks use the [UCF101 dataset](https://www.crcv.ucf.edu/data/UCF101.php), which contains realistic videos from 101 action categories.
+These benchmarks run on 9-channel images (the RGB source image stacked 3x) to test OpenCV chunking and library support for images with more than 4 channels.
+
+<!-- MULTICHANNEL_BENCHMARK_TABLE_START -->
+| Transform            | albumentationsx 2.0.18 [img/s]   | kornia 0.8.2 [img/s]   | torchvision 0.25.0 [img/s]   | Speedup (albx/fastest other)   |
+|:---------------------|:---------------------------------|:-----------------------|:-----------------------------|:-------------------------------|
+| Affine               | **640 ± 6**                      | 228 ± 3                | 143 ± 3                      | 2.81x                          |
+| AutoContrast         | **428 ± 8**                      | 374 ± 3                | -                            | 1.14x                          |
+| Blur                 | **2418 ± 154**                   | 186 ± 3                | -                            | 12.97x                         |
+| Brightness           | **3650 ± 162**                   | 1350 ± 40              | -                            | 2.70x                          |
+| CenterCrop128        | 51247 ± 435                      | -                      | **223574 ± 5049**            | 0.23x                          |
+| ChannelDropout       | **6387 ± 176**                   | 2179 ± 95              | -                            | 2.93x                          |
+| ChannelShuffle       | **2427 ± 164**                   | 929 ± 25               | 1600 ± 41                    | 1.52x                          |
+| Contrast             | **3837 ± 368**                   | 1346 ± 31              | -                            | 2.85x                          |
+| CornerIllumination   | **203 ± 2**                      | 181 ± 3                | -                            | 1.12x                          |
+| Erasing              | **9956 ± 359**                   | 426 ± 10               | 4321 ± 384                   | 2.30x                          |
+| GaussianBlur         | **746 ± 9**                      | 188 ± 2                | 49 ± 6                       | 3.97x                          |
+| GaussianIllumination | **240 ± 2**                      | 212 ± 15               | -                            | 1.13x                          |
+| GaussianNoise        | **95 ± 3**                       | 65 ± 0                 | -                            | 1.45x                          |
+| HorizontalFlip       | 2531 ± 234                       | 2286 ± 557             | **15102 ± 3640**             | 0.17x                          |
+| Invert               | 10141 ± 2159                     | 2774 ± 169             | **15806 ± 3070**             | 0.64x                          |
+| LinearIllumination   | 140 ± 1                          | **491 ± 12**           | -                            | 0.29x                          |
+| LongestMaxSize       | 350 ± 1                          | **376 ± 2**            | -                            | 0.93x                          |
+| MotionBlur           | **1443 ± 56**                    | 63 ± 1                 | -                            | 22.95x                         |
+| Normalize            | 387 ± 5                          | **1402 ± 64**          | 795 ± 22                     | 0.28x                          |
+| OpticalDistortion    | **457 ± 8**                      | 157 ± 4                | -                            | 2.91x                          |
+| Pad                  | 8358 ± 319                       | -                      | **9112 ± 704**               | 0.92x                          |
+| Perspective          | **579 ± 2**                      | 149 ± 1                | 129 ± 2                      | 3.90x                          |
+| PlasmaBrightness     | **83 ± 1**                       | 24 ± 1                 | -                            | 3.44x                          |
+| PlasmaContrast       | **68 ± 0**                       | 24 ± 1                 | -                            | 2.82x                          |
+| PlasmaShadow         | 125 ± 1                          | **224 ± 2**            | -                            | 0.56x                          |
+| Posterize            | 4375 ± 187                       | 317 ± 16               | **12018 ± 1989**             | 0.36x                          |
+| RandomCrop128        | 49313 ± 715                      | 2566 ± 75              | **124539 ± 2345**            | 0.40x                          |
+| RandomGamma          | **4383 ± 62**                    | 83 ± 0                 | -                            | 53.12x                         |
+| RandomResizedCrop    | **369 ± 12**                     | 309 ± 2                | 297 ± 3                      | 1.19x                          |
+| Resize               | 287 ± 4                          | **297 ± 3**            | 194 ± 1                      | 0.97x                          |
+| Rotate               | **1713 ± 27**                    | 172 ± 1                | 152 ± 10                     | 9.96x                          |
+| Sharpen              | **713 ± 9**                      | 140 ± 6                | -                            | 5.09x                          |
+| Shear                | **642 ± 11**                     | 250 ± 2                | 163 ± 6                      | 2.57x                          |
+| SmallestMaxSize      | **253 ± 4**                      | 187 ± 3                | -                            | 1.35x                          |
+| Solarize             | **4220 ± 26**                    | 339 ± 4                | 456 ± 11                     | 9.26x                          |
+| ThinPlateSpline      | **73 ± 2**                       | 62 ± 0                 | -                            | 1.17x                          |
+| VerticalFlip         | 8698 ± 122                       | 2296 ± 118             | **15409 ± 890**              | 0.56x                          |
+<!-- MULTICHANNEL_BENCHMARK_TABLE_END -->
 
-[**Detailed Video Benchmark Results**](docs/videos/README.md)
+### Video Benchmarks
 
-![Video Speedup Analysis](docs/videos/videos_speedup_analysis.webp)
+The video benchmarks compare CPU-based processing (AlbumentationsX) with GPU-accelerated processing (Kornia) for video transformations. The benchmarks use the [UCF101 dataset](https://www.crcv.ucf.edu/data/UCF101.php), which contains realistic videos from 101 action categories.
 
 <!-- VIDEO_BENCHMARK_TABLE_START -->
 | Transform            | albumentationsx (video) 2.0.18 [vid/s]   | kornia (video) 0.8.0 [vid/s]   | torchvision (video) 0.21.0 [vid/s]   | Speedup (albx/fastest other)   |
@@ -310,10 +348,6 @@ The benchmark methodology is designed to ensure fair and reproducible comparison
 3. **Measurement Phase**: Multiple runs with statistical analysis
 4. **Environment Control**: Consistent thread settings and hardware utilization
 
-For detailed methodology, see the specific benchmark READMEs:
-- [Image Benchmark Methodology](docs/images/README.md#methodology)
-- [Video Benchmark Methodology](docs/videos/README.md#methodology)
-
 ## Contributing
 
 Contributions are welcome! If you'd like to add support for a new library, improve the benchmarking methodology, or fix issues, please submit a pull request.
 
@@ -39,6 +39,12 @@
     "kornia": "benchmark/transforms/kornia_impl.py",
 }
 
+_MULTICHANNEL_IMAGE_SPECS: dict[str, str] = {
+    "albumentationsx": "benchmark/transforms/albumentationsx_multichannel_impl.py",
+    "torchvision": "benchmark/transforms/torchvision_multichannel_impl.py",
+    "kornia": "benchmark/transforms/kornia_multichannel_impl.py",
+}
+
 _VIDEO_SPECS: dict[str, str] = {
     "albumentationsx": "benchmark/transforms/albumentationsx_video_impl.py",
     "torchvision": "benchmark/transforms/torchvision_video_impl.py",
@@ -125,6 +131,7 @@ def _run_single(
     repo_root: Path,
     transforms_filter: list[str] | None = None,
     verbose: bool = False,
+    num_channels: int = 3,
 ) -> None:
     python = _ensure_venv(library, media, repo_root)
 
@@ -153,6 +160,8 @@ def _run_single(
         cmd += ["--num-items", str(num_items)]
     if max_warmup is not None:
         cmd += ["--max-warmup", str(max_warmup)]
+    if num_channels != 3:
+        cmd += ["--num-channels", str(num_channels)]
 
     import os
 
@@ -225,6 +234,12 @@ def cmd_run(args: argparse.Namespace) -> None:
     output_dir = Path(args.output)
     output_dir.mkdir(parents=True, exist_ok=True)
 
+    # --multichannel: use 9ch specs, output to output/multichannel/
+    if getattr(args, "multichannel", False) and media == "image":
+        output_dir = output_dir / "multichannel"
+        output_dir.mkdir(parents=True, exist_ok=True)
+        args.num_channels = 9
+
     # ------------------------------------------------------------------
     # Cloud path: delegate the whole run to a GCP instance
     # ------------------------------------------------------------------
@@ -252,11 +267,15 @@ def cmd_run(args: argparse.Namespace) -> None:
             repo_root=repo_root,
             transforms_filter=args.transforms,
             verbose=args.verbose,
+            num_channels=args.num_channels,
         )
         return
 
     # Built-in libraries
-    spec_map = _VIDEO_SPECS if media == "video" else _IMAGE_SPECS
+    if getattr(args, "multichannel", False) and media == "image":
+        spec_map = _MULTICHANNEL_IMAGE_SPECS
+    else:
+        spec_map = _VIDEO_SPECS if media == "video" else _IMAGE_SPECS
     available = list(spec_map.keys())
 
     requested: list[str] = args.libraries or available
@@ -285,6 +304,7 @@ def cmd_run(args: argparse.Namespace) -> None:
             repo_root=repo_root,
             transforms_filter=args.transforms,
             verbose=args.verbose,
+            num_channels=args.num_channels,
         )
 
     logger.info("All benchmarks complete. Results in: %s", output_dir)
@@ -381,6 +401,23 @@ def build_parser() -> argparse.ArgumentParser:
     run_p.add_argument("--warmup-window", type=int, default=5)
     run_p.add_argument("--warmup-threshold", type=float, default=0.05)
     run_p.add_argument("--min-warmup-windows", type=int, default=3)
+    run_p.add_argument(
+        "--num-channels",
+        type=int,
+        default=3,
+        help=(
+            "Number of image channels (must be multiple of 3). Values > 3 stack the RGB source image "
+            "to synthesize multi-channel data, e.g. 9 for 3x stacked RGB (default: 3)"
+        ),
+    )
+    run_p.add_argument(
+        "--multichannel",
+        action="store_true",
+        help=(
+            "Use multi-channel specs (9ch) and output to <output>/multichannel/. "
+            "Implies --num-channels 9 for image mode."
+        ),
+    )
 
     # ------------------------------------------------------------------
     # compare
 
@@ -18,6 +18,7 @@
     get_library_versions,
     get_system_info,
     get_video_loader,
+    make_multichannel_loader,
     time_transform,
     verify_thread_settings,
 )
@@ -81,6 +82,7 @@ def __init__(
         warmup_window: int = 5,
         warmup_threshold: float = 0.05,
         min_warmup_windows: int = 3,
+        num_channels: int = 3,
     ):
         self.library = library
         self.data_dir = Path(data_dir)
@@ -106,8 +108,11 @@ def __init__(
 
         if media_type == MediaType.IMAGE:
             self._loader = get_image_loader(library)
+            if num_channels != 3:
+                self._loader = make_multichannel_loader(self._loader, num_channels)
         else:
             self._loader = get_video_loader(library)
+        self.num_channels = num_channels
 
     # ------------------------------------------------------------------
     # Media loading
@@ -131,6 +136,8 @@ def _load_images(self) -> list[Any]:
                     img_check = cv2.imread(str(path), cv2.IMREAD_UNCHANGED)
                     if img_check is None:
                         continue
+                    # Validate the on-disk image: it must have at least 3 channels.
+                    # The loader may later stack channels to produce num_channels > 3 in memory.
                     if img_check.ndim < 3 or img_check.shape[2] < 3:
                         continue
 
@@ -400,6 +407,7 @@ def run(self, output_path: Path | None = None) -> dict[str, Any]:
                 "warmup_window": self.warmup_window,
                 "warmup_threshold": self.warmup_threshold,
                 "min_warmup_windows": self.min_warmup_windows,
+                "num_channels": self.num_channels,
             },
         }
 
@@ -515,6 +523,15 @@ def main() -> None:
     parser.add_argument("--warmup-window", type=int, default=5, help="Window size for variance check")
     parser.add_argument("--warmup-threshold", type=float, default=0.05, help="Variance stability threshold")
     parser.add_argument("--min-warmup-windows", type=int, default=3, help="Minimum windows to check")
+    parser.add_argument(
+        "--num-channels",
+        type=int,
+        default=3,
+        help=(
+            "Number of image channels. Must be a multiple of 3. "
+            "Values > 3 stack the RGB image to synthesize multi-channel data (default: 3)"
+        ),
+    )
 
     args = parser.parse_args()
 
@@ -547,6 +564,7 @@ def main() -> None:
         warmup_window=args.warmup_window,
         warmup_threshold=args.warmup_threshold,
         min_warmup_windows=args.min_warmup_windows,
+        num_channels=args.num_channels,
     )
 
     runner.run(args.output)