cappelletto
diff --git a/‎CMakeLists.txt‎
Lines changed: 1 addition & 1 deletion b/‎CMakeLists.txt‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎configs/sample_config.yaml‎
Lines changed: 6 additions & 0 deletions b/‎configs/sample_config.yaml‎
Lines changed: 6 additions & 0 deletions
diff --git a/‎tests/CMakeLists.txt‎
Lines changed: 52 additions & 0 deletions b/‎tests/CMakeLists.txt‎
Lines changed: 52 additions & 0 deletions
diff --git a/‎tests/test_enhance_ops.cpp‎
Lines changed: 103 additions & 0 deletions b/‎tests/test_enhance_ops.cpp‎
Lines changed: 103 additions & 0 deletions
diff --git a/‎tests/test_enhance_stage.cpp‎
Lines changed: 32 additions & 0 deletions b/‎tests/test_enhance_stage.cpp‎
Lines changed: 32 additions & 0 deletions
diff --git a/‎tests/test_enhance_yaml.cpp‎
Lines changed: 49 additions & 0 deletions b/‎tests/test_enhance_yaml.cpp‎
Lines changed: 49 additions & 0 deletions
diff --git a/‎videostrip_cli/config_loader.cpp‎
Lines changed: 40 additions & 1 deletion b/‎videostrip_cli/config_loader.cpp‎
Lines changed: 40 additions & 1 deletion
diff --git a/‎videostrip_core/CMakeLists.txt‎
Lines changed: 3 additions & 3 deletions b/‎videostrip_core/CMakeLists.txt‎
Lines changed: 3 additions & 3 deletions
diff --git a/‎videostrip_core/enhance_yaml.cpp‎ ‎videostrip_core/enhance/enhance_yaml.cpp‎videostrip_core/enhance_yaml.cpp renamed to videostrip_core/enhance/enhance_yaml.cpp
Lines changed: 1 addition & 1 deletion b/‎videostrip_core/enhance_yaml.cpp‎ ‎videostrip_core/enhance/enhance_yaml.cpp‎videostrip_core/enhance_yaml.cpp renamed to videostrip_core/enhance/enhance_yaml.cpp
Lines changed: 1 addition & 1 deletion
diff --git a/‎videostrip_core/enhance_yaml.hpp‎ ‎videostrip_core/enhance/enhance_yaml.hpp‎videostrip_core/enhance_yaml.hpp renamed to videostrip_core/enhance/enhance_yaml.hpp
Lines changed: 1 addition & 1 deletion b/‎videostrip_core/enhance_yaml.hpp‎ ‎videostrip_core/enhance/enhance_yaml.hpp‎videostrip_core/enhance_yaml.hpp renamed to videostrip_core/enhance/enhance_yaml.hpp
Lines changed: 1 addition & 1 deletion
@@ -1,5 +1,5 @@
 cmake_minimum_required(VERSION 3.18)
-project(videostrip VERSION 0.8.0 LANGUAGES CXX)
+project(videostrip VERSION 0.8.2 LANGUAGES CXX)
 
 set(CMAKE_CXX_STANDARD 17)
 set(CMAKE_CXX_STANDARD_REQUIRED ON)
 
@@ -21,6 +21,12 @@ processing:
   enable_logging: true
   # overlap_mode: FEATURE  # (optional, harmless for now)
 
+  feature_normalization: grid     # none|grid
+  grid_normalization:
+    cell: [32, 32]
+    max_per_cell: 50
+    score: response               # response|size
+
 enhance:
   enable: true
   sequence:
 
@@ -34,6 +34,58 @@ target_link_libraries(test_core_smoke
     ${OpenCV_LIBS}
 )
 
+# -----------------------------------------------------------------
+# test_enhance_yaml
+# Catch2 executable built from test_enhance_yaml.cpp; links the core
+# library, Catch2's provided main, and yaml-cpp.
+# -----------------------------------------------------------------
+add_executable(test_enhance_yaml ${CMAKE_CURRENT_SOURCE_DIR}/test_enhance_yaml.cpp)
+target_link_libraries(test_enhance_yaml PRIVATE videostrip_core Catch2::Catch2WithMain yaml-cpp)
+target_include_directories(test_enhance_yaml PRIVATE ${TEST_COMMON_INCLUDES})
+# Discovered tests run from the directory that holds the built binary.
+catch_discover_tests(test_enhance_yaml WORKING_DIRECTORY $<TARGET_FILE_DIR:test_enhance_yaml>)
+
+# -----------------------------------------------------------------
+# test_enhance_ops
+# Catch2 executable built from test_enhance_ops.cpp; links the core
+# library, Catch2's provided main, and OpenCV.
+# -----------------------------------------------------------------
+add_executable(test_enhance_ops ${CMAKE_CURRENT_SOURCE_DIR}/test_enhance_ops.cpp)
+target_link_libraries(test_enhance_ops PRIVATE videostrip_core Catch2::Catch2WithMain ${OpenCV_LIBS})
+target_include_directories(test_enhance_ops PRIVATE ${TEST_COMMON_INCLUDES})
+# Discovered tests run from the directory that holds the built binary.
+catch_discover_tests(test_enhance_ops WORKING_DIRECTORY $<TARGET_FILE_DIR:test_enhance_ops>)
+
+# -----------------------------------------------------------------
+# test_enhance_stage
+# Catch2 executable built from test_enhance_stage.cpp; links the core
+# library, Catch2's provided main, and OpenCV.
+# -----------------------------------------------------------------
+add_executable(test_enhance_stage ${CMAKE_CURRENT_SOURCE_DIR}/test_enhance_stage.cpp)
+target_link_libraries(test_enhance_stage PRIVATE videostrip_core Catch2::Catch2WithMain ${OpenCV_LIBS})
+target_include_directories(test_enhance_stage PRIVATE ${TEST_COMMON_INCLUDES})
+# Discovered tests run from the directory that holds the built binary.
+catch_discover_tests(test_enhance_stage WORKING_DIRECTORY $<TARGET_FILE_DIR:test_enhance_stage>)
+
+
 catch_discover_tests(test_core_smoke
   WORKING_DIRECTORY $<TARGET_FILE_DIR:test_core_smoke>
 )
 
@@ -0,0 +1,103 @@
+#include <catch2/catch_test_macros.hpp>
+#include <opencv2/core.hpp>
+// imwrite
+#include <opencv2/imgcodecs.hpp>
+#include <opencv2/imgproc.hpp>
+
+#include <algorithm>
+#include <cmath>
+
+#include <videostrip_core/enhance/image_enhancers.hpp>
+
+using namespace videostrip;
+
+// Builds the 2x2 CV_8UC3 fixture used by the tests below; every channel value
+// is distinct (10, 20, ... 120) so a per-channel mix-up is detectable.
+static cv::Mat toy2x2() {
+    const cv::Vec3b pixels[2][2] = {
+        { cv::Vec3b(10, 20, 30),  cv::Vec3b(40, 50, 60) },
+        { cv::Vec3b(70, 80, 90),  cv::Vec3b(100, 110, 120) },
+    };
+    cv::Mat img(2, 2, CV_8UC3);
+    for (int r = 0; r < 2; ++r) {
+        for (int c = 0; c < 2; ++c) {
+            img.at<cv::Vec3b>(r, c) = pixels[r][c];
+        }
+    }
+    return img;
+}
+
+// Verifies that the ContrastOffset op yields alpha * value + beta, clamped to
+// [0, 255], on every channel of every pixel of the 2x2 fixture.
+TEST_CASE("ContrastOffset exactness", "[enhance][ops]") {
+    // Single source of truth: the same gain/offset configure the enhancer and
+    // drive the reference computation, so the two cannot drift apart.
+    constexpr double kAlpha = 2.0;
+    constexpr double kBeta  = 10.0;
+
+    const cv::Mat input = toy2x2();   // pristine reference, built once
+    cv::Mat m = input.clone();        // working copy handed to apply()
+
+    Enhancer e;
+    e.setSequence({ {EnhanceType::ContrastOffset, ContrastOffsetParams{kAlpha, kBeta}} });
+    REQUIRE(e.apply(m));
+
+    for (int r = 0; r < input.rows; ++r) {
+        for (int c = 0; c < input.cols; ++c) {
+            const cv::Vec3b& in  = input.at<cv::Vec3b>(r, c);
+            const cv::Vec3b& got = m.at<cv::Vec3b>(r, c);
+            for (int k = 0; k < 3; ++k) {
+                // Expected value, saturated to the 8-bit range.
+                const int ref = std::clamp(static_cast<int>(kAlpha * in[k] + kBeta), 0, 255);
+                CHECK(got[k] == ref);
+            }
+        }
+    }
+}
+
+// A uniformly tinted image goes through GrayWorldWB; afterwards adjacent
+// channel means must agree to within 1.5 grey levels.
+TEST_CASE("GrayWorld balances means", "[enhance][ops]") {
+    const cv::Scalar tint(10, 50, 200);              // channel order: B, G, R
+    cv::Mat img(32, 32, CV_8UC3, tint);
+
+    Enhancer enhancer;
+    enhancer.setSequence({ {EnhanceType::GrayWorldWB, GrayWorldParams{}} });
+    REQUIRE(enhancer.apply(img));
+
+    const cv::Scalar avg = cv::mean(img);
+    const double gap_first_second = std::abs(avg[0] - avg[1]);
+    const double gap_second_third = std::abs(avg[1] - avg[2]);
+    CHECK(gap_first_second <= 1.5);
+    CHECK(gap_second_third <= 1.5);
+}
+
+// Gamma op with value 2.0 on a strip of neutral greys: black and white must be
+// fixed points, ordering must be preserved, and mid-grey must come out above 128.
+TEST_CASE("Gamma LUT monotonic and anchors", "[enhance][ops]") {
+    // One-row strip: black, dark grey, mid grey, white.
+    const uchar levels[4] = {0, 64, 128, 255};
+    cv::Mat strip(1, 4, CV_8UC3);
+    for (int c = 0; c < 4; ++c) {
+        strip.at<cv::Vec3b>(0, c) = cv::Vec3b(levels[c], levels[c], levels[c]);
+    }
+
+    Enhancer enhancer;
+    enhancer.setSequence({ {EnhanceType::Gamma, GammaParams{2.0}} });
+    REQUIRE(enhancer.apply(strip));
+
+    const cv::Vec3b out_black = strip.at<cv::Vec3b>(0, 0);
+    const cv::Vec3b out_dark  = strip.at<cv::Vec3b>(0, 1);
+    const cv::Vec3b out_mid   = strip.at<cv::Vec3b>(0, 2);
+    const cv::Vec3b out_white = strip.at<cv::Vec3b>(0, 3);
+
+    CHECK(out_black == cv::Vec3b(0,0,0));          // anchor: 0 stays 0
+    CHECK(out_white == cv::Vec3b(255,255,255));    // anchor: 255 stays 255
+    CHECK(out_dark[0] < out_mid[0]);               // monotonic
+    CHECK(out_mid[0] > 128);                       // mid-grey ends up brighter than its input
+}
+
+// TEST_CASE("CLAHE increases gray stddev", "[enhance][ops]") {
+//     // if we use uniform input image clahe does nothing
+//     // so we use a mid-gray image and check that CLAHE increases contrast
+//     cv::Mat m(64,64,CV_8UC3, cv::Scalar(60,60,60));        // we operate on grayscale percentiles, assuming CLAHE will increase luminance range
+//     // Then set a darker square in the middle (16x16)
+//     for (int r=24; r<40; ++r) {
+//         uchar* row = m.ptr<uchar>(r);
+//         for (int c=24; c<40; ++c) {
+//             row[3*c+0] = 30;
+//             row[3*c+1] = 30;
+//             row[3*c+2] = 30;
+//         }
+//     }
+//     cv::imwrite("clahe_input.png", m);
+//     // lambda with quick histogram estimation of percentiles
+//     auto pctl = [](const cv::Mat& img, double p)->int {
+//         cv::Mat g; cv::cvtColor(img, g, cv::COLOR_BGR2GRAY);
+//         int hist[256] = {0};
+//         for (int r=0; r<g.rows; ++r) {
+//             const uchar* row = g.ptr<uchar>(r);
+//             for (int c=0; c<g.cols; ++c) ++hist[row[c]];
+//         }
+//         const int N = g.rows * g.cols;
+//         const int target = int(std::round(p * N));
+//         int acc = 0;
+//         for (int v=0; v<256; ++v) { acc += hist[v]; if (acc >= target) return v; }
+//         return 255;
+//     };
+
+//     int before_p10 = pctl(m, 0.10);
+//     int before_p90 = pctl(m, 0.90);
+
+//     Enhancer e;
+//     e.setSequence({ {EnhanceType::CLAHE, ClaheParams{2.0, {8,8}, ClaheSpace::YCrCb}} });
+//     REQUIRE(e.apply(m));
+
+//     int after_p10 = pctl(m, 0.10);
+//     int after_p90 = pctl(m, 0.90);
+
+//     cv::imwrite("clahe_output.png", m);
+//     // CLAHE should increase dynamic range in luminance percentiles
+//     CHECK((after_p90 - after_p10) > (before_p90 - before_p10));
+// }
@@ -0,0 +1,32 @@
+#include <catch2/catch_test_macros.hpp>
+#include <opencv2/core.hpp>
+#include <opencv2/imgproc.hpp>
+
+#include <videostrip_core/enhance/pipeline_enhance.hpp>
+#include <videostrip_core/enhance/enhance_yaml.hpp>
+
+using namespace videostrip;
+
+// Feeds a 16-bit single-channel ramp through a configured EnhanceStage and
+// verifies the frame comes back as 8-bit with three channels.
+TEST_CASE("EnhanceStage: converts to 8UC3 and applies sequence", "[enhance][stage]") {
+    // 32x32 CV_16UC1 ramp: pixel (r, c) holds (r*32 + c) % 1024.
+    cv::Mat src16(32, 32, CV_16UC1);
+    for (int r = 0; r < src16.rows; ++r) {
+        uint16_t* row = src16.ptr<uint16_t>(r);
+        for (int c = 0; c < src16.cols; ++c) {
+            row[c] = static_cast<uint16_t>((r * 32 + c) % 1024);
+        }
+    }
+
+    // The stage receives a frame that is deliberately not 8UC3.
+    cv::Mat frame = src16;
+
+    EnhanceConfig cfg;
+    cfg.sequence = {
+        { EnhanceType::GrayWorldWB, GrayWorldParams{} },
+        { EnhanceType::Gamma,       GammaParams{1.2} }
+    };
+    cfg.enable = true;
+
+    std::string err;
+    EnhanceStage stage;
+    REQUIRE(stage.configure(cfg, err));
+    REQUIRE(stage.process(frame));
+
+    // Output contract checked here: 8-bit depth, three channels.
+    CHECK(frame.type() == CV_8UC3);
+    CHECK(frame.channels() == 3);
+}
@@ -0,0 +1,49 @@
+#include <catch2/catch_test_macros.hpp>
+#include <yaml-cpp/yaml.h>
+#include <string>
+
+#include <videostrip_core/enhance/enhance_yaml.hpp>
+
+using namespace videostrip;
+
+// A well-formed `enhance` section listing four ops must parse into an enabled
+// config whose sequence keeps the YAML order.
+TEST_CASE("enhance yaml: valid sequence parses", "[enhance][yaml]") {
+    const char* yaml_text = R"YAML(
+enhance:
+  enable: true
+  sequence:
+    - type: contrast
+      alpha: 1.1
+      beta: -5
+    - type: grayworld
+    - type: gamma
+      value: 1.05
+    - type: clahe
+      clip_limit: 2.0
+      tile_grid: [8, 8]
+      space: YCrCb
+)YAML";
+    std::string err;
+    YAML::Node doc = YAML::Load(yaml_text);
+    const auto parsed = parseEnhanceConfig(doc, err);
+
+    REQUIRE(parsed.has_value());
+    CHECK(parsed->enable == true);
+
+    // Expected op types, in the order they appear in the YAML above.
+    const EnhanceType expected[] = {
+        EnhanceType::ContrastOffset,
+        EnhanceType::GrayWorldWB,
+        EnhanceType::Gamma,
+        EnhanceType::CLAHE,
+    };
+    REQUIRE(parsed->sequence.size() == 4);
+    for (std::size_t i = 0; i < 4; ++i) {
+        CHECK(parsed->sequence[i].type == expected[i]);
+    }
+}
+
+TEST_CASE("enhance yaml: malformed op fails", "[enhance][yaml]") {
+    const char* y = R"YAML(
+enhance:
+  enable: true
+  sequence:
+    - type: i_do_not_exist
+)YAML";
+    YAML::Node root = YAML::Load(y);
+    std::string err;
+    auto cfg = parseEnhanceConfig(root, err);
+    CHECK_FALSE(cfg.has_value());
+    CHECK(err.find("Unknown") != std::string::npos);
+}
@@ -4,7 +4,7 @@
 #include <yaml-cpp/yaml.h>
 
 #include <videostrip_cli/config_loader.hpp>
-#include <videostrip_core/enhance_yaml.hpp>
+#include <videostrip_core/enhance/enhance_yaml.hpp>
 
 namespace fs = std::filesystem;
 
@@ -89,6 +89,38 @@ bool load_yaml_config(const std::string& yaml_path,
                 // e.g., out.overlap_mode = v.as<std::string>();
                 // Ignored if not present in struct.
             }
+
+            // Feature normalization settings, see #23
+            // -----------------------------
+            using videostrip::FeatureNormalizationMode;
+            using videostrip::GridNormalizationParams;
+
+            // Lower-cases a string in place. Each character is routed through
+            // unsigned char because handing tolower a negative char value
+            // (any non-ASCII byte where char is signed) is undefined behaviour.
+            const auto lower_in_place = [](std::string& text) {
+                std::transform(text.begin(), text.end(), text.begin(),
+                               [](unsigned char ch) { return static_cast<char>(::tolower(ch)); });
+            };
+
+            // mode: none|grid -- "grid" (any letter case) selects Grid; every
+            // other scalar value falls back to None.
+            if (auto v = n["feature_normalization"]; v && v.IsScalar()) {
+                std::string s = v.as<std::string>();
+                lower_in_place(s);
+                out.feature_normalization.mode =
+                    (s == "grid") ? FeatureNormalizationMode::Grid
+                                  : FeatureNormalizationMode::None;
+            }
+            // grid_normalization: { cell:[w,h], max_per_cell:int, score:response|size }
+            if (auto gn = n["grid_normalization"]; gn && gn.IsMap()) {
+                // cell is honoured only when it is a two-element sequence; each
+                // dimension is forced to be at least 1.
+                if (auto cell = gn["cell"]; cell && cell.IsSequence() && cell.size() == 2) {
+                    out.feature_normalization.grid.cell_w = std::max(1, cell[0].as<int>(32));
+                    out.feature_normalization.grid.cell_h = std::max(1, cell[1].as<int>(32));
+                }
+                // max_per_cell is likewise forced to be at least 1.
+                if (auto mpc = gn["max_per_cell"]; mpc && mpc.IsScalar()) {
+                    out.feature_normalization.grid.max_per_cell = std::max(1, mpc.as<int>(50));
+                }
+                // score: "size" (any letter case) selects Size; anything else is Response.
+                if (auto sc = gn["score"]; sc && sc.IsScalar()) {
+                    std::string ss = sc.as<std::string>();
+                    lower_in_place(ss);
+                    out.feature_normalization.grid.score =
+                        (ss == "size")
+                        ? GridNormalizationParams::Score::Size
+                        : GridNormalizationParams::Score::Response; // default
+                }
+            }
+
         }
 
         // Normalize outputs (relative -> base_dir)
@@ -193,6 +225,13 @@ void merge_yaml_into(ExtractorConfig& dst, const ExtractorConfig& y)
     dst.enable_logging     = y.enable_logging;
     dst.enhance            = y.enhance;
 
+    // Feature normalization: the mode and the grid parameters are always
+    // copied from the YAML config, overwriting whatever dst held. No check is
+    // made for whether the YAML actually set them.
+
+    dst.feature_normalization.mode = y.feature_normalization.mode;
+    dst.feature_normalization.grid = y.feature_normalization.grid;
+
     // Optional future field:
     // if (!y.overlap_mode.empty()) dst.overlap_mode = y.overlap_mode;
 }
 
@@ -5,9 +5,9 @@ message(STATUS "*******************")
 
 add_library(videostrip_core STATIC
     videostrip_core.cpp
-    image_enhancers.cpp
-    enhance_yaml.cpp
-    pipeline_enhance.cpp
+    enhance/image_enhancers.cpp
+    enhance/enhance_yaml.cpp
+    enhance/pipeline_enhance.cpp
     feature/feature_extractor.cpp
     keyframe/keyframe_selector.cpp
     io/metadata_writer.cpp
 
@@ -1,5 +1,5 @@
 #include <algorithm>
-#include <videostrip_core/enhance_yaml.hpp>
+#include <videostrip_core/enhance/enhance_yaml.hpp>
 
 namespace videostrip {
 
 
@@ -3,7 +3,7 @@
 #include <optional>
 #include <string>
 
-#include <videostrip_core/image_enhancers.hpp>
+#include <videostrip_core/enhance/image_enhancers.hpp>
 
 namespace videostrip {