Skip to content

Commit 65e0b48

Browse files
authored
Merge pull request #104 from 3DOM-FBK/dev
Main changes: solved a bug causing unstable results for LoFTR and SE2-LoFTR on Linux, introduced rasterio for managing wide image formats, and added geometric verification for each tile-pair matching
2 parents 124df23 + b507976 commit 65e0b48

File tree

14 files changed

+316
-58
lines changed

14 files changed

+316
-58
lines changed

assets/example_cyprus/cameras.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -11,7 +11,7 @@ cam0: # This camera is used for the image rotated by 90 degrees. You need to def
1111
intrinsics: [
1212
1200, 1200, 500, 750
1313
]
14-
images : "DSC_6471.JPG"
14+
images : "*.JPG"
1515

1616

1717
# cam1: # This camera is used for the image rotated by 180 degrees. This is not necessary, you can use the same camera model as the general one.

config/cameras.yaml

Lines changed: 17 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,20 @@
11
general:
22
camera_model: "simple-radial" # ["simple-pinhole", "pinhole", "simple-radial", "opencv"]
33
openmvg_camera_model: "pinhole_radial_k3" # ["pinhole", "pinhole_radial_k3", "pinhole_brown_t2"]
4-
single_camera: True
5-
intrinsics: ~ # None
4+
single_camera: False
5+
intrinsics: ~ # None
6+
7+
cam0:
8+
camera_model: "pinhole"
9+
intrinsics: [
10+
1200, 1200, 500, 750
11+
]
12+
images : "*.JPG"
13+
14+
15+
cam1:
16+
camera_model: "pinhole"
17+
intrinsics: [
18+
1200, 1200, 750, 500
19+
]
20+
images : "DSC_6468.JPG,DSC_6469.JPG"

config/rotations.txt

Lines changed: 10 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,10 @@
1+
DSC_6466.JPG 0
2+
DSC_6467.JPG 0
3+
DSC_6468.JPG 180
4+
DSC_6469.JPG 0
5+
DSC_6470.JPG 0
6+
DSC_6471.JPG 90
7+
DSC_6472.JPG 0
8+
DSC_6473.JPG 0
9+
DSC_6474.JPG 0
10+
DSC_6475.JPG 0

demo.py

Lines changed: 9 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -14,13 +14,18 @@
1414
# Define the configuration parameters
1515
args = {
1616
"dir": "./assets/example_cyprus",
17-
"pipeline": "superpoint+lightglue",
18-
"strategy": "bruteforce",
19-
"quality": "medium",
20-
"tiling": "none",
17+
"pipeline": "superpoint+lightglue", # ["superpoint+lightglue", "superpoint+lightglue_fast", "superpoint+superglue", "superpoint+kornia_matcher", "disk+lightglue", "aliked+lightglue", "orb+kornia_matcher", "sift+kornia_matcher", "loftr", "se2loftr", "roma", "srif", "keynetaffnethardnet+kornia_matcher", "dedode+kornia_matcher"]
18+
"strategy": "bruteforce", # ["matching_lowres", "bruteforce", "sequential", "retrieval", "custom_pairs", "covisibility"]
19+
"quality": "medium", # ["lowest", "low", "medium", "high", "highest"]
20+
"tiling": "none", # ["none", "preselection", "grid", "exhaustive"]
2121
"camera_options": "./assets/example_cyprus/cameras.yaml",
2222
"openmvg": None,
2323
"force": True, # Remove existing features and matches
24+
"skip_reconstruction": False,
25+
"graph": True,
26+
#"upright": "custom", # ["custom", "2clusters", "exif"] With "custom" option, rotations must be specified in ./config/rotations.txt
27+
#"config_file": "./config_superpoint_lightglue.yaml", # Path to custom config file (YAML format) for matcher
28+
"verbose": False,
2429
}
2530

2631
# Alternatively, you can parse the parameters from the command line with

pyproject.toml

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -27,6 +27,7 @@ dependencies = [
2727
"torch",
2828
"torchvision",
2929
"pillow",
30+
"rasterio",
3031
"opencv-python",
3132
"opencv-contrib-python",
3233
"pydegensac==0.1.3; platform_system=='Windows' and platform_machine=='i386'",

scripts/resize_images.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -11,7 +11,7 @@ def resize_images(input_folder, output_folder, new_resolution):
1111

1212
# Loop through all files in the input folder
1313
for filename in os.listdir(input_folder):
14-
if filename.endswith((".jpg", ".jpeg", ".png", ".gif", ".tif")):
14+
if filename.endswith((".jpg", ".JPG", ".jpeg", ".JPEG", ".png", ".PNG", ".gif", ".GIF", ".tif", ".TIF", ".tiff", ".TIFF")):
1515
input_path = os.path.join(input_folder, filename)
1616
output_path = os.path.join(output_folder, filename)
1717

scripts/show_matches.py

Lines changed: 144 additions & 18 deletions
Original file line numberDiff line numberDiff line change
@@ -5,6 +5,7 @@
55

66
import cv2
77
import numpy as np
8+
import rasterio
89

910
from deep_image_matching.utils.database import (
1011
COLMAPDatabase,
@@ -151,7 +152,7 @@ def ShowColmapMatches(self, plot_config: dict):
151152
img1_path,
152153
keypoints0,
153154
keypoints1,
154-
self.two_views_matches[(id0, id1)],
155+
self.matches[(id0, id1)], #"self.two_views_matches[(id0, id1)]," or "self.matches[(id0, id1)],"
155156
plot_config,
156157
)
157158

@@ -169,13 +170,90 @@ def GeneratePlot(
169170
thickness = plot_config["thickness"]
170171
space_between_images = plot_config["space_between_images"]
171172

172-
# Load images
173-
img0 = cv2.imread(str(img0_path))
174-
img1 = cv2.imread(str(img1_path))
175-
176-
# Convert keypoints to integers
177-
kpts0_int = np.round(kpts0).astype(int)
178-
kpts1_int = np.round(kpts1).astype(int)
173+
# Load images using rasterio
174+
def load_image_with_rasterio(img_path):
175+
with rasterio.open(str(img_path)) as src:
176+
img_data = src.read()
177+
# Convert from (bands, rows, cols) to (rows, cols, bands)
178+
img = np.transpose(img_data, (1, 2, 0))
179+
180+
# Handle different number of bands
181+
if img.shape[2] == 1:
182+
# Single band - convert to 3-channel grayscale
183+
img = np.repeat(img, 3, axis=2)
184+
elif img.shape[2] > 3:
185+
# More than 3 bands - take first 3 (typically RGB)
186+
img = img[:, :, :3]
187+
188+
# Convert to uint8 if needed
189+
if img.dtype != np.uint8:
190+
# Normalize to 0-255 range if values are in different range
191+
if img.max() <= 1.0:
192+
img = (img * 255).astype(np.uint8)
193+
else:
194+
img = np.clip(img, 0, 255).astype(np.uint8)
195+
196+
## Convert RGB to BGR for OpenCV compatibility (if 3 channels)
197+
#if img.shape[2] == 3:
198+
# img = cv2.cvtColor(img, cv2.COLOR_RGB2BGR)
199+
200+
return img
201+
202+
img0 = load_image_with_rasterio(img0_path)
203+
img1 = load_image_with_rasterio(img1_path)
204+
205+
# Check if images are too large and resize if necessary
206+
max_dimension = plot_config.get("max_dimension", 4000) # Maximum dimension for visualization
207+
scale_factor0 = 1.0
208+
scale_factor1 = 1.0
209+
210+
# Calculate scale factors for each image
211+
if max(img0.shape[:2]) > max_dimension:
212+
scale_factor0 = max_dimension / max(img0.shape[:2])
213+
new_size0 = (int(img0.shape[1] * scale_factor0), int(img0.shape[0] * scale_factor0))
214+
img0 = cv2.resize(img0, new_size0, interpolation=cv2.INTER_AREA)
215+
print(f"Resized img0 by factor {scale_factor0:.3f} to {img0.shape[1]}x{img0.shape[0]}")
216+
217+
if max(img1.shape[:2]) > max_dimension:
218+
scale_factor1 = max_dimension / max(img1.shape[:2])
219+
new_size1 = (int(img1.shape[1] * scale_factor1), int(img1.shape[0] * scale_factor1))
220+
img1 = cv2.resize(img1, new_size1, interpolation=cv2.INTER_AREA)
221+
print(f"Resized img1 by factor {scale_factor1:.3f} to {img1.shape[1]}x{img1.shape[0]}")
222+
223+
# Scale keypoints to match resized images
224+
kpts0_scaled = kpts0 * scale_factor0
225+
kpts1_scaled = kpts1 * scale_factor1
226+
227+
# Filter out invalid keypoints (NaN, inf) and convert to integers
228+
valid_mask0 = np.isfinite(kpts0_scaled).all(axis=1)
229+
valid_mask1 = np.isfinite(kpts1_scaled).all(axis=1)
230+
231+
kpts0_valid = kpts0_scaled[valid_mask0]
232+
kpts1_valid = kpts1_scaled[valid_mask1]
233+
234+
kpts0_int = np.round(kpts0_valid).astype(int)
235+
kpts1_int = np.round(kpts1_valid).astype(int)
236+
237+
print(f"Valid keypoints - Img0: {len(kpts0_int)}/{len(kpts0)}, Img1: {len(kpts1_int)}/{len(kpts1)}")
238+
239+
# Calculate final visualization size and check memory requirements
240+
final_height = max(img0.shape[0], img1.shape[0])
241+
final_width = img0.shape[1] + img1.shape[1] + space_between_images
242+
estimated_memory_gb = (final_height * final_width * 3) / (1024**3)
243+
244+
print(f"Final visualization size: {final_width}x{final_height} ({estimated_memory_gb:.2f} GB)")
245+
246+
if estimated_memory_gb > 8.0: # If still too large after resizing
247+
print("Warning: Visualization still requires significant memory. Consider using smaller max_dimension.")
248+
additional_scale = min(1.0, 8.0 / estimated_memory_gb)
249+
if additional_scale < 1.0:
250+
new_size0 = (int(img0.shape[1] * additional_scale), int(img0.shape[0] * additional_scale))
251+
new_size1 = (int(img1.shape[1] * additional_scale), int(img1.shape[0] * additional_scale))
252+
img0 = cv2.resize(img0, new_size0, interpolation=cv2.INTER_AREA)
253+
img1 = cv2.resize(img1, new_size1, interpolation=cv2.INTER_AREA)
254+
kpts0_int = np.round(kpts0_int * additional_scale).astype(int)
255+
kpts1_int = np.round(kpts1_int * additional_scale).astype(int)
256+
print(f"Applied additional scaling factor {additional_scale:.3f}")
179257

180258
# Create a new image to draw matches
181259
img_matches = np.zeros(
@@ -193,19 +271,58 @@ def GeneratePlot(
193271
] = (255, 255, 255)
194272

195273
if show_keypoints:
196-
# Show keypoints
274+
# Show valid keypoints within image bounds
197275
for kpt in kpts0_int:
198-
kpt = tuple(kpt)
199-
cv2.circle(img_matches, kpt, radius, (0, 0, 255), thickness)
276+
if 0 <= kpt[0] < img0.shape[1] and 0 <= kpt[1] < img0.shape[0]:
277+
kpt_tuple = tuple(kpt)
278+
cv2.circle(img_matches, kpt_tuple, radius, (0, 0, 255), thickness)
200279

201280
for kpt in kpts1_int:
202-
kpt = tuple(kpt + np.array([img0.shape[1], 0]))
203-
cv2.circle(img_matches, kpt, radius, (0, 0, 255), thickness)
204-
205-
# Draw lines and circles for matches
281+
kpt_shifted = kpt + np.array([img0.shape[1] + space_between_images, 0])
282+
if (0 <= kpt[0] < img1.shape[1] and 0 <= kpt[1] < img1.shape[0] and
283+
0 <= kpt_shifted[0] < img_matches.shape[1] and 0 <= kpt_shifted[1] < img_matches.shape[0]):
284+
kpt_tuple = tuple(kpt_shifted)
285+
cv2.circle(img_matches, kpt_tuple, radius, (0, 0, 255), thickness)
286+
287+
# Filter matches to only include those with valid keypoints and within image bounds
288+
valid_matches = []
289+
290+
# Create mapping from original indices to filtered indices
291+
valid_idx0_map = {}
292+
valid_idx1_map = {}
293+
294+
for i, is_valid in enumerate(valid_mask0):
295+
if is_valid:
296+
valid_idx0_map[i] = len(valid_idx0_map)
297+
298+
for i, is_valid in enumerate(valid_mask1):
299+
if is_valid:
300+
valid_idx1_map[i] = len(valid_idx1_map)
301+
206302
for match in matches:
207-
pt1 = tuple(kpts0_int[match[0]])
208-
pt2 = tuple(np.array(kpts1_int[match[1]]) + np.array([img0.shape[1], 0]))
303+
orig_idx0, orig_idx1 = match[0], match[1]
304+
305+
# Check if both original indices had valid keypoints
306+
if orig_idx0 in valid_idx0_map and orig_idx1 in valid_idx1_map:
307+
new_idx0 = valid_idx0_map[orig_idx0]
308+
new_idx1 = valid_idx1_map[orig_idx1]
309+
310+
# Check if indices are within filtered arrays
311+
if new_idx0 < len(kpts0_int) and new_idx1 < len(kpts1_int):
312+
kpt0 = kpts0_int[new_idx0]
313+
kpt1 = kpts1_int[new_idx1]
314+
315+
# Check if keypoints are within image bounds
316+
if (0 <= kpt0[0] < img0.shape[1] and 0 <= kpt0[1] < img0.shape[0] and
317+
0 <= kpt1[0] < img1.shape[1] and 0 <= kpt1[1] < img1.shape[0]):
318+
valid_matches.append((new_idx0, new_idx1))
319+
320+
print(f"Valid matches: {len(valid_matches)}/{len(matches)}")
321+
322+
# Draw lines and circles for valid matches
323+
for idx0, idx1 in valid_matches:
324+
pt1 = tuple(kpts0_int[idx0])
325+
pt2 = tuple(kpts1_int[idx1] + np.array([img0.shape[1] + space_between_images, 0]))
209326

210327
# Draw a line connecting the keypoints
211328
cv2.line(img_matches, pt1, pt2, (0, 255, 0), thickness)
@@ -274,20 +391,29 @@ def parse_args():
274391
required=False,
275392
default=1500,
276393
)
394+
parser.add_argument(
395+
"--max_dimension",
396+
type=int,
397+
help="Maximum dimension (width or height) for individual images before visualization",
398+
required=False,
399+
default=4000,
400+
)
277401
args = parser.parse_args()
278402

279403
return args
280404

281405

282406
def main():
407+
args = parse_args()
408+
283409
plot_config = {
284410
"show_keypoints": True,
285411
"radius": 5,
286412
"thickness": 2,
287413
"space_between_images": 0,
414+
"max_dimension": args.max_dimension,
288415
}
289416

290-
args = parse_args()
291417
database_path = Path(args.database)
292418
out_dir = Path(args.output)
293419
imgs_dir = Path(args.imgsdir)

src/deep_image_matching/config.py

Lines changed: 5 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -62,15 +62,18 @@
6262
# Overlap between tiles in pixels
6363
"tile_overlap": 10,
6464
# Size of the low resolution tiles used for the tile preselection
65-
"tile_preselection_size": 1000,
65+
"tile_preselection_size": 2000,
6666
# Minimum number of matches per tile
6767
"min_matches_per_tile": 10,
68+
# Use geometric verification for each tile pair (if tiling is used)
69+
"geometric_verification_per_tile": True,
70+
"gv_threshold_in_tiles_matching": 4,
6871
# Geometric verification method and parameters:
6972
# GeometricVerification.NONE (no geometric verification),
7073
# GeometricVerification.PYDEGENSAC (use pydegensac),
7174
# GeometricVerification.MAGSAC (use opencv MAGSAC),
7275
# Other methods: RANSAC, LMEDS, RHO, USAC_DEFAULT, USAC_PARALLEL, USAC_FM_8PTS, USAC_FAST, USAC_ACCURATE, USAC_PROSAC, USAC_MAGSAC
73-
"geom_verification": GeometricVerification.PYDEGENSAC,
76+
"geom_verification": GeometricVerification.MAGSAC,
7477
"gv_threshold": 4,
7578
"gv_confidence": 0.99999,
7679
# Minimum number of inlier matches and minimum inlier ratio per pair

0 commit comments

Comments
 (0)