|
| 1 | +import numpy as np |
| 2 | +import time |
| 3 | +import os |
| 4 | +import gc |
| 5 | + |
| 6 | +from tools21cm import topology |
| 7 | + |
def create_test_data(box_dim=128, seed=None):
    """Create a 3D binary test cube: a solid central cube plus sparse noise.

    Parameters
    ----------
    box_dim : int, optional
        Edge length of the cubic grid (default 128).
    seed : int or None, optional
        Seed for the random noise. ``None`` (default) keeps the original
        non-reproducible behaviour; pass an int for repeatable data.

    Returns
    -------
    numpy.ndarray
        ``(box_dim, box_dim, box_dim)`` int32 array of 0s and 1s.
    """
    print(f"Generating a {box_dim}x{box_dim}x{box_dim} test data cube...")
    arr = np.zeros((box_dim, box_dim, box_dim), dtype=np.int32)

    # A solid core: a cube of side box_dim//4 centred in the grid.
    size = box_dim // 4
    start = box_dim // 2 - size // 2
    end = start + size
    arr[start:end, start:end, start:end] = 1

    # Sparse random noise (~0.5% of cells) to make the topology less trivial.
    # Original drew ints in [0, 200) and kept values > 198, i.e. p = 1/200.
    rng = np.random.default_rng(seed)
    noise = rng.integers(0, 200, size=arr.shape)
    arr[noise > 198] = 1
    print(f"Test data generated with {arr.sum()} active cells.\n")
    return arr
| 24 | + |
| 25 | +if __name__ == "__main__": |
| 26 | + # --- Setup --- |
| 27 | + BOX_DIM = 32 #128 |
| 28 | + test_data = create_test_data(BOX_DIM) |
| 29 | + timings = {} |
| 30 | + |
| 31 | + # Define the backends to test |
| 32 | + backends_to_test = ['python', 'numba', 'cython', 'torch'] |
| 33 | + chi_results = {} |
| 34 | + for backend in backends_to_test: |
| 35 | + print(f"--- Benchmarking '{backend}' Backend ---") |
| 36 | + |
| 37 | + # Check if the backend is available |
| 38 | + available = False |
| 39 | + if backend == 'python': available = True |
| 40 | + elif backend == 'numba' and topology.VB.numba_available: available = True |
| 41 | + elif backend == 'cython' and topology.VB.cython_available: available = True |
| 42 | + elif backend == 'torch' and topology.VB.torch_available: available = True |
| 43 | + |
| 44 | + if not available: |
| 45 | + print(f" Backend not available. Skipping.\n") |
| 46 | + continue |
| 47 | + |
| 48 | + # For parallel Cython, set thread count to max |
| 49 | + if backend == 'cython': |
| 50 | + n_threads = os.cpu_count() |
| 51 | + os.environ['OMP_NUM_THREADS'] = str(n_threads) |
| 52 | + print(f" (Using {n_threads} threads for Cython/OpenMP)") |
| 53 | + |
| 54 | + # Perform a warm-up run for JIT or GPU backends |
| 55 | + if backend in ['numba', 'torch']: |
| 56 | + print(" (Warm-up run...)") |
| 57 | + topology.EulerCharacteristic(test_data, speed_up=backend, verbose=False) |
| 58 | + |
| 59 | + # Run the actual benchmark |
| 60 | + print(" (Benchmarking run...)") |
| 61 | + t_start = time.time() |
| 62 | + chi_value = topology.EulerCharacteristic(test_data, speed_up=backend, verbose=True) |
| 63 | + t_end = time.time() |
| 64 | + |
| 65 | + duration = t_end - t_start |
| 66 | + timings[backend] = duration |
| 67 | + |
| 68 | + print(f" Result Chi = {chi_value}, Time = {duration:.4f} seconds\n") |
| 69 | + chi_results[backend] = chi_value |
| 70 | + gc.collect() |
| 71 | + |
| 72 | + # Clean up environment variable |
| 73 | + if 'OMP_NUM_THREADS' in os.environ: |
| 74 | + del os.environ['OMP_NUM_THREADS'] |
| 75 | + |
| 76 | + # --- Final Summary --- |
| 77 | + print("="*65) |
| 78 | + print(" Backend Benchmark Summary") |
| 79 | + print("="*65) |
| 80 | + if timings: |
| 81 | + sorted_results = sorted(timings.items(), key=lambda item: item[1]) |
| 82 | + baseline_time = timings.get('python', 1e-9) |
| 83 | + |
| 84 | + # Add the 'Chi Value' column to the header |
| 85 | + print(f"{'Implementation':<20} | {'Chi Value':<12} | {'Time (s)':<15} | {'Speedup'}") |
| 86 | + print("-"*65) |
| 87 | + |
| 88 | + for name, t in sorted_results: |
| 89 | + chi_val = chi_results.get(name, 'N/A') |
| 90 | + speedup = baseline_time / t |
| 91 | + print(f"{name:<20} | {chi_val:<12.0f} | {t:<15.4f} | {speedup:.2f}x") |
| 92 | + else: |
| 93 | + print("No backends were benchmarked.") |
0 commit comments