Addressed PR feedback: add short docstrings to mlp.py, raise an error when shifter and perspective (MLP) are used together

nathanpaul.soeding · nathanpaul.soeding · commit 3f56f53dfee6 · 2025-10-03T11:23:44.000+02:00
diff --git a/neuralpredictors/layers/encoders/firing_rate.py b/neuralpredictors/layers/encoders/firing_rate.py
@@ -68,8 +68,12 @@ def forward(
         x = inputs
 
         if self.perspective:
+            if self.shifter:
+                raise ValueError("both perspective and shifter cannot be present together, only one should be chosen")
+            
             if pupil_center is None:
                 raise ValueError("pupil_center is not given")
+            
             x = self.perspective[data_key](x, pupil_center)
 
         x = self.core(x)
diff --git a/neuralpredictors/layers/perspective/mlp.py b/neuralpredictors/layers/perspective/mlp.py
@@ -1,8 +1,22 @@
+'''
+Code adapted from the implementation accompanying Wang et al. (2025), "Foundation model of neural activity predicts response to new stimulus types".
+Specifically:
+* https://github.com/cajal/fnn/blob/main/fnn/model/pixels.py
+* https://github.com/cajal/fnn/blob/main/fnn/model/perspectives.py
+'''
 import torch
 from torch import nn
 
-
 def angles_to_rmat3d(angles):
+    """
+    Convert batches of Euler angles (x, y, z) to 3D rotation matrices.
+
+    Args:
+        angles (torch.Tensor): Tensor of shape (N, 3), angles in radians.
+
+    Returns:
+        torch.Tensor: Tensor of shape (N, 3, 3), rotation matrices (Rz * Ry * Rx).
+    """
     x, y, z = torch.unbind(angles, axis=-1)
     N = len(x)
 
@@ -38,6 +52,9 @@ def angles_to_rmat3d(angles):
 
 
 class PixelTransform(nn.Module):
+    """
+    Nonlinear pixel intensity transform with learnable power, scale, and offset.
+    """
     def __init__(self, max_power=1, init_scale=1, init_offset=0, eps=1e-5):
         super().__init__()
 
@@ -54,21 +71,23 @@ def power(self):
 
     def forward(self, pixels):
         return pixels.add(self.eps).pow(self.power).mul(self.scale).add(self.offset)
-
-
-class Scale(nn.Module):
-    def __init__(self, gamma):
-        super().__init__()
-        self.gamma = gamma
-
-    def forward(self, x):
-        return x * self.gamma
-
+    
 
 class Retina(nn.Module):
+    """
+    Models a retina that maps pupil centers to 3D rays via an MLP.
+
+    Args:
+        degree (float): Field of view in degrees.
+        height, width (int): Retina grid resolution.
+        dim_in, dim_out (int): Input/output dimensions for MLP.
+        mlp_features (int): Hidden feature size.
+        mlp_layers (int): Number of MLP layers.
+        max_angle (float): Maximum rotation angle in degrees.
+    """
     def __init__(
         self,
-        degree=75,
+        degree=50,
         height=36,
         width=64,
         dim_in=2,
@@ -148,6 +167,11 @@ def rays(self, pupil_center):
 
 
 class Monitor(nn.Module):
+    """
+    Models a monitor in 3D space with optimizable position and orientation.
+
+    Provides projection of retinal rays onto the monitor plane and sampling of images.
+    """
     def __init__(
         self,
         init_center_x=0,
@@ -235,6 +259,9 @@ def sample_screen(self, img, grid):
 
 
 class SinglePerspective(nn.Module):
+    """
+    Combines Retina, Monitor, and PixelTransform to generate a single visual perspective.
+    """
     def __init__(self, retina, monitor, pixel_transform, static_power=1.7):
         super().__init__()
 
@@ -263,6 +290,9 @@ def forward(self, img, pupil_center):
 
 
 class Perspective(nn.ModuleDict):
+    """
+    Container for multiple SinglePerspective modules keyed by dataset identifiers.
+    """
     def __init__(self, data_keys, retina_degree=75, mlp_features=16, mlp_layers=3):
         super().__init__()