Patched some test/synapse/neuron components; added a sketch of the Bernoulli mixture model (BMM) density estimator

Alexander Ororbia · Alexander Ororbia · commit 4606a1c3375a · 2025-11-22T13:12:13.000-05:00
diff --git a/ngclearn/utils/density/__init__.py b/ngclearn/utils/density/__init__.py
@@ -1,2 +1,4 @@
 ## point to supported density estimator models
-from .gmm import GMM
+from .gmm import GMM ## Gaussian mixture 
+from .bmm import BMM ## Bernoulli mixture
+
diff --git a/ngclearn/utils/density/bmm.py b/ngclearn/utils/density/bmm.py
@@ -0,0 +1,206 @@
+from jax import numpy as jnp, random, jit, scipy
+from functools import partial
+import time, sys
+import numpy as np
+
+########################################################################################################################
+## internal routines for mixture model
+########################################################################################################################
+
+@jit
+def _log_bernoulli_pdf(X, p):
+    """
+    Calculates the multivariate Bernoulli log likelihood of a design matrix/dataset `X`, under a given parameter
+    probability `p`.
+
+    Args:
+        X: a design matrix (dataset) to compute the log likelihood of
+
+        p: a parameter (row) vector of per-dimension Bernoulli probabilities
+
+    Returns:
+        a column vector holding the log likelihood of each row (data point) of X
+    """
+    eps = 1e-7 ## clip bound keeping log() finite when a probability saturates at exactly 0 or 1
+    _p = jnp.clip(p, eps, 1. - eps)
+    vec_ll = X * jnp.log(_p) + (1. - X) * jnp.log(1. - _p) ## binary cross-entropy (log Bernoulli)
+    log_ll = jnp.sum(vec_ll, axis=1, keepdims=True) ## get per-datapoint LL
+    return log_ll
+
+@jit
+def _calc_bernoulli_pdf_vals(X, p):
+    ## returns the per-datapoint log-likelihood alongside its exponentiated (likelihood) form
+    log_probs = _log_bernoulli_pdf(X, p)
+    return log_probs, jnp.exp(log_probs)
+
+@jit
+def _calc_priors_and_means(X, weights, pi): ## M-step co-routine
+    ## derives responsibilities from prior-scaled weights, then re-estimates priors and component means
+    n_rows = X.shape[0]  ## sample count
+    ## normalize the prior-weighted likelihoods across components (per data point)
+    scaled = pi * weights
+    resp = scaled / jnp.sum(scaled, axis=1, keepdims=True) ## responsibilities
+    mass = jnp.sum(resp, axis=0, keepdims=True) ## total responsibility claimed by each component
+    new_pi = mass / n_rows ## updated priors
+    new_means = jnp.matmul(resp.T, X) / mass.T ## responsibility-weighted means
+    return new_means, new_pi, resp
+
+@partial(jit, static_argnums=[1])
+def _sample_prior_weights(dkey, n_samples, pi): ## draws component indices/latents from the mixture prior
+    ## the categorical sampler is fed log-probabilities as its logits
+    prior_logits = jnp.log(pi)
+    return random.categorical(dkey, logits=prior_logits, shape=(n_samples, 1))
+
+@partial(jit, static_argnums=[1])
+def _sample_component(dkey, n_samples, mu): ## samples a component (of mixture); mu holds its (1 x D) probabilities
+    x_s = random.bernoulli(dkey, p=mu, shape=(n_samples, mu.shape[1])) ## draw (boolean) Bernoulli samples
+    return x_s
+
+########################################################################################################################
+
+class BMM: ## Bernoulli mixture model (mixture-of-Bernoullis)
+    """
+    Implements a Bernoulli mixture model (BMM) -- or mixture of Bernoullis (MoB).
+    Adaptation of parameters is conducted via the Expectation-Maximization (EM)
+    learning algorithm; each component is a multivariate Bernoulli distribution
+    with independent dimensions, parameterized by a single vector of probabilities.
+
+    Note that fitting and sampling are implemented directly with JAX array routines
+    (no external estimator is wrapped).
+
+    Args:
+        K: the number of components/latent variables within this BMM
+
+        max_iter: the maximum number of EM iterations to fit parameters to data (Default = 50)
+
+        init_kmeans: <Unsupported>
+
+        key: PRNG key used for initialization/sampling; a clock-seeded key is created if None (Default = None)
+    """
+
+    def __init__(self, K, max_iter=50, init_kmeans=False, key=None):
+        self.K = K
+        self.max_iter = int(max_iter)
+        self.init_kmeans = init_kmeans ## Unsupported currently
+        self.mu = [] ## component mean parameters (one row vector per component, created by `init`)
+        self.pi = None ## prior weight parameters (created by `init`)
+        ## fall back to a clock-derived seed when the caller does not supply a PRNG key
+        self.key = random.PRNGKey(time.time_ns()) if key is None else key
+
+    def init(self, X):
+        """
+        Initializes this BMM in accordance to a supplied design matrix.
+
+        Args:
+            X: the design matrix to initialize this BMM to (only its number of columns is used)
+
+        """
+        dim = X.shape[1]
+        self.key, *skey = random.split(self.key, 3)
+        self.pi = jnp.ones((1, self.K)) / (self.K * 1.)
+        ## draw distinct random means per component; identical starting means would receive identical
+        ## responsibilities at every EM step, so the components could never separate
+        mu0 = random.uniform(skey[0], (self.K, dim), minval=0.25, maxval=0.75)
+        self.mu = [mu0[j:j + 1, :] for j in range(self.K)] ## rebuilt (not appended) so re-init is safe
+
+    def calc_log_likelihood(self, X):
+        """
+        Calculates the multivariate Bernoulli log likelihood of a design matrix/dataset `X`, under the current
+        parameters of this Bernoulli mixture.
+
+        Args:
+            X: the design matrix to estimate log likelihood values over under this BMM
+
+        Returns:
+            (column) vector of individual log likelihoods, scalar for the complete log likelihood p(X)
+        """
+        ## log p(x_n) = logsumexp_k( log pi_k + log p(x_n | mu_k) ); combining in log-space avoids underflow
+        log_pi = jnp.log(self.pi) ## (1 x K) log-priors
+        log_joint = jnp.concat([_log_bernoulli_pdf(X, self.mu[j]) for j in range(self.K)], axis=1) + log_pi
+        log_ll = scipy.special.logsumexp(log_joint, axis=1, keepdims=True) ## vector of individual log p(x_n) values
+        complete_ll = jnp.sum(log_ll) ## complete log-likelihood for design matrix X, i.e., log p(X)
+        return log_ll, complete_ll
+
+    def _E_step(self, X): ## Expectation (E) step, co-routine
+        log_w = jnp.concat([_log_bernoulli_pdf(X, self.mu[j]) for j in range(self.K)], axis=1)
+        ## rescale each row by its largest likelihood before exponentiating; responsibilities are
+        ## normalized per row downstream, so they are unchanged, but high-dimensional rows no longer
+        ## underflow to all-zero weights (which would yield 0/0 responsibilities)
+        weights = jnp.exp(log_w - jnp.max(log_w, axis=1, keepdims=True))
+        return weights ## data-dependent weights (intermediate responsibilities)
+
+    def _M_step(self, X, weights): ## Maximization (M) step, co-routine
+        means, pi, r = _calc_priors_and_means(X, weights, self.pi)
+        self.pi = pi ## store new prior parameters
+        ## store each row of the updated mean matrix as its own (1 x D) component parameter
+        self.mu = [means[j:j + 1, :] for j in range(self.K)]
+        return means, r
+
+    def fit(self, X, tol=1e-3, verbose=False):
+        """
+        Run full fitting process of this BMM; if parameters have not been created via `init`,
+        they are first initialized from `X`.
+
+        Args:
+            X: the dataset to fit this BMM to
+
+            tol: the tolerance value for detecting convergence (via difference-of-means); will engage in early-stopping
+                if tol >= 0. (Default: 1e-3)
+
+            verbose: if True, this function will print out per-iteration measurements to I/O
+        """
+        if len(self.mu) == 0: ## parameters not yet created -- initialize from the data's shape
+            self.init(X)
+        means_prev = jnp.concat(self.mu, axis=0)
+        for i in range(self.max_iter):
+            self.update(X) ## carry out one E-step followed by an M-step
+            means = jnp.concat(self.mu, axis=0)
+            dom = jnp.linalg.norm(means - means_prev) ## norm of difference-of-means
+            if verbose:
+                print(f"{i}: Mean-diff = {dom}")
+            if tol >= 0. and dom < tol:
+                print(f"Converged after {i + 1} iterations.")
+                break
+            means_prev = means
+
+    def update(self, X):
+        """
+        Performs a single iterative update (E-step followed by M-step) of parameters (assuming model initialized)
+
+        Args:
+            X: the dataset / design matrix to fit this BMM to
+        """
+        r_w = self._E_step(X)  ## carry out E-step
+        self._M_step(X, r_w) ## carry out M-step (new parameters are stored on this object)
+
+    def sample(self, n_samples, mode_j=-1):
+        """
+        Draw samples from the current underlying BMM model
+
+        Args:
+            n_samples: the number of samples to draw from this BMM
+
+            mode_j: if >= 0, will only draw samples from a specific component of this BMM
+                (Default = -1), ignoring the Categorical prior over latent variables/components
+
+        Returns:
+            Design matrix of samples drawn under the distribution defined by this BMM (when sampling the full
+            mixture, rows are grouped by component index rather than shuffled)
+        """
+        ## sample prior
+        self.key, *skey = random.split(self.key, 3)
+        if mode_j >= 0: ## sample from a particular mode / component
+            mu_j = self.mu[mode_j]
+            Xs = _sample_component(skey[0], n_samples=n_samples, mu=mu_j)
+        else: ## sample from full mixture distribution
+            ## sample components/latents
+            lats = _sample_prior_weights(skey[0], n_samples=n_samples, pi=self.pi)
+            ## then sample chosen component Bernoulli
+            Xs = []
+            for j in range(self.K):
+                freq_j = int(jnp.sum((lats == j)))  ## compute frequency over mode
+                self.key, *skey = random.split(self.key, 3)
+                x_s = _sample_component(skey[0], n_samples=freq_j, mu=self.mu[j])
+                Xs.append(x_s)
+            Xs = jnp.concat(Xs, axis=0)
+        return Xs
diff --git a/ngclearn/utils/density/gmm.py b/ngclearn/utils/density/gmm.py
@@ -260,9 +260,8 @@ def sample(self, n_samples, mode_j=-1):
             Xs = []
             for j in range(self.K):
                 freq_j = int(jnp.sum((lats == j)))  ## compute frequency over mode
-                ## draw unit Gaussian noise
                 self.key, *skey = random.split(self.key, 3)
-                x_s = _sample_component(
+                x_s = _sample_component( ## now physically sample component
                     skey[0], n_samples=freq_j, mu=self.mu[j], Sigma=self.Sigma[j], assume_diag_cov=self.assume_diag_cov
                 )
                 Xs.append(x_s)
diff --git a/tests/components/neurons/graded/test_bernoulliErrorCell.py b/tests/components/neurons/graded/test_bernoulliErrorCell.py
@@ -39,7 +39,7 @@ def clamp_target(x):
       target_xt = jnp.array([[target_seq[0, ts]]])
       clamp_target(target_xt)
       advance_process.run(t=ts * 1., dt=dt)
-      outs.append(a.dp.value)
+      outs.append(a.dp.get())
   outs = jnp.concatenate(outs, axis=1)
   # print(outs)
   ## output should equal input
diff --git a/tests/components/neurons/graded/test_gaussianErrorCell.py b/tests/components/neurons/graded/test_gaussianErrorCell.py
@@ -44,8 +44,8 @@ def clamp_target(x):
       target_t = jnp.array([[target_seq[0, ts]]])
       clamp_target(target_t)
       advance_process.run(t=ts * 1., dt=dt)
-      dmu_outs.append(a.dmu.value)
-      L_outs.append(a.L.value)
+      dmu_outs.append(a.dmu.get())
+      L_outs.append(a.L.get())
 
   dmu_outs = jnp.concatenate(dmu_outs, axis=1)
   L_outs = jnp.array(L_outs)[None] # (1, 10)
@@ -58,4 +58,4 @@ def clamp_target(x):
   np.testing.assert_allclose(dmu_outs, expected_dmu, atol=1e-5)
   np.testing.assert_allclose(L_outs, expected_L, atol=1e-5)
 
-# test_gaussianErrorCell()
+# test_gaussianErrorCell()
diff --git a/tests/components/synapses/hebbian/test_traceSTDPSynapse.py b/tests/components/synapses/hebbian/test_traceSTDPSynapse.py
@@ -4,7 +4,7 @@
 np.random.seed(42)
 
 from ngclearn import Context, MethodProcess
-import ngclearn.utils.weight_distribution as dist
+#import ngclearn.utils.weight_distribution as dist
 from ngclearn.components.synapses.hebbian.traceSTDPSynapse import TraceSTDPSynapse
 from numpy.testing import assert_array_equal
 
diff --git a/tests/components/synapses/modulated/test_MSTDPETSynapse.py b/tests/components/synapses/modulated/test_MSTDPETSynapse.py
@@ -4,7 +4,7 @@
 np.random.seed(42)
 
 from ngclearn import Context, MethodProcess
-import ngclearn.utils.weight_distribution as dist
+#import ngclearn.utils.weight_distribution as dist
 from ngclearn.components.synapses.modulated.MSTDPETSynapse import MSTDPETSynapse
 from numpy.testing import assert_array_equal
 
diff --git a/tests/components/synapses/test_STPDenseSynapse.py b/tests/components/synapses/test_STPDenseSynapse.py
@@ -4,7 +4,7 @@
 np.random.seed(42)
 
 from ngclearn import Context, MethodProcess
-import ngclearn.utils.weight_distribution as dist
+from ngclearn.utils.distribution_generator import DistributionGenerator
 from ngclearn.components.synapses.STPDenseSynapse import STPDenseSynapse
 
 def test_STPDenseSynapse1():
@@ -16,7 +16,7 @@ def test_STPDenseSynapse1():
     # ---- build a simple Poisson cell system ----
     with Context(name) as ctx:
         a = STPDenseSynapse(
-            name="a", shape=(1,1), resources_init=dist.constant(value=1.),key=subkeys[0]
+            name="a", shape=(1,1), resources_init=DistributionGenerator.constant(value=1.),key=subkeys[0]
         )
 
         advance_process = (MethodProcess("advance_proc")
diff --git a/tests/components/synapses/test_exponentialSynapse.py b/tests/components/synapses/test_exponentialSynapse.py
@@ -4,7 +4,7 @@
 np.random.seed(42)
 
 from ngclearn import Context, MethodProcess
-import ngclearn.utils.weight_distribution as dist
+from ngclearn.utils.distribution_generator import DistributionGenerator
 from ngclearn.components.synapses.exponentialSynapse import ExponentialSynapse
 
 def test_exponentialSynapse1():
@@ -19,8 +19,8 @@ def test_exponentialSynapse1():
     # ---- build a single exp-synapse system ----
     with Context(name) as ctx:
         a = ExponentialSynapse(
-            name="a", shape=(1,1), tau_decay=tau_syn, g_syn_bar=2.4, syn_rest=E_rest, weight_init=dist.constant(value=1.),
-            key=subkeys[0]
+            name="a", shape=(1,1), tau_decay=tau_syn, g_syn_bar=2.4, syn_rest=E_rest, 
+            weight_init=DistributionGenerator.constant(value=1.), key=subkeys[0]
         )
 
         advance_process = (MethodProcess("advance_proc")