minor edits/updates

Alexander Ororbia · Alexander Ororbia · commit abe7dfa78b7e · 2026-05-20T00:37:27.000-04:00
diff --git a/ngclearn/components/synapses/hebbian/gerstnerHebbianSynapse.py b/ngclearn/components/synapses/hebbian/gerstnerHebbianSynapse.py
@@ -0,0 +1,113 @@
+import jax.numpy as jnp
+from jax import random, jit
+
+from ngclearn import compilable
+from ngclearn import Compartment
+from ngclearn.components.synapses import DenseSynapse
+from ngclearn.utils import tensorstats
+from ngcsimlib import deprecate_args
+#from ngclearn.utils.io_utils import save_pkl, load_pkl
+
+class GerstnerHebbianSynapse(DenseSynapse):
+    r"""
+    A synapse component that implements Gerstner's general Hebbian
+    learning (Taylor) expansion (Equation 3 from Gerstner & Kistler, 2002).
+
+    Note that this synaptic update model can recover several classical forms
+    of Hebbian-like update rules, including the covariance rule.
+
+    There are other higher-order terms possible, i.e., \Theta(xy), such as
+    x * y^2 and y * x^2, etc.; these are not computed by this component.
+
+    | c2_corr > 0 and c0 = c1_pre = c1_post = 0 => Hebbian update
+    | c2_corr < 0 and c0 = c1_pre = c1_post = 0 => anti-Hebbian update
+    | c2_corr = 1 and c1_pre = -x_theta < 0
+
+    Args:
+        name: the string name of this component
+        shape: 2-tuple (pre_dim, post_dim); NOTE(review): assumes the parent
+            DenseSynapse allocates `weights` with exactly this shape -- confirm
+        eta: global step-size applied to the synaptic update
+        coeffs: dict with keys 'c0', 'c1_pre', 'c1_post', 'c2_corr'; if None,
+            the standard bilinear Hebbian rule (c2_corr = 1, rest 0) is used
+        weight_init, p_conn, resist_scale, batch_size, kwargs: forwarded
+            to the parent DenseSynapse constructor
+        sign_value: stored on the component; NOTE(review): evolve() does not
+            apply it -- confirm whether it should scale the update
+    """
+    def __init__(
+        self, name, shape, eta=0.01, coeffs=None, weight_init=None, p_conn=1.,
+        resist_scale=1., sign_value=1., batch_size=1, **kwargs
+    ):
+        ## no biases are included in Gerstner's formulation (bias_init=None)
+        super().__init__(
+            name, shape=shape, weight_init=weight_init, bias_init=None,
+            resist_scale=resist_scale, p_conn=p_conn, batch_size=batch_size,
+            **kwargs
+        )
+        ## General Hebbian meta-parameters
+        self.eta = eta
+        self.sign_value = sign_value
+
+        ## Expansion coefficients (c0, c1_pre, c1_post, c2_corr)
+        if coeffs is None: ## Default to standard bilinear Hebb
+            self.coeffs = {
+                'c0': 0., 'c1_pre': 0., 'c1_post': 0., 'c2_corr': 1.0
+            }
+        else:
+            self.coeffs = coeffs
+        self.c0 = self.coeffs['c0']
+        self.c1_pre = self.coeffs['c1_pre']
+        self.c1_post = self.coeffs['c1_post']
+        self.c2_corr = self.coeffs['c2_corr']
+
+        ## Activity compartments; the weights are set up by the parent class.
+        ## Shapes match reset() so compartment shapes do not change on reset,
+        ## and match evolve(), where x.T @ y must have the shape of the weights
+        self.pre = Compartment(jnp.zeros((batch_size, shape[0])))
+        self.post = Compartment(jnp.zeros((batch_size, shape[1])))
+
+    @compilable
+    def evolve(self, **kwargs):
+        """
+        Updates weights using the Gerstner general expansion.
+        Assumes the pre and post compartments have been populated.
+
+        The batch-averaged update is eta * (c0 * W + c1_pre * <x> +
+        c1_post * <y> + c2_corr * <x y>), written back into `weights`.
+        """
+        # Retrieve current states
+        W = self.weights.get()
+        x = self.pre.get()  # pre-synaptic activity (batch, pre_dim)
+        y = self.post.get() # post-synaptic activity (batch, post_dim)
+        batch_size = self.batch_size
+
+        ## Bilinear Term (c2): correlation matrix
+        ### (pre_dim, batch) @ (batch, post_dim) -> (pre_dim, post_dim)
+        dW_corr = jnp.matmul(x.T, y) * (1./batch_size)
+        ## Linear pre-synaptic term (c1_pre)
+        ### Average over batch -> (pre_dim, 1); broadcasts across columns
+        dW_pre = jnp.sum(x, axis=0, keepdims=True).T * (1./batch_size)
+        ## Linear post-synaptic term (c1_post)
+        ### Average over batch -> (1, post_dim); broadcasts across rows
+        dW_post = jnp.sum(y, axis=0, keepdims=True) * (1./batch_size)
+
+        ## Apply Equation 3 Taylor expansion
+        dW = (self.c0 * W +  ## weight-proportional (decay) term
+              self.c1_pre * dW_pre +  ## pre-synaptic (linear) term
+              self.c1_post * dW_post +  ## post-synaptic (linear) term
+              self.c2_corr * dW_corr  ## bilinear (correlation) term
+        )
+        ## perform a step of Hebbian ascent
+        W = W + self.eta * dW
+        ## Update weights
+        self.weights.set(W)
+
+    @compilable
+    def reset(self, **kwargs):
+        """
+        Clears activity compartments (zeros of batch_size rows).
+        """
+        self.pre.set( jnp.zeros((self.batch_size, self.shape[0])) )
+        self.post.set( jnp.zeros((self.batch_size, self.shape[1])) )
+
diff --git a/ngclearn/utils/filters/gauss_filter.py b/ngclearn/utils/filters/gauss_filter.py
@@ -2,7 +2,6 @@
 from jax import lax, jit
 from functools import partial
 
-
 def _calc_gaussian_kernel_2D( ## internal co-routine
         sigma: float,
         radius: int
@@ -21,7 +20,8 @@ def gaussian_filter(
         sigma_center: float, ## sigma1
         sigma_surround: float, ## sigma2
         kernel_size : int, ## radius
-        use_ratio=False ## if True, this becomes a ratio-of-Gaussians
+        use_ratio=False, ## if True, this becomes a ratio-of-Gaussians
+        edge_pad_mode="edge" ## "reflect"
 ) -> jnp.ndarray:
     """
     Applies a difference-of-Gaussians filter to a batch of 2D images (of CxHxW tensor shape).
@@ -40,27 +40,38 @@ def gaussian_filter(
     Returns:
         An output tensor of shape (B, C, H, W)
     """
-    x = images
+    ## Pad spatial dimensions (H, W) using edge-clamping to remove artifacts
+    # Format for 4D (B, C, H, W): ((Before_B, After_B), (Before_C, After_C), (Before_H, After_H), (Before_W, After_W))
+    padding_config = ((0, 0), (0, 0), (kernel_size, kernel_size), (kernel_size, kernel_size))
+    padded_x = jnp.pad(images, padding_config, mode=edge_pad_mode)
+
     ## Construct two 2D Gaussian kernels
     k1 = _calc_gaussian_kernel_2D(sigma_center, kernel_size) ## center kernel
     k2 = _calc_gaussian_kernel_2D(sigma_surround, kernel_size) ## surround kernel
+
     ## Define dimension ordering for lax.conv ('NCHW' standard layout)
     dn = lax.ConvDimensionNumbers(
         lhs_spec=(0, 1, 2, 3), ## (batch, channel, height, width)
         rhs_spec=(0, 1, 2, 3), ## (out_channel, in_channel, height, width)
         out_spec=(0, 1, 2, 3)  ## (batch, channel, height, width)
     )
-    ## Perform spatial convolutions w/ edge padding to emulate 'SAME' behavior
+
+    ## Extract channel count dynamically for independent channel-wise filtering
+    num_channels = images.shape[1]
+
+    ## Perform spatial convolutions w/ 'VALID' padding on the edge-padded input
     blur_center = lax.conv_general_dilated(
-        x, k1, window_strides=(1, 1), padding=[(kernel_size, kernel_size), (kernel_size, kernel_size)], dimension_numbers=dn
+        padded_x, k1, window_strides=(1, 1), padding='VALID', dimension_numbers=dn, feature_group_count=num_channels
     )
     blur_surround = lax.conv_general_dilated(
-        x, k2, window_strides=(1, 1), padding=[(kernel_size, kernel_size), (kernel_size, kernel_size)], dimension_numbers=dn
+        padded_x, k2, window_strides=(1, 1), padding='VALID', dimension_numbers=dn, feature_group_count=num_channels
     )
+
     ## Perform final filter calculation
     if use_ratio:
         eps = 1e-5
-        output = blur_center / (blur_surround + eps) ## Compute kernel difference
+        output = blur_center / (blur_surround + eps) ## Compute kernel ratio
     else:
-        output = blur_center - blur_surround ## Compute kernel ratio
+        output = blur_center - blur_surround ## Compute kernel difference
     return output ## shape: (B, C, H, W)
+