
Commit 6eb96b1

Adapt metrics to vmap over the last axis

1 parent 3946e19 · commit 6eb96b1

File tree: 11 files changed (+43 / -35 lines)
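Taken together, the changes drop the (n_variables, n_features, n_samples) transpose in prepare_for_entropy, switch the per-variable estimators to a (n_samples, n_features) layout, and pass in_axes=2 to every jax.vmap call so batching runs over the trailing n_variables axis. A minimal sketch of that pattern (the per_variable_fn stand-in is hypothetical, not part of the commit):

```python
import jax
import jax.numpy as jnp

def per_variable_fn(x):
    # stand-in for an estimator that maps one (n_samples, n_features)
    # slice to a scalar, like the entropy functions in this commit
    return jnp.var(x)

data = jnp.ones((100, 3, 5))  # (n_samples, n_features, n_variables)

# in_axes=2 vectorizes over the last axis: each call sees a
# (n_samples, n_features) slice, and one value per variable comes back
batched = jax.vmap(per_variable_fn, in_axes=2)
print(batched(data).shape)  # (5,)
```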

hoi/core/entropies.py

Lines changed: 29 additions & 21 deletions

```diff
@@ -22,7 +22,7 @@
 ###############################################################################
 
 
-def get_entropy(method="gcmi", **kwargs):
+def get_entropy(method="gcmi", vmap=False, **kwargs):
     """Get entropy function.
 
     Parameters
@@ -43,7 +43,10 @@ def get_entropy(method="gcmi", **kwargs):
     elif method == "binning":
         return partial(entropy_bin, **kwargs)
     elif method == "knn":
-        return partial(entropy_knn, **kwargs)
+        # wrap distance funtion with k
+        k = kwargs.get("k", 1)
+        cdist = partial(cdistk, k=k)
+        return partial(_entropy_knn, cdist=cdist, k=k)
     elif method == "kernel":
         return partial(entropy_kernel, **kwargs)
     else:
@@ -57,7 +60,7 @@ def get_entropy(method="gcmi", **kwargs):
 ###############################################################################
 
 
-def prepare_for_entropy(data, method, reshape=True, **kwargs):
+def prepare_for_entropy(data, method, **kwargs):
     """Prepare the data before computing entropy."""
     # data.shape = n_samples, n_features, n_variables
 
@@ -84,10 +87,6 @@ def prepare_for_entropy(data, method, reshape=True, **kwargs):
     elif method == "binning":
         pass
 
-    # make the data (n_variables, n_features, n_samples)
-    if reshape:
-        data = jnp.asarray(data.transpose(2, 1, 0))
-
     return data, kwargs
 
 
@@ -110,7 +109,7 @@ def entropy_gcmi(
     Parameters
     ----------
     x : array_like
-        Array of data of shape (n_features, n_samples)
+        Array of data of shape (n_samples, n_features)
     biascorrect : bool | False
         Specifies whether bias correction should be applied to the estimated MI
     demean : bool | False
@@ -121,14 +120,14 @@
     hx : float
         Entropy of the gaussian variable (in bits)
     """
-    nfeat, nsamp = x.shape
+    nsamp, nfeat = x.shape
 
     # demean data
     if demean:
-        x = x - x.mean(axis=1, keepdims=True)
+        x = x - x.mean(axis=0, keepdims=True)
 
     # covariance
-    c = jnp.dot(x, x.T) / float(nsamp - 1)
+    c = jnp.dot(x.T, x) / float(nsamp - 1)
     chc = jnp.linalg.cholesky(c)
 
     # entropy in nats
@@ -218,7 +217,7 @@ def entropy_bin(x: jnp.array, base: int = 2) -> jnp.array:
     Parameters
     ----------
     x : array_like
-        Input data of shape (n_features, n_samples). The data should already
+        Input data of shape (n_samples, n_features). The data should already
         be discretize
     base : int | 2
         The logarithmic base to use. Default is base 2.
@@ -228,13 +227,13 @@ def entropy_bin(x: jnp.array, base: int = 2) -> jnp.array:
     hx : float
         Entropy of x
     """
-    n_features, n_samples = x.shape
+    n_samples, n_features = x.shape
     # here, we count the number of possible multiplets. The worst is that each
     # trial is unique. So we can prepare the output to be at most (n_samples,)
     # and if trials are repeated, just set to zero it's going to be compensated
     # by the entr() function
     counts = jnp.unique(
-        x, return_counts=True, size=n_samples, axis=1, fill_value=0
+        x, return_counts=True, size=n_samples, axis=0, fill_value=0
     )[1]
     probs = counts / n_samples
     return jax.scipy.special.entr(probs).sum() / np.log(base)
@@ -257,10 +256,10 @@ def set_to_inf(x, _):
 @partial(jax.jit, static_argnums=(2,))
 def cdistk(xx, idx, k=1):
     """K-th minimum euclidian distance."""
-    x, y = xx[:, [idx]], xx
+    x, y = xx[[idx], :], xx
 
     # compute euclidian distance
-    eucl = jnp.sqrt(jnp.sum((x - y) ** 2, axis=0))
+    eucl = jnp.sqrt(jnp.sum((x - y) ** 2, axis=1))
 
     # in case of 0-distances, replace them by infinity
     eucl = jnp.where(eucl == 0, jnp.inf, eucl)
@@ -271,8 +270,8 @@ def cdistk(xx, idx, k=1):
     return xx, eucl[jnp.argmin(eucl)]
 
 
-@partial(jax.jit, static_argnums=(1,))
-def entropy_knn(x: jnp.array, k: int = 1) -> jnp.array:
+@partial(jax.jit, static_argnums=(1, 2))
+def entropy_knn(x: jnp.array, k: int = 1, cdist=None) -> jnp.array:
     """Entropy using the k-nearest neighbor.
 
     Original code: https://github.com/blakeaw/Python-knn-entropy/
@@ -292,6 +291,14 @@ def entropy_knn(x: jnp.array, k: int = 1) -> jnp.array:
     hx : float
         Entropy of x
     """
+    # wrap cdist
+    cdist = partial(cdistk, k=k)
+    fcn = partial(_entropy_knn, cdist=cdist, k=k)
+    return fcn(x)
+
+
+@partial(jax.jit, static_argnums=(1, 2))
+def _entropy_knn(x: jnp.array, k: int = 1, cdist=None) -> jnp.array:
     # x = jnp.atleast_2d(x)
     d, n = float(x.shape[0]), float(x.shape[1])
 
@@ -330,14 +337,15 @@ def entropy_kernel(
     Parameters
     ----------
     x : array_like
-        Input data of shape (n_features, n_samples)
+        Input data of shape (n_samples, n_features)
 
     Returns
     -------
     hx : float
         Entropy of x
     """
-    model = gaussian_kde(x, bw_method=bw_method)
-    return -jnp.mean(jnp.log2(model(x)))
+    x_t = x.T
+    model = gaussian_kde(x_t, bw_method=bw_method)
+    return -jnp.mean(jnp.log2(model(x_t)))
     # p = model.pdf(x)
     # return jax.scipy.special.entr(p).sum() / np.log(base)
```
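A quick way to see the new entropy_gcmi convention at work: with samples on axis 0, demeaning along axis 0 and forming jnp.dot(x.T, x) / (nsamp - 1) is the usual sample covariance. A hedged sanity check against jnp.cov (not from the commit):

```python
import jax
import jax.numpy as jnp

x = jax.random.normal(jax.random.PRNGKey(0), (1000, 3))  # (n_samples, n_features)

# demean over samples, then covariance as in the new entropy_gcmi
xd = x - x.mean(axis=0, keepdims=True)
c = jnp.dot(xd.T, xd) / float(x.shape[0] - 1)  # (n_features, n_features)

# jnp.cov expects variables in rows, hence the transpose
assert jnp.allclose(c, jnp.cov(x.T), atol=1e-5)
```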

hoi/core/mi.py

Lines changed: 3 additions & 3 deletions

```diff
@@ -70,8 +70,8 @@ def compute_mi(x, y, entropy_fcn=None):
     ----------
     x, y : array_like
         Arrays to consider for computing the Mutual Information. The two input
-        variables x and y should have a shape of (n_features_x, n_samples) and
-        (n_features_y, n_samples)
+        variables x and y should have a shape of (n_samples, n_features_x) and
+        (n_samples, n_features_y)
     entropy_fcn : function | None
         Function to use for computing the entropy.
 
@@ -84,6 +84,6 @@ def compute_mi(x, y, entropy_fcn=None):
     mi = (
         entropy_fcn(x)
         + entropy_fcn(y)
-        - entropy_fcn(jnp.concatenate((x, y), axis=0))
+        - entropy_fcn(jnp.concatenate((x, y), axis=1))
     )
     return mi
```
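With samples on axis 0, the joint variable for H(x, y) is now built by stacking features on axis 1, as the last hunk shows. A small sketch of the H(x) + H(y) - H(x, y) decomposition with a stand-in Gaussian entropy (the real entropy_fcn comes from get_entropy):

```python
import jax
import jax.numpy as jnp

def gauss_entropy(x):
    # stand-in Gaussian entropy (in nats) for (n_samples, n_features) data
    n, d = x.shape
    xd = x - x.mean(axis=0, keepdims=True)
    c = jnp.dot(xd.T, xd) / float(n - 1)
    return 0.5 * (d * jnp.log(2 * jnp.pi * jnp.e) + jnp.linalg.slogdet(c)[1])

kx, ky = jax.random.split(jax.random.PRNGKey(0))
x = jax.random.normal(kx, (500, 2))                    # (n_samples, n_features_x)
y = 0.5 * x[:, [0]] + jax.random.normal(ky, (500, 1))  # dependent on x

# mi = h(x) + h(y) - h([x, y]); the joint is concatenated on the feature axis
mi = gauss_entropy(x) + gauss_entropy(y) - gauss_entropy(
    jnp.concatenate((x, y), axis=1)
)
print(mi)  # > 0 since x and y are correlated
```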

hoi/metrics/base_hoi.py

Lines changed: 1 addition & 1 deletion

```diff
@@ -182,7 +182,7 @@ def compute_entropies(
         # get entropy function
         entropy = partial(
             ent_at_index,
-            entropy=jax.vmap(get_entropy(method=method, **kwargs)),
+            entropy=jax.vmap(get_entropy(method=method, **kwargs), in_axes=2),
         )
 
         # ______________________________ ENTROPY ______________________________
```
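The in_axes=2 added here (and in the metric fit methods below) is equivalent to looping over the last axis without transposing the data first; a hedged equivalence check with a stand-in estimator:

```python
import jax
import jax.numpy as jnp

def ent(x):
    # stand-in for the vmapped entropy: (n_samples, n_features) -> scalar
    return jnp.var(x)

data = jnp.arange(24.0).reshape(4, 2, 3)  # (n_samples, n_features, n_variables)

vmapped = jax.vmap(ent, in_axes=2)(data)
looped = jnp.stack([ent(data[:, :, i]) for i in range(data.shape[2])])
assert jnp.allclose(vmapped, looped)  # one entropy per variable, no transpose
```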

hoi/metrics/dtc.py

Lines changed: 1 addition & 1 deletion

```diff
@@ -110,7 +110,7 @@ def fit(self, minsize=2, maxsize=None, method="gcmi", **kwargs):
         x, kwargs = prepare_for_entropy(self._x, method, **kwargs)
 
         # get entropy function
-        entropy = jax.vmap(get_entropy(method=method, **kwargs))
+        entropy = jax.vmap(get_entropy(method=method, **kwargs), in_axes=2)
         dtc_no_ent = partial(
             _dtc_no_ent,
             entropy_3d=entropy,
```

hoi/metrics/info_tot.py

Lines changed: 1 addition & 1 deletion

```diff
@@ -77,7 +77,7 @@ def fit(self, minsize=2, maxsize=None, method="gcmi", **kwargs):
         x, y = self._split_xy(x)
 
         # prepare mi functions
-        mi_fcn = jax.vmap(get_mi(method=method, **kwargs))
+        mi_fcn = jax.vmap(get_mi(method=method, **kwargs), in_axes=2)
         compute_mi = partial(compute_mi_comb, mi=mi_fcn)
 
         # get multiplet indices and order
```

hoi/metrics/oinfo.py

Lines changed: 3 additions & 3 deletions

```diff
@@ -21,10 +21,10 @@ def _oinfo_no_ent(inputs, index, entropy_3d=None, entropy_4d=None):
     # compute h(x^{n})
     h_xn = entropy_3d(x_c)
 
-    # compute \sum_{j=1}^{n} h(x_{j}
+    # compute \sum_{j=1}^{n} h(x_{j})
     h_xj_sum = entropy_4d(x_c[:, :, jnp.newaxis, :]).sum(0)
 
-    # compute \sum_{j=1}^{n} h(x_{-j}
+    # compute \sum_{j=1}^{n} h(x_{-j})
     h_xmj_sum = entropy_4d(x_c[:, acc, :]).sum(0)
 
     # compute oinfo
@@ -115,7 +115,7 @@ def fit(self, minsize=2, maxsize=None, method="gcmi", **kwargs):
         x, kwargs = prepare_for_entropy(self._x, method, **kwargs)
 
         # get entropy function
-        entropy = jax.vmap(get_entropy(method=method, **kwargs))
+        entropy = jax.vmap(get_entropy(method=method, **kwargs), in_axes=2)
         oinfo_no_ent = partial(
             _oinfo_no_ent,
             entropy_3d=entropy,
```
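The corrected comments name the three entropy terms that _oinfo_no_ent combines; for reference, the O-information they assemble is usually written as follows (my transcription of Rosas et al.'s definition, not part of the diff):

```latex
\Omega(X^{n}) = (n - 2)\, H(X^{n})
              + \sum_{j=1}^{n} \left[ H(X_{j}) - H\left(X^{n}_{-j}\right) \right]
```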

hoi/metrics/red_mmi.py

Lines changed: 1 addition & 1 deletion

```diff
@@ -74,7 +74,7 @@ def fit(self, minsize=2, maxsize=None, method="gcmi", **kwargs):
         x, y = self._split_xy(x)
 
         # prepare mi functions
-        mi_fcn = jax.vmap(get_mi(method=method, **kwargs))
+        mi_fcn = jax.vmap(get_mi(method=method, **kwargs), in_axes=2)
         compute_mi = partial(compute_mi_comb, mi=mi_fcn)
 
         # get multiplet indices and order
```

hoi/metrics/rsi.py

Lines changed: 1 addition & 1 deletion

```diff
@@ -101,7 +101,7 @@ def fit(self, minsize=2, maxsize=None, method="gcmi", **kwargs):
         x, y = self._split_xy(x)
 
         # prepare mi functions
-        mi_fcn = jax.vmap(get_mi(method=method, **kwargs))
+        mi_fcn = jax.vmap(get_mi(method=method, **kwargs), in_axes=2)
         compute_mi = partial(compute_mi_comb, mi=mi_fcn)
 
         # get multiplet indices and order
```

hoi/metrics/sinfo.py

Lines changed: 1 addition & 1 deletion

```diff
@@ -111,7 +111,7 @@ def fit(self, minsize=2, maxsize=None, method="gcmi", **kwargs):
         x, kwargs = prepare_for_entropy(self._x, method, **kwargs)
 
         # get entropy function
-        entropy = jax.vmap(get_entropy(method=method, **kwargs))
+        entropy = jax.vmap(get_entropy(method=method, **kwargs), in_axes=2)
         sinfo_no_ent = partial(
             _sinfo_no_ent,
             entropy_3d=entropy,
```

hoi/metrics/syn_mmi.py

Lines changed: 1 addition & 1 deletion

```diff
@@ -90,7 +90,7 @@ def fit(self, minsize=2, maxsize=None, method="gcmi", **kwargs):
         x, y = self._split_xy(x)
 
         # prepare mi functions
-        mi_fcn = jax.vmap(get_mi(method=method, **kwargs))
+        mi_fcn = jax.vmap(get_mi(method=method, **kwargs), in_axes=2)
         compute_mi = partial(compute_mi_comb, mi=mi_fcn)
         compute_syn = partial(_compute_syn, mi_fcn=compute_mi)
 
```

hoi/metrics/tc.py

Lines changed: 1 addition & 1 deletion

```diff
@@ -110,7 +110,7 @@ def fit(self, minsize=2, maxsize=None, method="gcmi", **kwargs):
         x, kwargs = prepare_for_entropy(self._x, method, **kwargs)
 
         # get entropy function
-        entropy = jax.vmap(get_entropy(method=method, **kwargs))
+        entropy = jax.vmap(get_entropy(method=method, **kwargs), in_axes=2)
         tc_no_ent = partial(
             _tc_no_ent,
             entropy_3d=entropy,
```
