Skip to content

Commit a4818f4

Browse files
authored
Merge pull request #22 from olivercliff/directed_info_fix
Modify DirectedInfo to use the causal entropy rate
2 parents c06e1a0 + dbc8fdb commit a4818f4

File tree

8 files changed

+81
-68
lines changed

8 files changed

+81
-68
lines changed

demos/simple_demo.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
""" This simple demo will show you how to quickly get started with evaluating all SPIs.
1+
""" This simple demo will show you how to quickly get started with PySPI.
22
"""
33
import numpy as np
44
from pyspi.calculator import Calculator

pyspi/config.yaml

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -103,12 +103,12 @@
103103
MultiscaleGraphCorrelation:
104104

105105
# Hilbert-Schmidt independence criterion
106-
HSIC:
106+
HilbertSchmidtIndependenceCriterion:
107107
- biased: False
108108
- biased: True
109109

110110
# Heller-Heller-Gorfine (HHG) test
111-
HHG:
111+
HellerHellerGorfine:
112112

113113
# Multi-scale graph correlation for time series
114114
CrossMultiscaleGraphCorrelation:
@@ -367,7 +367,7 @@
367367
k_history: 10
368368
l_history: 1
369369

370-
IntegratedInfo:
370+
IntegratedInformation:
371371
- phitype: "star"
372372

373373
- phitype: "star"

pyspi/data.py

Lines changed: 4 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -8,8 +8,6 @@
88
from scipy.stats import zscore
99
from scipy.signal import detrend
1010
import os
11-
from sktime.utils.data_io import load_from_tsfile_to_dataframe
12-
from sktime.datatypes._panel._convert import from_nested_to_3d_numpy
1311

1412
VERBOSE = False
1513

@@ -131,7 +129,10 @@ def convert_to_numpy(data):
131129
elif ext == ".csv":
132130
npdat = np.genfromtxt(data, ",")
133131
elif ext == ".ts":
134-
tsdat, tsclasses = load_from_tsfile_to_dataframe(data)
132+
from sktime.utils.data_io import load_from_tsfile_to_dataframe
133+
from sktime.datatypes._panel._convert import from_nested_to_3d_numpy
134+
135+
tsdat, _ = load_from_tsfile_to_dataframe(data)
135136
npdat = from_nested_to_3d_numpy(tsdat)
136137
else:
137138
raise TypeError(f"Unknown filename extension: {ext}")

pyspi/fast_config.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -83,7 +83,7 @@
8383
- biased: True
8484

8585
# Hilbert-Schmidt independence criterion
86-
HSIC:
86+
HilbertSchmidtIndependenceCriterion:
8787
- biased: False
8888
- biased: True
8989

pyspi/statistics/distance.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -44,7 +44,7 @@ def multivariate(self, data):
4444
"""
4545

4646

47-
class HSIC(Undirected, Unsigned):
47+
class HilbertSchmidtIndependenceCriterion(Undirected, Unsigned):
4848
"""Hilbert-Schmidt Independence Criterion (HSIC)"""
4949

5050
name = "Hilbert-Schmidt Independence Criterion"
@@ -63,7 +63,7 @@ def bivariate(self, data, i=None, j=None):
6363
return stat
6464

6565

66-
class HHG(Directed, Unsigned):
66+
class HellerHellerGorfine(Directed, Unsigned):
6767
"""Heller-Heller-Gorfine independence criterion"""
6868

6969
name = "Heller-Heller-Gorfine Independence Criterion"

pyspi/statistics/infotheory.py

Lines changed: 67 additions & 57 deletions
Original file line numberDiff line numberDiff line change
@@ -72,17 +72,13 @@ def __init__(
7272

7373
def __getstate__(self):
7474
state = dict(self.__dict__)
75-
try:
76-
del state["_entropy_calc"]
77-
except KeyError:
78-
pass
79-
try:
80-
del state["_calc"]
81-
except KeyError:
82-
pass
8375

84-
if "_entropy_calc" in state.keys() or "_calc" in state.keys():
85-
logging.info(f"{self.identifier} contains a calculator still")
76+
unserializable_objects = ["_entropy_calc", "_calc"]
77+
78+
for k in unserializable_objects:
79+
if k in state.keys():
80+
del state[k]
81+
8682
return state
8783

8884
def __setstate__(self, state):
@@ -161,54 +157,49 @@ def _compute_entropy(self, data, i=None):
161157

162158
if data.entropy[key][i] == -np.inf:
163159
x = np.squeeze(data.to_numpy()[i])
160+
164161
self._entropy_calc.initialise(1)
165162
self._entropy_calc.setObservations(jp.JArray(jp.JDouble, 1)(x))
163+
166164
data.entropy[key][
167165
i
168166
] = self._entropy_calc.computeAverageLocalOfObservations()
169167

170168
return data.entropy[key][i]
171169

172-
# No Theiler window yet (can it be done?)
170+
# No Theiler window is available in the JIDT estimator
173171
@parse_bivariate
174-
def _compute_JointEntropy(self, data, i, j):
175-
if not hasattr(data, "JointEntropy"):
176-
data.JointEntropy = {}
172+
def _compute_joint_entropy(self, data, i, j):
173+
if not hasattr(data, "joint_entropy"):
174+
data.joint_entropy = {}
177175

178176
key = self._getkey()
179-
if key not in data.JointEntropy:
180-
data.JointEntropy[key] = np.full(
181-
(data.n_processes, data.n_processes), -np.inf
182-
)
177+
if key not in data.joint_entropy:
178+
data.joint_entropy[key] = np.full((data.n_processes, data.n_processes), -np.infty)
183179

184-
if data.JointEntropy[key][i, j] == -np.inf:
180+
if data.joint_entropy[key][i, j] == -np.inf:
185181
x, y = data.to_numpy()[[i, j]]
186182

187183
self._entropy_calc.initialise(2)
188-
self._entropy_calc.setObservations(
189-
jp.JArray(jp.JDouble, 2)(np.concatenate([x, y], axis=1))
190-
)
191-
data.JointEntropy[key][
192-
i, j
193-
] = self._entropy_calc.computeAverageLocalOfObservations()
194-
data.JointEntropy[key][j, i] = data.JointEntropy[key][i, j]
184+
self._entropy_calc.setObservations(jp.JArray(jp.JDouble, 2)(np.concatenate([x, y], axis=1)))
195185

196-
return data.JointEntropy[key][i, j]
186+
data.joint_entropy[key][i, j] = self._entropy_calc.computeAverageLocalOfObservations()
187+
data.joint_entropy[key][j, i] = data.joint_entropy[key][i, j]
197188

198-
# No Theiler window yet (can it be done?)
199-
"""
200-
TODO: match this function with previous ones (perhaps always allow multiple i's and j's)
201-
"""
189+
return data.joint_entropy[key][i, j]
202190

191+
# No Theiler window is available in the JIDT estimator
203192
def _compute_conditional_entropy(self, X, Y):
204193
XY = np.concatenate([X, Y], axis=1)
205194

206195
self._entropy_calc.initialise(XY.shape[1])
207196
self._entropy_calc.setObservations(jp.JArray(jp.JDouble, XY.ndim)(XY))
197+
208198
H_XY = self._entropy_calc.computeAverageLocalOfObservations()
209199

210200
self._entropy_calc.initialise(Y.shape[1])
211201
self._entropy_calc.setObservations(jp.JArray(jp.JDouble, Y.ndim)(Y))
202+
212203
H_Y = self._entropy_calc.computeAverageLocalOfObservations()
213204

214205
return H_XY - H_Y
@@ -218,12 +209,14 @@ def _set_theiler_window(self, data, i, j):
218209
if not hasattr(data, "theiler"):
219210
z = data.to_numpy()
220211
theiler_window = -np.ones((data.n_processes, data.n_processes))
212+
221213
# Compute effective sample size for each pair
222214
for _i in range(data.n_processes):
223215
targ = z[_i]
224216
for _j in range(_i + 1, data.n_processes):
225217
src = z[_j]
226-
# Init the Theiler window using Bartlett's formula
218+
219+
# Initialize the Theiler window using Bartlett's formula
227220
theiler_window[_i, _j] = 2 * np.dot(
228221
utils.acf(src), utils.acf(targ)
229222
)
@@ -250,7 +243,7 @@ def __init__(self, **kwargs):
250243

251244
@parse_bivariate
252245
def bivariate(self, data, i=None, j=None):
253-
return self._compute_JointEntropy(data, i=i, j=j)
246+
return self._compute_joint_entropy(data, i=i, j=j)
254247

255248

256249
class ConditionalEntropy(JIDTBase, Directed):
@@ -264,7 +257,7 @@ def __init__(self, **kwargs):
264257

265258
@parse_bivariate
266259
def bivariate(self, data, i=None, j=None):
267-
return self._compute_JointEntropy(data, i=i, j=j) - self._compute_entropy(
260+
return self._compute_joint_entropy(data, i=i, j=j) - self._compute_entropy(
268261
data, i=i
269262
)
270263

@@ -456,40 +449,41 @@ def __init__(self, n=5, **kwargs):
456449
self._n = n
457450

458451
def _compute_causal_entropy(self, src, targ):
459-
mUtils = jp.JPackage("infodynamics.utils").MatrixUtils
460-
H = 0
452+
461453
src = np.squeeze(src)
462454
targ = np.squeeze(targ)
463-
for i in range(2, self._n):
464-
Yp = mUtils.makeDelayEmbeddingVector(jp.JArray(jp.JDouble, 1)(targ), i - 1)[
465-
1:
466-
]
467-
Xp = mUtils.makeDelayEmbeddingVector(jp.JArray(jp.JDouble, 1)(src), i)
455+
456+
m_utils = jp.JPackage("infodynamics.utils").MatrixUtils
457+
458+
causal_entropy = 0
459+
for i in range(1, self._n + 1):
460+
Yp = m_utils.makeDelayEmbeddingVector(jp.JArray(jp.JDouble, 1)(targ), i - 1)[:-1]
461+
Xp = m_utils.makeDelayEmbeddingVector(jp.JArray(jp.JDouble, 1)(src), i)
468462
XYp = np.concatenate([Yp, Xp], axis=1)
469463

470464
Yf = np.expand_dims(targ[i - 1 :], 1)
471-
H = H + self._compute_conditional_entropy(Yf, XYp)
472-
return H
465+
causal_entropy = causal_entropy + self._compute_conditional_entropy(Yf, XYp)
466+
return causal_entropy
473467

474468
def _getkey(self):
475469
return super(CausalEntropy, self)._getkey() + (self._n,)
476470

477471
@parse_bivariate
478472
def bivariate(self, data, i=None, j=None):
479-
if not hasattr(data, "CausalEntropy"):
480-
data.CausalEntropy = {}
473+
if not hasattr(data, "causal_entropy"):
474+
data.causal_entropy = {}
481475

482476
key = self._getkey()
483-
if key not in data.CausalEntropy:
484-
data.CausalEntropy[key] = np.full(
477+
if key not in data.causal_entropy:
478+
data.causal_entropy[key] = np.full(
485479
(data.n_processes, data.n_processes), -np.inf
486480
)
487481

488-
if data.CausalEntropy[key][i, j] == -np.inf:
482+
if data.causal_entropy[key][i, j] == -np.inf:
489483
z = data.to_numpy(squeeze=True)
490-
data.CausalEntropy[key][i, j] = self._compute_causal_entropy(z[i], z[j])
484+
data.causal_entropy[key][i, j] = self._compute_causal_entropy(z[i], z[j])
491485

492-
return data.CausalEntropy[key][i, j]
486+
return data.causal_entropy[key][i, j]
493487

494488

495489
class DirectedInfo(CausalEntropy, Directed):
@@ -498,18 +492,34 @@ class DirectedInfo(CausalEntropy, Directed):
498492
identifier = "di"
499493
labels = ["unsigned", "infotheory", "temporal", "directed"]
500494

501-
def __init__(self, n=10, **kwargs):
495+
def __init__(self, n=5, **kwargs):
502496
super().__init__(**kwargs)
503497
self._n = n
504498

499+
def _compute_entropy_rates(self, targ):
500+
501+
targ = np.squeeze(targ)
502+
m_utils = jp.JPackage("infodynamics.utils").MatrixUtils
503+
504+
entropy_rate_sum = 0
505+
for i in range(1, self._n + 1):
506+
# Compute entropy for an i-dimensional embedding
507+
self._entropy_calc.initialise(i)
508+
509+
Yi = m_utils.makeDelayEmbeddingVector(jp.JArray(jp.JDouble, 1)(targ), i)
510+
self._entropy_calc.setObservations(Yi)
511+
entropy_rate_sum = entropy_rate_sum + self._entropy_calc.computeAverageLocalOfObservations() / i
512+
513+
return entropy_rate_sum
514+
505515
@parse_bivariate
506516
def bivariate(self, data, i=None, j=None):
507517
"""Compute directed information from i to j"""
508-
# Would prefer to match these two calls
509-
entropy = self._compute_entropy(data, j)
510-
CausalEntropy = super(DirectedInfo, self).bivariate(data, i=i, j=j)
511518

512-
return entropy - CausalEntropy
519+
entropy_rates = self._compute_entropy_rates(data.to_numpy(squeeze=True)[j])
520+
causal_entropy = super().bivariate(data, i=i, j=j)
521+
522+
return entropy_rates - causal_entropy
513523

514524

515525
class StochasticInteraction(JIDTBase, Undirected):
@@ -536,7 +546,7 @@ def bivariate(self, data, i=None, j=None, verbose=False):
536546
return H_src + H_targ - H_joint
537547

538548

539-
class IntegratedInfo(Undirected, Unsigned):
549+
class IntegratedInformation(Undirected, Unsigned):
540550

541551
name = "Integrated information"
542552
identifier = "phi"
@@ -552,7 +562,7 @@ def __init__(self, phitype="star", delay=1, normalization=0):
552562
self.identifier += f"_{phitype}_t-{delay}_norm-{normalization}"
553563

554564
@parse_bivariate
555-
def bivariate(self, data, i=None, j=None, verbose=False):
565+
def bivariate(self, data, i=None, j=None):
556566

557567
if not octave.exist("phi_comp"):
558568
path = os.path.dirname(os.path.abspath(__file__)) + "/../lib/PhiToolbox/"

pyspi/statistics/misc.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -72,11 +72,13 @@ def _from_cache(self, data, i, j):
7272
maxlag=self._maxlag,
7373
trend=self._trend,
7474
)
75+
7576
ci = {"tstat": stats[0]}
7677
else:
7778
stats = coint_johansen(
7879
z[[i, j]].T, det_order=self._det_order, k_ar_diff=self._k_ar_diff
7980
)
81+
8082
ci = {
8183
"max_eig_stat": stats.max_eig_stat[0],
8284
"trace_stat": stats.trace_stat[0],

setup.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -66,7 +66,7 @@
6666
'data/cml.npy',
6767
'data/forex.npy']},
6868
include_package_data=True,
69-
version='0.2.2',
69+
version='0.4.0',
7070
description='Network analysis for time series',
7171
author='Oliver M. Cliff',
7272
author_email='[email protected]',

0 commit comments

Comments (0)