[Feature] Online batched statistics measures #405

Open

wants to merge 46 commits into master from feature/online_measures

Commits (46)
31cfded
MeanOnline & VarianceOnline
dizcza Oct 23, 2020
e6fa691
mean firing rate and cv
dizcza Oct 23, 2020
a8da7f7
test cv2, lv, lvr online
dizcza Oct 24, 2020
977979f
test fanofactor
dizcza Oct 24, 2020
5e5b57b
fixed bug in spike_contrast; test spike_contrast online
dizcza Oct 24, 2020
60e79c3
waveform_snr works directly with waveforms
dizcza Oct 25, 2020
eb70d27
easier use-case of online spike_contrast
dizcza Oct 25, 2020
080fcb3
fast conversion
dizcza Oct 25, 2020
7c886c6
zero-out corrcoef diag
dizcza Oct 25, 2020
9442955
fixed bug in n_discarded calculation
dizcza Oct 25, 2020
abf43ce
rewrote BinnedSpikeTrain
dizcza Oct 26, 2020
73fa2d1
don't cut spiketrains while binning: raise an error if t_start or t_s…
dizcza Oct 26, 2020
7bc09a4
efficient to_array()
dizcza Oct 26, 2020
97cfba9
faster binning in BinnedSpikeTrain
dizcza Oct 26, 2020
61cbfee
utils doc
dizcza Oct 26, 2020
8526e05
Merge branch 'master' into feature/online_measures
dizcza Oct 26, 2020
cc4aca0
faster BinnedSpikeTrain with a bugfix for the incorrectly estimated n…
dizcza Oct 26, 2020
f57c763
don't wrap spiketrain.data in array in python2
dizcza Oct 27, 2020
54fdd55
fixed tests style
dizcza Oct 27, 2020
3d09266
using spiketrain.magnitude
dizcza Oct 28, 2020
00150af
Merge branch 'opt/binned_spiketrain' into feature/online_measures
dizcza Oct 29, 2020
0378385
Merge branch 'master' into feature/online_measures
dizcza Nov 18, 2020
481fa9c
in-place mean, std in zscore
dizcza Nov 18, 2020
2b0b1c6
Merge branch 'master' into feature/online_measures
dizcza Feb 8, 2021
a7d24ad
Merge branch 'master' into feature/online_measures
dizcza Feb 22, 2021
96e3eb8
Batched-version of Covariance and Pearson Correlation Coefficient (#90)
ojoenlanuca Feb 7, 2022
1dcaa98
created batched-version of InterSpikeInterval with UnitTests (#89)
ojoenlanuca Feb 7, 2022
fd71e12
Merge branch 'master' into feature/online_measures
Jun 23, 2022
112ede2
removed doubled Neo import
Jun 23, 2022
7420a8f
fixed indents and replaced deprecated homogeneous_poisson_process
Jun 24, 2022
fca26d0
adjusted test precision for test_spike_contrast in test_online.py
Jun 24, 2022
efab69d
fix pep8
Sep 2, 2022
2b0ecbb
Merge branch 'master' into feature/online_measures
Nov 7, 2022
dd18b3c
Merge branch 'master' into feature/online_measures
Nov 17, 2022
305a8ac
update citation
Nov 17, 2022
9985314
defined constant for warning message
Nov 17, 2022
a15669c
fix typos, simplify if statement
Nov 17, 2022
e60149d
add comment to empty if statement
Nov 17, 2022
f305583
fix if statement
Nov 17, 2022
9ca854b
fix deprecations
Nov 17, 2022
3f6c5f0
fix deprecations
Nov 17, 2022
5ff8803
Merge branch 'master' into feature/online_measures
Moritz-Alexander-Kern Apr 4, 2024
ef5155d
Fix neo consistency import
Moritz-Alexander-Kern Apr 4, 2024
f157bb5
fix missing parameter in correlation_coefficient
Moritz-Alexander-Kern Apr 4, 2024
d512848
fix pep8
Moritz-Alexander-Kern Apr 4, 2024
bf80d48
fix macOS CI runner
Moritz-Alexander-Kern Apr 4, 2024
253 changes: 253 additions & 0 deletions elephant/online.py
@@ -0,0 +1,253 @@
from copy import deepcopy

import numpy as np
import quantities as pq

from elephant.statistics import isi

msg_same_units = "Each batch must have the same units."


class MeanOnline(object):
def __init__(self, batch_mode=False):
self.mean = None
self.count = 0
self.units = None
self.batch_mode = batch_mode

def update(self, new_val):
units = None
if isinstance(new_val, pq.Quantity):
units = new_val.units
new_val = new_val.magnitude
if self.batch_mode:
batch_size = new_val.shape[0]
new_val_sum = new_val.sum(axis=0)
else:
batch_size = 1
new_val_sum = new_val
self.count += batch_size
if self.mean is None:
self.mean = deepcopy(new_val_sum / batch_size)
self.units = units
else:
if units != self.units:
raise ValueError(msg_same_units)
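            # incremental mean update: new_mean = old_mean +
            # (batch_sum - old_mean * batch_size) / new_count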
self.mean += (new_val_sum - self.mean * batch_size) / self.count

def as_units(self, val):
if self.units is None:
return val
return pq.Quantity(val, units=self.units, copy=False)

def get_mean(self):
return self.as_units(deepcopy(self.mean))

def reset(self):
self.mean = None
self.count = 0
self.units = None


class VarianceOnline(MeanOnline):
def __init__(self, batch_mode=False):
super(VarianceOnline, self).__init__(batch_mode=batch_mode)
self.variance_sum = 0.

def update(self, new_val):
units = None
if isinstance(new_val, pq.Quantity):
units = new_val.units
new_val = new_val.magnitude
if self.mean is None:
self.mean = 0.
self.variance_sum = 0.
self.units = units
elif units != self.units:
raise ValueError(msg_same_units)
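        # Welford's online algorithm: self.variance_sum accumulates
        # M2 = sum((x - old_mean) * (x - new_mean))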
delta_var = new_val - self.mean
if self.batch_mode:
batch_size = new_val.shape[0]
self.count += batch_size
delta_mean = new_val.sum(axis=0) - self.mean * batch_size
self.mean += delta_mean / self.count
delta_var *= new_val - self.mean
delta_var = delta_var.sum(axis=0)
else:
self.count += 1
self.mean += delta_var / self.count
delta_var *= new_val - self.mean
self.variance_sum += delta_var

def get_mean_std(self, unbiased=False):
if self.mean is None:
return None, None
if self.count > 1:
count = self.count - 1 if unbiased else self.count
std = np.sqrt(self.variance_sum / count)
else:
            # with a single update, biased and unbiased sample variance
            # are both zero
std = 0.
mean = self.as_units(deepcopy(self.mean))
std = self.as_units(std)
return mean, std

def reset(self):
super(VarianceOnline, self).reset()
self.variance_sum = 0.


class InterSpikeIntervalOnline(object):
def __init__(self, bin_size=0.0005, max_isi_value=1, batch_mode=False):
self.max_isi_value = max_isi_value # in sec
self.last_spike_time = None
self.bin_size = bin_size # in sec
self.num_bins = int(self.max_isi_value / self.bin_size)
self.bin_edges = np.linspace(start=0, stop=self.max_isi_value,
num=self.num_bins + 1)
self.current_isi_histogram = np.zeros(shape=self.num_bins)
        self.batch_mode = batch_mode
self.units = None

def update(self, new_val):
units = None
if isinstance(new_val, pq.Quantity):
units = new_val.units
new_val = new_val.magnitude
if self.last_spike_time is None: # for first batch
            if self.batch_mode:
new_isi = isi(new_val)
self.last_spike_time = new_val[-1]
else:
new_isi = np.array([])
self.last_spike_time = new_val
self.units = units
        else:  # for the second and subsequent batches
if units != self.units:
raise ValueError(msg_same_units)
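            # bridge batches: prepend the last spike of the previous batch
            # so the interval spanning the batch boundary is also counted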
            if self.batch_mode:
new_isi = isi(np.append(self.last_spike_time, new_val))
self.last_spike_time = new_val[-1]
else:
new_isi = np.array([new_val - self.last_spike_time])
self.last_spike_time = new_val
isi_hist, _ = np.histogram(new_isi, bins=self.bin_edges)
self.current_isi_histogram += isi_hist

def as_units(self, val):
if self.units is None:
return val
return pq.Quantity(val, units=self.units, copy=False)

def get_isi(self):
return self.as_units(deepcopy(self.current_isi_histogram))

def reset(self):
self.last_spike_time = None
self.units = None
self.current_isi_histogram = np.zeros(shape=self.num_bins)


class CovarianceOnline(object):
def __init__(self, batch_mode=False):
self.batch_mode = batch_mode
self.var_x = VarianceOnline(batch_mode=batch_mode)
self.var_y = VarianceOnline(batch_mode=batch_mode)
self.units = None
self.covariance_sum = 0.
self.count = 0

def update(self, new_val_pair):
units = None
if isinstance(new_val_pair, pq.Quantity):
units = new_val_pair.units
new_val_pair = new_val_pair.magnitude
if self.count == 0:
self.var_x.mean = 0.
self.var_y.mean = 0.
self.covariance_sum = 0.
self.units = units
elif units != self.units:
raise ValueError(msg_same_units)
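        # self.covariance_sum accumulates the co-moment
        # C = sum((x - mean_x) * (y - mean_y)); cov = C / count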
if self.batch_mode:
self.var_x.update(new_val_pair[0])
self.var_y.update(new_val_pair[1])
delta_var_x = new_val_pair[0] - self.var_x.mean
delta_var_y = new_val_pair[1] - self.var_y.mean
delta_covar = delta_var_x * delta_var_y
batch_size = len(new_val_pair[0])
self.count += batch_size
delta_covar = delta_covar.sum(axis=0)
self.covariance_sum += delta_covar
else:
delta_var_x = new_val_pair[0] - self.var_x.mean
delta_var_y = new_val_pair[1] - self.var_y.mean
delta_covar = delta_var_x * delta_var_y
self.var_x.update(new_val_pair[0])
self.var_y.update(new_val_pair[1])
self.count += 1
self.covariance_sum += \
((self.count - 1) / self.count) * delta_covar

def get_cov(self, unbiased=False):
if self.var_x.mean is None and self.var_y.mean is None:
return None
if self.count > 1:
count = self.count - 1 if unbiased else self.count
cov = self.covariance_sum / count
else:
cov = 0.
return cov

def reset(self):
self.var_x.reset()
self.var_y.reset()
self.units = None
self.covariance_sum = 0.
self.count = 0


class PearsonCorrelationCoefficientOnline(object):
def __init__(self, batch_mode=False):
self.batch_mode = batch_mode
self.covariance_xy = CovarianceOnline(batch_mode=batch_mode)
self.units = None
self.R_xy = 0.
self.count = 0

def update(self, new_val_pair):
units = None
if isinstance(new_val_pair, pq.Quantity):
units = new_val_pair.units
new_val_pair = new_val_pair.magnitude
if self.count == 0:
            self.covariance_xy.var_x.mean = 0.
            self.covariance_xy.var_y.mean = 0.
self.units = units
elif units != self.units:
raise ValueError(msg_same_units)
self.covariance_xy.update(new_val_pair)
if self.batch_mode:
batch_size = len(new_val_pair[0])
self.count += batch_size
else:
self.count += 1
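        # r = C_xy / sqrt(M2_x * M2_y): the 1/count normalizations of the
        # covariance and the two variances cancel, so raw sums suffice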
if self.count > 1:
self.R_xy = np.divide(
self.covariance_xy.covariance_sum,
(np.sqrt(self.covariance_xy.var_x.variance_sum *
self.covariance_xy.var_y.variance_sum)))

def get_pcc(self):
if self.count == 0:
return None
elif self.count == 1:
return 0.
else:
return self.R_xy

def reset(self):
self.count = 0
self.units = None
self.R_xy = 0.
self.covariance_xy.reset()
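
A minimal usage sketch of the streaming estimators above (an illustration, not part of the diff; it feeds synthetic data in batches and assumes only the classes defined in elephant/online.py):

import numpy as np
from elephant.online import VarianceOnline

rng = np.random.default_rng(0)
chunks = rng.normal(loc=2., scale=3., size=(10, 1000))  # 10 batches

online = VarianceOnline(batch_mode=True)
for chunk in chunks:
    online.update(chunk)  # one batch at a time, O(1) memory
mean, std = online.get_mean_std(unbiased=False)

# the streaming result matches the all-at-once computation
assert np.isclose(mean, chunks.mean())
assert np.isclose(std, chunks.std())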
35 changes: 19 additions & 16 deletions elephant/signal_processing.py
@@ -25,9 +25,8 @@
import quantities as pq
import scipy.signal

-from elephant.utils import deprecated_alias, check_same_units
-
-import warnings
+from elephant.online import VarianceOnline
+from elephant.utils import deprecated_alias, check_neo_consistency

__all__ = [
"zscore",
@@ -67,7 +66,7 @@ def zscore(signal, inplace=True):
Signals for which to calculate the z-score.
inplace : bool, optional
If True, the contents of the input `signal` is replaced by the
-        z-transformed signal, if possible, i.e when the signal type is float.
+        z-transformed signal, if possible, i.e. when the signal type is float.
If the signal type is not float, an error is raised.
If False, a copy of the original `signal` is returned.
Default: True
@@ -156,18 +155,19 @@
# Transform input to a list
if isinstance(signal, neo.AnalogSignal):
signal = [signal]
-    check_same_units(signal, object_type=neo.AnalogSignal)
+    check_neo_consistency(signal, object_type=neo.AnalogSignal)

-    # Calculate mean and standard deviation
-    signal_stacked = np.vstack(signal).magnitude
-    mean = signal_stacked.mean(axis=0)
-    std = signal_stacked.std(axis=0)
+    # Calculate mean and standard deviation vectors
+    online = VarianceOnline(batch_mode=True)
+    for sig in signal:
+        online.update(sig.magnitude)
+    mean, std = online.get_mean_std(unbiased=False)

signal_ztransformed = []
for sig in signal:
# Perform inplace operation only if array is of dtype float.
# Otherwise, raise an error.
-        if inplace and not np.issubdtype(np.float, sig.dtype):
+        if inplace and not np.issubdtype(float, sig.dtype):
raise ValueError(f"Cannot perform inplace operation as the "
f"signal dtype is not float. Source: {sig.name}")

@@ -294,6 +294,9 @@ def cross_correlation_function(signal, channel_pairs, hilbert_envelope=False,

If `scaleopt` is not one of the predefined above keywords.

+    .. bibliography::
+        :keyprefix: signal-

Examples
--------
.. plot::
@@ -339,9 +342,8 @@
"indices. Cannot define pairs for cross-correlation.")
if not isinstance(hilbert_envelope, bool):
raise ValueError("'hilbert_envelope' must be a boolean value")
-    if n_lags is not None:
-        if not isinstance(n_lags, int) or n_lags <= 0:
-            raise ValueError('n_lags must be a non-negative integer')
+    if n_lags is not None and (not isinstance(n_lags, int) or n_lags <= 0):
+        raise ValueError('n_lags must be a positive integer')

# z-score analog signal and store channel time series in different arrays
# Cross-correlation will be calculated between xsig and ysig
@@ -581,7 +583,7 @@ def wavelet_transform(signal, frequency, n_cycles=6.0, sampling_frequency=1.0,
Parameters
----------
signal : (Nt, Nch) neo.AnalogSignal or np.ndarray or list
-        Time series data to be wavelet-transformed. When multi-dimensional
+        Time series data to be wavelet-transformed. When multidimensional
`np.ndarray` or list is given, the time axis must be the last
dimension. If `neo.AnalogSignal`, `Nt` is the number of time points
and `Nch` is the number of channels.
@@ -673,7 +675,7 @@ def _morlet_wavelet_ft(freq, n_cycles, fs, n):
# in Le van Quyen et al. J Neurosci Meth 111:83-98 (2001).
sigma = n_cycles / (6. * freq)
freqs = np.fft.fftfreq(n, 1.0 / fs)
-    heaviside = np.array(freqs > 0., dtype=np.float)
+    heaviside = np.array(freqs > 0., dtype=float)
ft_real = np.sqrt(2 * np.pi * freq) * sigma * np.exp(
-2 * (np.pi * sigma * (freqs - freq)) ** 2) * heaviside * fs
ft_imag = np.zeros_like(ft_real)
@@ -717,7 +719,7 @@ def _morlet_wavelet_ft(freq, n_cycles, fs, n):
n = n_orig

# generate Morlet wavelets (in the frequency domain)
-    wavelet_fts = np.empty([len(freqs), n], dtype=np.complex)
+    wavelet_fts = np.empty([len(freqs), n], dtype=complex)
for i, f in enumerate(freqs):
wavelet_fts[i] = _morlet_wavelet_ft(f, n_cycles, sampling_frequency, n)

@@ -935,6 +937,7 @@ def rauc(signal, baseline=None, bin_duration=None, t_start=None, t_stop=None):
raise ValueError('Input signal is not a neo.AnalogSignal!')

if baseline is None:
+        # do nothing
pass
elif baseline == 'mean':
# subtract mean from each channel
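
A quick check of the reworked zscore path (a sketch, not part of the diff; neo, quantities and synthetic data are used purely for illustration):

import neo
import numpy as np
import quantities as pq
from elephant.signal_processing import zscore

rng = np.random.default_rng(0)
signal = neo.AnalogSignal(rng.normal(5., 2., size=(1000, 4)),
                          units='mV', sampling_rate=1 * pq.kHz)
z = zscore(signal, inplace=False)
# every channel of the z-transformed signal is zero-mean with unit variance
assert np.allclose(z.magnitude.mean(axis=0), 0.)
assert np.allclose(z.magnitude.std(axis=0), 1.)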
15 changes: 11 additions & 4 deletions elephant/spike_train_correlation.py
@@ -379,7 +379,8 @@ def covariance(binned_spiketrain, binary=False, fast=True):


@deprecated_alias(binned_sts='binned_spiketrain')
-def correlation_coefficient(binned_spiketrain, binary=False, fast=True):
+def correlation_coefficient(binned_spiketrain, binary=False, zero_diag=False,
+                            fast=True):
r"""
Calculate the NxN matrix of pairwise Pearson's correlation coefficients
between all combinations of N binned spike trains.
@@ -418,6 +419,9 @@ def correlation_coefficient(binned_spiketrain, binary=False, fast=True):
are counted as 1, resulting in binary binned vectors :math:`b_i`. If
False, the binned vectors :math:`b_i` contain the spike counts per bin.
Default: False
+    zero_diag : bool, optional
+        If True, zero out the diagonal of the correlation matrix.
+        Default: False
fast : bool, optional
If `fast=True` and the sparsity of `binned_spiketrain` is `> 0.1`, use
`np.corrcoef()`. Otherwise, use memory efficient implementation.
@@ -481,10 +485,13 @@

if fast and binned_spiketrain.sparsity > _SPARSITY_MEMORY_EFFICIENT_THR:
array = binned_spiketrain.to_array()
-        return np.corrcoef(array)
+        corr_mat = np.corrcoef(array)
+    else:
+        corr_mat = _covariance_sparse(binned_spiketrain, corrcoef_norm=True)

-    return _covariance_sparse(
-        binned_spiketrain, corrcoef_norm=True)
+    if zero_diag:
+        np.fill_diagonal(corr_mat, 0)
+    return corr_mat


def corrcoef(*args, **kwargs):
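
A short sketch of the new zero_diag option (illustrative only; it assumes this branch's correlation_coefficient together with the existing BinnedSpikeTrain from elephant.conversion):

import neo
import numpy as np
import quantities as pq
from elephant.conversion import BinnedSpikeTrain
from elephant.spike_train_correlation import correlation_coefficient

rng = np.random.default_rng(0)
spiketrains = [neo.SpikeTrain(np.sort(rng.uniform(0, 10, 30)) * pq.s,
                              t_stop=10 * pq.s) for _ in range(3)]
binned = BinnedSpikeTrain(spiketrains, bin_size=100 * pq.ms)
corr = correlation_coefficient(binned, zero_diag=True)
# the trivial self-correlations (1 by definition) are zeroed out
assert np.all(np.diag(corr) == 0)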