From 6a969153d3e5bb0e6d86959882b35faa9cc93121 Mon Sep 17 00:00:00 2001 From: nbara <10333715+nbara@users.noreply.github.com> Date: Tue, 10 Nov 2020 11:10:32 +0100 Subject: [PATCH 1/7] [FIX][ENH] Add regularization option for ASR --- meegkit/asr.py | 63 +++++++++++++++++++++--------------- meegkit/utils/asr.py | 19 +++++------ meegkit/utils/covariances.py | 13 +++++--- tests/test_asr.py | 45 ++++++++++++++++++-------- 4 files changed, 88 insertions(+), 52 deletions(-) diff --git a/meegkit/asr.py b/meegkit/asr.py index f2a6c0d9..86a524f3 100755 --- a/meegkit/asr.py +++ b/meegkit/asr.py @@ -2,11 +2,10 @@ import logging import numpy as np - from scipy import linalg, signal from statsmodels.robust.scale import mad -from .utils import nonlinear_eigenspace, block_covariance +from .utils import block_covariance, nonlinear_eigenspace from .utils.asr import (block_geometric_median, fit_eeg_distribution, yulewalk, yulewalk_filter) @@ -64,6 +63,9 @@ class ASR(): ASR [2]_. memory : float Memory size (s), regulates the number of covariance matrices to store. + estimator : str in {'scm', 'lwf', 'oas', 'mcd'} + Covariance estimator (default: 'scm' which computes the sample + covariance). Use 'lwf' if you need regularization (requires pyriemann). 
Attributes ---------- @@ -102,7 +104,7 @@ class ASR(): def __init__(self, sfreq=250, cutoff=5, blocksize=10, win_len=0.5, win_overlap=0.66, max_dropout_fraction=0.1, min_clean_fraction=0.25, name='asrfilter', method='euclid', - **kwargs): + estimator='scm', **kwargs): if pyriemann is None and method == 'riemann': logging.warning('Need pyriemann to use riemannian ASR flavor.') @@ -118,6 +120,7 @@ def __init__(self, sfreq=250, cutoff=5, blocksize=10, win_len=0.5, self.method = method self.memory = 1 * sfreq # smoothing window for covariances self.sfreq = sfreq + self.estimator = estimator # Initialise yulewalk-filter coefficients with sensible defaults F = np.array([0, 2, 3, 13, 16, 40, np.minimum( @@ -186,7 +189,8 @@ def fit(self, X, y=None, **kwargs): win_overlap=self.win_overlap, max_dropout_fraction=self.max_dropout_fraction, min_clean_fraction=self.min_clean_fraction, - method=self.method) + method=self.method, + estimator=self.estimator) self.state_ = dict(M=M, T=T, R=None) self._fitted = True @@ -212,17 +216,23 @@ def transform(self, X, y=None, **kwargs): out = self.transform(X[0]) return out[None, ...] else: - return X - - # Yulewalk-filtered data - X_filt, self.zi_ = yulewalk_filter( - X, sfreq=self.sfreq, ab=self.ab_, zi=self.zi_) + outs = [self.transform(x) for x in X] + return np.stack(outs, 0) + else: + # Yulewalk-filtered data + X_filt, self.zi_ = yulewalk_filter( + X, sfreq=self.sfreq, ab=self.ab_, zi=self.zi_) if not self._fitted: logging.warning('ASR is not fitted ! 
Returning unfiltered data.') return X - cov = 1 / X.shape[-1] * X_filt @ X_filt.T + if self.estimator == 'scm': + cov = 1 / X.shape[-1] * X_filt @ X_filt.T + else: + cov = pyriemann.estimation.covariances(X_filt[None, ...], + self.estimator)[0] + self._counter.append(X.shape[-1]) self.cov_.append(cov) @@ -409,9 +419,9 @@ def clean_windows(X, sfreq, max_bad_chans=0.2, zthresholds=[-3.5, 5], return clean, sample_mask -def asr_calibrate(X, sfreq, cutoff=5, blocksize=10, win_len=0.5, +def asr_calibrate(X, sfreq, cutoff=5, blocksize=100, win_len=0.5, win_overlap=0.66, max_dropout_fraction=0.1, - min_clean_fraction=0.25, method='euclid'): + min_clean_fraction=0.25, method='euclid', estimator='scm'): """Calibration function for the Artifact Subspace Reconstruction method. The input to this data is a multi-channel time series of calibration data. @@ -455,8 +465,8 @@ def asr_calibrate(X, sfreq, cutoff=5, blocksize=10, win_len=0.5, blocksize : int Block size for calculating the robust data covariance and thresholds, in samples; allows to reduce the memory and time requirements of the - robust estimators by this factor (down to Channels x Channels x Samples - x 16 / Blocksize bytes) (default=10). + robust estimators by this factor (down to n_chans x n_chans x n_samples + x 16 / blocksize bytes) (default=100). win_len : float Window length that is used to check the data for artifact content. This is ideally as long as the expected time scale of the artifacts but @@ -490,23 +500,18 @@ def asr_calibrate(X, sfreq, cutoff=5, blocksize=10, win_len=0.5, # window length for calculating thresholds N = int(np.round(win_len * sfreq)) + U = block_covariance(X, window=blocksize, overlap=win_overlap, + estimator=estimator) if method == 'euclid': - U = np.zeros((blocksize, nc, nc)) - for k in range(blocksize): - rangevect = np.minimum(ns - 1, np.arange(k, ns + k, blocksize)) - x = X[:, rangevect] - U[k, ...] 
= x @ x.T Uavg = block_geometric_median(U.reshape((-1, nc * nc)) / blocksize, 2) Uavg = Uavg.reshape((nc, nc)) - elif method == 'riemann': - blocksize = int(ns // blocksize) - U = block_covariance(X, window=blocksize, overlap=win_overlap) + else: # method == 'riemann' Uavg = pyriemann.utils.mean.mean_covariance(U, metric='riemann') # get the mixing matrix M M = linalg.sqrtm(np.real(Uavg)) D, Vtmp = linalg.eig(M) - # D, Vtmp = nonlinear_eigenspace(M, nc) + # D, Vtmp = nonlinear_eigenspace(M, nc) TODO V = Vtmp[:, np.argsort(D)] # get the threshold matrix T @@ -573,11 +578,17 @@ def asr_process(X, X_filt, state, cov=None, detrend=False, method='riemann', if cov is None: if detrend: X_filt = signal.detrend(X_filt, axis=1, type='constant') - cov = np.cov(X_filt, bias=True) - else: - if cov.ndim == 3: + cov = block_covariance(X_filt, window=nc ** 2) + + cov = cov.squeeze() + if cov.ndim == 3: + if method == 'riemann': cov = pyriemann.utils.mean.mean_covariance( cov, metric='riemann', sample_weight=sample_weight) + else: + bs = nc ** 2 + cov = block_geometric_median(cov.reshape((-1, nc * nc)) / bs, bs) + cov = cov.reshape((nc, nc)) maxdims = int(np.fix(0.66 * nc)) # constant TODO make param diff --git a/meegkit/utils/asr.py b/meegkit/utils/asr.py index f93498af..a9e06266 100755 --- a/meegkit/utils/asr.py +++ b/meegkit/utils/asr.py @@ -1,10 +1,10 @@ """Utils for ASR functions.""" import numpy as np -from scipy.special import gamma, gammaincinv from numpy import linalg from numpy.matlib import repmat from scipy import signal from scipy.linalg import toeplitz +from scipy.special import gamma, gammaincinv def fit_eeg_distribution(X, min_clean_fraction=0.25, max_dropout_fraction=0.1, @@ -355,9 +355,9 @@ def block_geometric_median(X, blocksize, tol=1e-5, max_iter=500): """ if (blocksize > 1): - o, v = X.shape # #observations & #variables - r = np.mod(o, blocksize) # #rest in last block - b = int((o - r) / blocksize) # #blocks + o, v = X.shape # observations & variables + r = 
np.mod(o, blocksize) # rest in last block + b = int((o - r) / blocksize) # blocks Xreshape = np.zeros((b + 1, v)) if (r > 0): Xreshape[0:b, :] = np.reshape( @@ -385,23 +385,24 @@ def geometric_median(X, tol, y, max_iter): Parameters ---------- - X : the data, as in mean + X : array, shape=() + The data. tol : tolerance (default=1.e-5) y : initial value (default=median(X)) max_iter : max number of iterations (default=500) Returns ------- - g : geometric median over X + g : array, shape=() + Geometric median over X. """ for i in range(max_iter): invnorms = 1 / np.sqrt( np.sum((X - repmat(y, X.shape[0], 1))**2, axis=1)) oldy = y - y = np.sum(X * np.transpose( - repmat(invnorms, X.shape[1], 1)), axis=0 - ) / np.sum(invnorms) + y = np.sum(X * np.transpose(repmat(invnorms, X.shape[1], 1)), axis=0) + y /= np.sum(invnorms) if ((linalg.norm(y - oldy) / linalg.norm(y)) < tol): break diff --git a/meegkit/utils/covariances.py b/meegkit/utils/covariances.py index 30295be4..e3ae3bd0 100644 --- a/meegkit/utils/covariances.py +++ b/meegkit/utils/covariances.py @@ -17,19 +17,24 @@ def block_covariance(data, window=128, overlap=0.5, padding=True, Parameters ---------- - data : array, shape=(n_channels, n_samples) + data : array, shape=(n_chans, n_samples) Input data (must be 2D) window : int Window size. overlap : float Overlap between successive windows. + Returns + ------- + cov : array, shape=(n_blocks, n_chans, n_chans) + Block covariance. 
+ """ from pyriemann.utils.covariance import _check_est assert 0 <= overlap < 1, "overlap must be < 1" est = _check_est(estimator) - X = [] + cov = [] n_chans, n_samples = data.shape if padding: # pad data with zeros pad = np.zeros((n_chans, int(window / 2))) @@ -38,10 +43,10 @@ def block_covariance(data, window=128, overlap=0.5, padding=True, jump = int(window * overlap) ix = 0 while (ix + window < n_samples): - X.append(est(data[:, ix:ix + window])) + cov.append(est(data[:, ix:ix + window])) ix = ix + jump - return np.array(X) + return np.array(cov) def cov_lags(X, Y, shifts=None): diff --git a/tests/test_asr.py b/tests/test_asr.py index 8a0ac114..31d83717 100644 --- a/tests/test_asr.py +++ b/tests/test_asr.py @@ -140,18 +140,18 @@ def test_asr_functions(show=False, method='riemann'): if show: f, ax = plt.subplots(8, sharex=True, figsize=(8, 5)) for i in range(8): - ax[i].fill_between(train_idx / sfreq, 0, 1, color='grey', alpha=.3, + ax[i].fill_between(train_idx, 0, 1, color='grey', alpha=.3, transform=ax[i].get_xaxis_transform(), label='calibration window') - ax[i].fill_between(train_idx / sfreq, 0, 1, where=sample_mask.flat, + ax[i].fill_between(train_idx, 0, 1, where=sample_mask.flat, transform=ax[i].get_xaxis_transform(), facecolor='none', hatch='...', edgecolor='k', label='selected window') - ax[i].plot(raw.times, raw._data[i], lw=.5, label='before ASR') - ax[i].plot(raw.times, clean[i], label='after ASR', lw=.5) + ax[i].plot(raw[i], lw=.5, label='before ASR') + ax[i].plot(clean[i], label='after ASR', lw=.5) # ax[i].set_xlim([10, 50]) ax[i].set_ylim([-50, 50]) - ax[i].set_ylabel(raw.ch_names[i]) + # ax[i].set_ylabel(raw.ch_names[i]) if i < 7: ax[i].set_yticks([]) ax[i].set_xlabel('Time (s)') @@ -162,17 +162,37 @@ def test_asr_functions(show=False, method='riemann'): plt.show() -def test_asr_class(show=False): +@pytest.mark.parametrize(argnames='method', argvalues=('riemann', 'euclid')) +@pytest.mark.parametrize(argnames='reref', argvalues=(False, True)) 
+def test_asr_class(method, reref, show=False): """Test ASR class (simulate online use).""" from meegkit.utils.matrix import sliding_window - asr = ASR(method='riemann') - # Train on a clean portion of data train_idx = np.arange(5 * sfreq, 45 * sfreq, dtype=int) - asr.fit(raw[:, train_idx]) - X = sliding_window(raw, window=int(sfreq), step=int(sfreq)) + # Rereference + if reref: + raw2 = raw - np.nanmean(raw, axis=0, keepdims=True) + else: + raw2 = raw + + # Rank deficient matrix + if reref: + if method == 'riemann': + with pytest.raises(ValueError, match='Add regularization'): + asr = ASR(method=method, estimator='scm') + asr.fit(raw2[:, train_idx]) + + asr = ASR(method=method, estimator='lwf') + asr.fit(raw2[:, train_idx]) + else: + asr = ASR(method=method, estimator='scm') + asr.fit(raw2[:, train_idx]) + else: + asr = ASR(method=method, estimator='scm') + + X = sliding_window(raw2, window=int(sfreq), step=int(sfreq)) Y = np.zeros_like(X) for i in range(X.shape[1]): Y[:, i, :] = asr.transform(X[:, i, :]) @@ -186,7 +206,7 @@ def test_asr_class(show=False): ax[i].plot(times, X[i], lw=.5, label='before ASR') ax[i].plot(times, Y[i], label='after ASR', lw=.5) ax[i].set_ylim([-50, 50]) - ax[i].set_ylabel(raw.ch_names[i]) + # ax[i].set_ylabel(raw.ch_names[i]) if i < 7: ax[i].set_yticks([]) ax[i].set_xlabel('Time (s)') @@ -198,9 +218,8 @@ def test_asr_class(show=False): if __name__ == "__main__": - import pytest pytest.main([__file__]) # test_yulewalk(250, True) # test_asr_functions(True) - # test_asr_class(True) + # test_asr_class('riemann', True, True) # test_yulewalk_filter(16, True) From 81a73af870741e80cd6c4cc0a5ea272fe6df5620 Mon Sep 17 00:00:00 2001 From: nbara <10333715+nbara@users.noreply.github.com> Date: Tue, 10 Nov 2020 19:22:05 +0100 Subject: [PATCH 2/7] cleanup messy code --- meegkit/utils/asr.py | 125 +++++++++++++------------------------------ 1 file changed, 36 insertions(+), 89 deletions(-) diff --git a/meegkit/utils/asr.py b/meegkit/utils/asr.py index 
a9e06266..2ec2347f 100755 --- a/meegkit/utils/asr.py +++ b/meegkit/utils/asr.py @@ -77,7 +77,7 @@ def fit_eeg_distribution(X, min_clean_fraction=0.25, max_dropout_fraction=0.1, X = np.sort(X) n = len(X) - # calc z bounds for the truncated standard generalized Gaussian pdf and + # compute z bounds for the truncated standard generalized Gaussian pdf and # pdf rescaler quants = np.array(fit_quantiles) zbounds = [] @@ -96,24 +96,27 @@ def fit_eeg_distribution(X, min_clean_fraction=0.25, max_dropout_fraction=0.1, # minimum width of the fit interval, as fraction of data min_width = min_clean_fraction * max_width - rowval = np.array( - np.round(n * np.arange(lower_min, lower_min + - max_dropout_fraction + (step_sizes[0] * 1e-9), - step_sizes[0]))) - colval = np.array(np.arange(0, int(np.round(n * max_width)))) - newX = [] - for iX in range(len(colval)): - newX.append(X[np.int_(iX + rowval)]) - - X1 = newX[0] - newX = newX - repmat(X1, len(colval), 1) + # Build quantile interval matrix + rowval = np.arange(lower_min, + lower_min + max_dropout_fraction + step_sizes[0] * 1e-9, + step_sizes[0]) + rowval = np.round(n * rowval).astype(int) + colval = np.arange(0, int(np.round(n * max_width))) + newX = np.zeros((len(colval), len(rowval))) + for i, c in enumerate(range(len(colval))): + newX[i] = X[c + rowval] + + # subtract baseline value for each interval + X1 = newX[0, :] + newX = newX - X1 opt_val = np.inf - for m in (np.round(n * np.arange(max_width, min_width, -step_sizes[1]))): - mcurr = int(m - 1) + gridsearch = np.round(n * np.arange(max_width, min_width, -step_sizes[1])) + for m in gridsearch.astype(int): + mcurr = m - 1 nbins = int(np.round(3 * np.log2(1 + m / 2))) - rowval = np.array(nbins / newX[mcurr]) - H = newX[0:int(m)] * repmat(rowval, int(m), 1) + rowval = nbins / newX[mcurr] + H = newX[0:m] * repmat(rowval, m, 1) hist_all = [] for ih in range(len(rowval)): @@ -124,29 +127,23 @@ def fit_eeg_distribution(X, min_clean_fraction=0.25, max_dropout_fraction=0.1, logq 
= np.log(hist_all + 0.01) # for each shape value... - for b in range(len(shape_range)): - bounds = zbounds[b] - x = bounds[0] + (np.arange(0.5, nbins + 0.5) / - nbins * np.diff(bounds)) - p = np.exp(-np.abs(x)**shape_range[b]) * rescale[b] + for k, b in enumerate(shape_range): + bounds = zbounds[k] + x = bounds[0] + np.arange(0.5, nbins + 0.5) / nbins * np.diff(bounds) # noqa:E501 + p = np.exp(-np.abs(x) ** b) * rescale[k] p = p / np.sum(p) # calc KL divergences - kl = np.sum( - np.transpose(repmat(p, logq.shape[1], 1)) * - (np.transpose(repmat(np.log(p), logq.shape[1], 1)) - - logq[:-1, :]), - axis=0) + np.log(m) + kl = np.sum(p * (np.log(p) - logq[:-1, :].T), axis=1) + np.log(m) # update optimal parameters min_val = np.min(kl) idx = np.argmin(kl) - - if (min_val < opt_val): + if min_val < opt_val: opt_val = min_val - opt_beta = shape_range[b] + opt_beta = shape_range[k] opt_bounds = bounds - opt_lu = [X1[idx], (X1[idx] + newX[int(m - 1), idx])] + opt_lu = [X1[idx], X1[idx] + newX[m - 1, idx]] # recover distribution parameters at optimum alpha = (opt_lu[1] - opt_lu[0]) / np.diff(opt_bounds) @@ -385,24 +382,24 @@ def geometric_median(X, tol, y, max_iter): Parameters ---------- - X : array, shape=() + X : array, shape=(n_observations, n_variables) The data. tol : tolerance (default=1.e-5) - y : initial value (default=median(X)) - max_iter : max number of iterations (default=500) + y : array, shape=(n_variables) + Initial value (default=median(X)). + max_iter : int + Max number of iterations (default=500): Returns ------- - g : array, shape=() + g : array, shape=(n_variables,) Geometric median over X. """ for i in range(max_iter): - invnorms = 1 / np.sqrt( - np.sum((X - repmat(y, X.shape[0], 1))**2, axis=1)) - oldy = y - y = np.sum(X * np.transpose(repmat(invnorms, X.shape[1], 1)), axis=0) - y /= np.sum(invnorms) + invnorms = 1. 
/ np.sqrt(np.sum((X - y[None, :]) ** 2, axis=1)) + oldy = y.copy() + y = np.sum(X * invnorms[:, None], axis=0) / np.sum(invnorms) if ((linalg.norm(y - oldy) / linalg.norm(y)) < tol): break @@ -410,56 +407,6 @@ def geometric_median(X, tol, y, max_iter): return y -def moving_average(N, X, Zi): - """Moving-average filter along the second dimension of the data. - - Parameters - ---------- - N : filter length in samples - X : data matrix [#Channels x #Samples] - Zi : initial filter conditions (default=[]) - - Returns - ------- - X : the filtered data - Zf : final filter conditions - - Christian Kothe, Swartz Center for Computational Neuroscience, UCSD - 2012-01-10 - - """ - [C, S] = X.shape - - if Zi is None: - Zi = np.zeros((C, N)) - - # pre-pend initial state & get dimensions - Y = np.concatenate((Zi, X), axis=1) - [CC, M] = Y.shape - - # get alternating index vector (for additions & subtractions) - idx = np.vstack((np.arange(0, M - N), np.arange(N, M))) - - # get sign vector (also alternating, and includes the scaling) - S = np.vstack((- np.ones((1, M - N)), np.ones((1, M - N)))) / N - - # run moving average - YS = np.zeros((C, S.shape[1] * 2)) - for i in range(C): - YS[i, :] = Y[i, idx.flatten(order='F')] * S.flatten(order='F') - - X = np.cumsum(YS, axis=1) - # read out result - X = X[:, 1::2] - - Zf = np.transpose( - np.vstack((-((X[:, -1] * N) - Y[:, -N])), - np.transpose(Y[:, -N + 1:])) - ) - - return X, Zf - - def polystab(a): """Polynomial stabilization. 
From b260b3495e1f37d3899475dfa969f47f9f8c49e3 Mon Sep 17 00:00:00 2001 From: nbara <10333715+nbara@users.noreply.github.com> Date: Tue, 10 Nov 2020 22:22:13 +0100 Subject: [PATCH 3/7] more cleanup + fix complex values --- meegkit/asr.py | 33 +++++----- meegkit/utils/asr.py | 142 ++++++++++++++++++------------------------- tests/conftest.py | 9 +++ tests/test_asr.py | 81 +++++++++++++++--------- tests/test_cca.py | 10 +-- 5 files changed, 146 insertions(+), 129 deletions(-) create mode 100644 tests/conftest.py diff --git a/meegkit/asr.py b/meegkit/asr.py index 86a524f3..d32d0adc 100755 --- a/meegkit/asr.py +++ b/meegkit/asr.py @@ -6,7 +6,7 @@ from statsmodels.robust.scale import mad from .utils import block_covariance, nonlinear_eigenspace -from .utils.asr import (block_geometric_median, fit_eeg_distribution, yulewalk, +from .utils.asr import (geometric_median, fit_eeg_distribution, yulewalk, yulewalk_filter) try: @@ -101,7 +101,7 @@ class ASR(): """ - def __init__(self, sfreq=250, cutoff=5, blocksize=10, win_len=0.5, + def __init__(self, sfreq=250, cutoff=5, blocksize=100, win_len=0.5, win_overlap=0.66, max_dropout_fraction=0.1, min_clean_fraction=0.25, name='asrfilter', method='euclid', estimator='scm', **kwargs): @@ -122,9 +122,14 @@ def __init__(self, sfreq=250, cutoff=5, blocksize=10, win_len=0.5, self.sfreq = sfreq self.estimator = estimator + self.reset() + + def reset(self): + """Reset filter.""" # Initialise yulewalk-filter coefficients with sensible defaults - F = np.array([0, 2, 3, 13, 16, 40, np.minimum( - 80.0, (sfreq / 2.0) - 1.0), sfreq / 2.0]) * 2.0 / sfreq + F = np.array([0, 2, 3, 13, 16, 40, + np.minimum(80.0, (self.sfreq / 2.0) - 1.0), + self.sfreq / 2.0]) * 2.0 / self.sfreq M = np.array([3, 0.75, 0.33, 0.33, 1, 1, 3, 3]) B, A = yulewalk(8, F, M) self.ab_ = (A, B) @@ -134,10 +139,6 @@ def __init__(self, sfreq=250, cutoff=5, blocksize=10, win_len=0.5, self._counter = [] self._fitted = False - def _reset(self): - """Reset filter.""" - return - def 
fit(self, X, y=None, **kwargs): """Calibration for the Artifact Subspace Reconstruction method. @@ -217,7 +218,7 @@ def transform(self, X, y=None, **kwargs): return out[None, ...] else: outs = [self.transform(x) for x in X] - return np.stack(outs, 0) + return np.stack(outs, axis=0) else: # Yulewalk-filtered data X_filt, self.zi_ = yulewalk_filter( @@ -233,6 +234,9 @@ def transform(self, X, y=None, **kwargs): cov = pyriemann.estimation.covariances(X_filt[None, ...], self.estimator)[0] + if np.sum(np.isnan(cov).flatten()) > 0: + print('ho') + self._counter.append(X.shape[-1]) self.cov_.append(cov) @@ -503,14 +507,14 @@ def asr_calibrate(X, sfreq, cutoff=5, blocksize=100, win_len=0.5, U = block_covariance(X, window=blocksize, overlap=win_overlap, estimator=estimator) if method == 'euclid': - Uavg = block_geometric_median(U.reshape((-1, nc * nc)) / blocksize, 2) + Uavg = geometric_median(U.reshape((-1, nc * nc))) Uavg = Uavg.reshape((nc, nc)) else: # method == 'riemann' Uavg = pyriemann.utils.mean.mean_covariance(U, metric='riemann') # get the mixing matrix M M = linalg.sqrtm(np.real(Uavg)) - D, Vtmp = linalg.eig(M) + D, Vtmp = linalg.eigh(M) # D, Vtmp = nonlinear_eigenspace(M, nc) TODO V = Vtmp[:, np.argsort(D)] @@ -586,8 +590,7 @@ def asr_process(X, X_filt, state, cov=None, detrend=False, method='riemann', cov = pyriemann.utils.mean.mean_covariance( cov, metric='riemann', sample_weight=sample_weight) else: - bs = nc ** 2 - cov = block_geometric_median(cov.reshape((-1, nc * nc)) / bs, bs) + cov = geometric_median(cov.reshape((-1, nc * nc))) cov = cov.reshape((nc, nc)) maxdims = int(np.fix(0.66 * nc)) # constant TODO make param @@ -596,7 +599,7 @@ def asr_process(X, X_filt, state, cov=None, detrend=False, method='riemann', if method == 'riemann': D, Vtmp = nonlinear_eigenspace(cov, nc) # TODO else: - D, Vtmp = np.linalg.eig(cov) + D, Vtmp = linalg.eigh(cov) V = np.real(Vtmp[:, np.argsort(D)]) D = np.real(D[np.argsort(D)]) @@ -613,7 +616,7 @@ def asr_process(X, X_filt, 
state, cov=None, detrend=False, method='riemann', else: VT = np.dot(V.T, M) demux = VT * keep[:, None] - R = np.dot(np.dot(M, np.linalg.pinv(demux)), V.T) + R = np.dot(np.dot(M, linalg.pinv(demux)), V.T) if state['R'] is not None: # apply the reconstruction to intermediate samples (using raised-cosine diff --git a/meegkit/utils/asr.py b/meegkit/utils/asr.py index 2ec2347f..1fd3c06a 100755 --- a/meegkit/utils/asr.py +++ b/meegkit/utils/asr.py @@ -1,9 +1,9 @@ """Utils for ASR functions.""" import numpy as np from numpy import linalg -from numpy.matlib import repmat from scipy import signal from scipy.linalg import toeplitz +from scipy.spatial.distance import cdist, euclidean from scipy.special import gamma, gammaincinv @@ -97,33 +97,37 @@ def fit_eeg_distribution(X, min_clean_fraction=0.25, max_dropout_fraction=0.1, min_width = min_clean_fraction * max_width # Build quantile interval matrix - rowval = np.arange(lower_min, - lower_min + max_dropout_fraction + step_sizes[0] * 1e-9, - step_sizes[0]) - rowval = np.round(n * rowval).astype(int) - colval = np.arange(0, int(np.round(n * max_width))) - newX = np.zeros((len(colval), len(rowval))) - for i, c in enumerate(range(len(colval))): - newX[i] = X[c + rowval] + cols = np.arange(lower_min, + lower_min + max_dropout_fraction + step_sizes[0] * 1e-9, + step_sizes[0]) + cols = np.round(n * cols).astype(int) + rows = np.arange(0, int(np.round(n * max_width))) + newX = np.zeros((len(rows), len(cols))) + for i, c in enumerate(range(len(rows))): + newX[i] = X[c + cols] # subtract baseline value for each interval X1 = newX[0, :] newX = newX - X1 opt_val = np.inf + opt_val = np.inf + opt_lu = np.inf + opt_bounds = np.inf + opt_beta = np.inf gridsearch = np.round(n * np.arange(max_width, min_width, -step_sizes[1])) for m in gridsearch.astype(int): mcurr = m - 1 nbins = int(np.round(3 * np.log2(1 + m / 2))) - rowval = nbins / newX[mcurr] - H = newX[0:m] * repmat(rowval, m, 1) + cols = nbins / newX[mcurr] + H = newX[:m] * cols 
hist_all = [] - for ih in range(len(rowval)): + for ih in range(len(cols)): histcurr = np.histogram(H[:, ih], bins=np.arange(0, nbins + 1)) hist_all.append(histcurr[0]) hist_all = np.array(hist_all, dtype=int).T - hist_all = np.vstack((hist_all, np.zeros(len(rowval), dtype=int))) + hist_all = np.vstack((hist_all, np.zeros(len(cols), dtype=int))) logq = np.log(hist_all + 0.01) # for each shape value... @@ -151,7 +155,7 @@ def fit_eeg_distribution(X, min_clean_fraction=0.25, max_dropout_fraction=0.1, beta = opt_beta # calculate the distribution's standard deviation from alpha and beta - sig = np.sqrt((alpha**2) * gamma(3 / beta) / gamma(1 / beta)) + sig = np.sqrt((alpha ** 2) * gamma(3 / beta) / gamma(1 / beta)) return mu, sig, alpha, beta @@ -321,90 +325,64 @@ def yulewalk_filter(X, sfreq, zi=None, ab=None, axis=-1): return out, zf -def block_geometric_median(X, blocksize, tol=1e-5, max_iter=500): - """Calculate a blockwise geometric median. +def geometric_median(X, tol=1e-5, max_iter=500): + """Geometric median. - This is faster and less memory-intensive than the regular geom_median - function. This statistic is not robust to artifacts that persist over a - duration that is significantly shorter than the blocksize. - - Parameters - ---------- - X : array, shape=(observations, variables) - The data. - blocksize : int - The number of successive samples over which a regular mean should be - taken. - tol : float - Tolerance (default=1e-5) - max_iter : int - Max number of iterations (default=500). - - Returns - ------- - g : array, - Geometric median over X. - - Notes - ----- - This function is noticeably faster if the length of the data is divisible - by the block size. Uses the GPU if available. 
- - """ - if (blocksize > 1): - o, v = X.shape # observations & variables - r = np.mod(o, blocksize) # rest in last block - b = int((o - r) / blocksize) # blocks - Xreshape = np.zeros((b + 1, v)) - if (r > 0): - Xreshape[0:b, :] = np.reshape( - np.sum(np.reshape(X[0:(o - r), :], - (blocksize, b * v)), axis=0), - (b, v)) - Xreshape[b, :] = np.sum( - X[(o - r + 1):o, :], axis=0) * (blocksize / r) - else: - Xreshape = np.reshape( - np.sum(np.reshape(X, (blocksize, b * v)), axis=0), (b, v)) - X = Xreshape - - y = np.median(X, axis=0) - y = geometric_median(X, tol, y, max_iter) / blocksize - - return y - - -def geometric_median(X, tol, y, max_iter): - """Calculate the geometric median for a set of observations. - - This is using Weiszfeld's algorithm (mean under a Laplacian noise - distribution) + This code is adapted from [2]_ using the Vardi and Zhang algorithm + described in [1]_. Parameters ---------- X : array, shape=(n_observations, n_variables) The data. - tol : tolerance (default=1.e-5) - y : array, shape=(n_variables) - Initial value (default=median(X)). + tol : float + Tolerance (default=1.e-5) max_iter : int Max number of iterations (default=500): Returns ------- - g : array, shape=(n_variables,) + y1 : array, shape=(n_variables,) Geometric median over X. + References + ---------- + .. [1] Vardi, Y., & Zhang, C. H. (2000). The multivariate L1-median and + associated data depth. Proceedings of the National Academy of Sciences, + 97(4), 1423-1426. https://doi.org/10.1073/pnas.97.4.1423 + .. [2] https://stackoverflow.com/questions/30299267/ """ - for i in range(max_iter): - invnorms = 1. / np.sqrt(np.sum((X - y[None, :]) ** 2, axis=1)) - oldy = y.copy() - y = np.sum(X * invnorms[:, None], axis=0) / np.sum(invnorms) + y = np.mean(X, 0) # initial value + + i = 0 + while i < max_iter: + D = cdist(X, [y]) + nonzeros = (D != 0)[:, 0] + + Dinv = 1. 
/ D[nonzeros] + Dinvs = np.sum(Dinv) + W = Dinv / Dinvs + T = np.sum(W * X[nonzeros], 0) + + num_zeros = len(X) - np.sum(nonzeros) + if num_zeros == 0: + y1 = T + elif num_zeros == len(X): + return y + else: + R = (T - y) * Dinvs + r = np.linalg.norm(R) + rinv = 0 if r == 0 else num_zeros / r + y1 = max(0, 1 - rinv) * T + min(1, rinv) * y - if ((linalg.norm(y - oldy) / linalg.norm(y)) < tol): - break + if euclidean(y, y1) < tol: + return y1 - return y + y = y1 + i += 1 + else: + print(f"Geometric median could converge in {i} iterations " + f"with a tolerance of {tol}") def polystab(a): diff --git a/tests/conftest.py b/tests/conftest.py new file mode 100644 index 00000000..e9548083 --- /dev/null +++ b/tests/conftest.py @@ -0,0 +1,9 @@ +import pytest +import numpy as np +import random as rand + + +@pytest.fixture +def random(): + rand.seed(9) + np.random.seed(9) diff --git a/tests/test_asr.py b/tests/test_asr.py index 31d83717..87c25ba9 100644 --- a/tests/test_asr.py +++ b/tests/test_asr.py @@ -2,14 +2,15 @@ import os import matplotlib.pyplot as plt -# import mne import numpy as np import pytest - from meegkit.asr import ASR, asr_calibrate, asr_process, clean_windows from meegkit.utils.asr import yulewalk, yulewalk_filter +from meegkit.utils.matrix import sliding_window from scipy import signal +np.random.seed(9) + # Data files THIS_FOLDER = os.path.dirname(os.path.abspath(__file__)) # file = os.path.join(THIS_FOLDER, 'data', 'eeg_raw.fif') @@ -19,8 +20,6 @@ # raw.crop(0, 60) # keep 60s only # raw.pick_types(eeg=True, misc=False) # raw = raw._data -raw = np.load(os.path.join(THIS_FOLDER, 'data', 'eeg_raw.npy')) -sfreq = 250 @pytest.mark.parametrize(argnames='sfreq', argvalues=(250, 256, 2048)) @@ -93,15 +92,16 @@ def test_yulewalk(sfreq, show=False): @pytest.mark.parametrize(argnames='n_chans', argvalues=(4, 8, 12)) def test_yulewalk_filter(n_chans, show=False): """Test yulewalk filter.""" - rawp = raw.copy() - n_chan_orig = rawp.shape[0] - rawp = 
np.random.randn(n_chans, n_chan_orig) @ rawp - raw_filt, iirstate = yulewalk_filter(rawp, sfreq) + raw = np.load(os.path.join(THIS_FOLDER, 'data', 'eeg_raw.npy')) + sfreq = 250 + n_chan_orig = raw.shape[0] + raw = np.random.randn(n_chans, n_chan_orig) @ raw + raw_filt, iirstate = yulewalk_filter(raw, sfreq) if show: f, ax = plt.subplots(n_chans, sharex=True, figsize=(8, 5)) for i in range(n_chans): - ax[i].plot(rawp[i], lw=.5, label='before') + ax[i].plot(raw[i], lw=.5, label='before') ax[i].plot(raw_filt[i], label='after', lw=.5) ax[i].set_ylim([-50, 50]) if i < n_chans - 1: @@ -122,6 +122,8 @@ def test_asr_functions(show=False, method='riemann'): estimated only once and not updated online as is intended. """ + raw = np.load(os.path.join(THIS_FOLDER, 'data', 'eeg_raw.npy')) + sfreq = 250 raw_filt = raw.copy() raw_filt, iirstate = yulewalk_filter(raw_filt, sfreq) @@ -166,8 +168,8 @@ def test_asr_functions(show=False, method='riemann'): @pytest.mark.parametrize(argnames='reref', argvalues=(False, True)) def test_asr_class(method, reref, show=False): """Test ASR class (simulate online use).""" - from meegkit.utils.matrix import sliding_window - + raw = np.load(os.path.join(THIS_FOLDER, 'data', 'eeg_raw.npy')) + sfreq = 250 # Train on a clean portion of data train_idx = np.arange(5 * sfreq, 45 * sfreq, dtype=int) @@ -175,30 +177,38 @@ def test_asr_class(method, reref, show=False): if reref: raw2 = raw - np.nanmean(raw, axis=0, keepdims=True) else: - raw2 = raw + raw2 = raw.copy() # Rank deficient matrix if reref: if method == 'riemann': with pytest.raises(ValueError, match='Add regularization'): - asr = ASR(method=method, estimator='scm') - asr.fit(raw2[:, train_idx]) - - asr = ASR(method=method, estimator='lwf') - asr.fit(raw2[:, train_idx]) - else: - asr = ASR(method=method, estimator='scm') - asr.fit(raw2[:, train_idx]) + blah = ASR(method=method, estimator='scm') + blah.fit(raw2[:, train_idx]) + + asr = ASR(method=method, estimator='lwf') + asr.fit(raw2[:, 
train_idx]) else: asr = ASR(method=method, estimator='scm') + asr.fit(raw2[:, train_idx]) - X = sliding_window(raw2, window=int(sfreq), step=int(sfreq)) + # Split into small windows + X = sliding_window(raw2, window=int(sfreq // 2), step=int(sfreq // 2)) + X = X.swapaxes(0, 1) + + # Transform each trial Y = np.zeros_like(X) - for i in range(X.shape[1]): - Y[:, i, :] = asr.transform(X[:, i, :]) + for i in range(X.shape[0]): + Y[i] = asr.transform(X[i]) + + # Transform all trials at once + asr.reset() + asr.fit(raw2[:, train_idx]) + Y2 = asr.transform(X) - X = X.reshape(8, -1) - Y = Y.reshape(8, -1) + X = X.swapaxes(0, 1).reshape(8, -1) + Y = Y.swapaxes(0, 1).reshape(8, -1) + Y2 = Y2.swapaxes(0, 1).reshape(8, -1) times = np.arange(X.shape[-1]) / sfreq if show: f, ax = plt.subplots(8, sharex=True, figsize=(8, 5)) @@ -206,7 +216,7 @@ def test_asr_class(method, reref, show=False): ax[i].plot(times, X[i], lw=.5, label='before ASR') ax[i].plot(times, Y[i], label='after ASR', lw=.5) ax[i].set_ylim([-50, 50]) - # ax[i].set_ylabel(raw.ch_names[i]) + ax[i].set_ylabel(f'ch{i}') if i < 7: ax[i].set_yticks([]) ax[i].set_xlabel('Time (s)') @@ -214,12 +224,27 @@ def test_asr_class(method, reref, show=False): borderaxespad=0) plt.subplots_adjust(hspace=0, right=0.75) plt.suptitle('Before/after ASR') + + f, ax = plt.subplots(8, sharex=True, figsize=(8, 5)) + for i in range(8): + ax[i].plot(times, Y[i], label='incremental', lw=.5) + ax[i].plot(times, Y2[i], label='bulk', lw=.5) + ax[i].plot(times, Y[i] - Y2[i], label='difference', lw=.5) + if i < 7: + ax[i].set_yticks([]) + ax[i].set_xlabel('Time (s)') + plt.suptitle('incremental vs. 
bulk difference ') plt.show() + # TODO: investigate difference + # np.testing.assert_almost_equal(Y, Y2, decimal=4) + # assert np.all(np.abs(Y - Y2) < 1), np.max(np.abs(Y - Y2)) # < 1uV diff + assert np.all(np.isreal(Y)), "output should be real-valued" + assert np.all(np.isreal(Y2)), "output should be real-valued" if __name__ == "__main__": - pytest.main([__file__]) + # pytest.main([__file__]) # test_yulewalk(250, True) # test_asr_functions(True) - # test_asr_class('riemann', True, True) + test_asr_class(method='riemann', reref=False, show=False) # test_yulewalk_filter(16, True) diff --git a/tests/test_cca.py b/tests/test_cca.py index 0bcb85b0..159eceea 100644 --- a/tests/test_cca.py +++ b/tests/test_cca.py @@ -219,6 +219,8 @@ def test_cca_crossvalidate_shifts2(): def test_mcca(show=False): """Test multiway CCA.""" + np.random.seed(9) + # We create 3 uncorrelated data sets. There should be no common structure # between them. @@ -251,7 +253,7 @@ def test_mcca(show=False): ax.plot(np.mean(z ** 2, axis=0), ':o') ax.set_ylabel('Power') ax.set_xlabel('CC') - plt.tight_layout(True) + plt.tight_layout() plt.show() # assert np.diag_indices @@ -286,7 +288,7 @@ def test_mcca(show=False): ax.plot(np.mean(z ** 2, axis=0), ':o') ax.set_ylabel('Power') ax.set_xlabel('CC') - plt.tight_layout(True) + plt.tight_layout() plt.show() # Third example @@ -322,12 +324,12 @@ def test_mcca(show=False): ax.plot(np.mean(z ** 2, axis=0), ':o') ax.set_ylabel('Power') ax.set_xlabel('CC') - plt.tight_layout(True) + plt.tight_layout() plt.show() # Only first 10 components should be non-negligible diagonal = np.diag(x.T @ x @ A) ** 2 - assert np.all(diagonal[:10] > 1) + assert np.all(diagonal[:10] > 1), diagonal[:10] assert np.all(diagonal[10:] < .01) if __name__ == '__main__': From 4a448a944bc3e324ee3b1e197d23860b7a9b2548 Mon Sep 17 00:00:00 2001 From: nbara <10333715+nbara@users.noreply.github.com> Date: Wed, 11 Nov 2020 00:09:12 +0100 Subject: [PATCH 4/7] make asr appear in codecov? 
--- .github/workflows/pythonpackage.yml | 4 ++-- meegkit/asr.py | 2 -- 2 files changed, 2 insertions(+), 4 deletions(-) diff --git a/.github/workflows/pythonpackage.yml b/.github/workflows/pythonpackage.yml index 4cbdb3e3..ac2713d4 100644 --- a/.github/workflows/pythonpackage.yml +++ b/.github/workflows/pythonpackage.yml @@ -2,7 +2,7 @@ name: unit-tests on: push: - branches: + branches: - master pull_request: branches: @@ -35,7 +35,7 @@ jobs: make pep - name: Test with pytest run: | - pytest --cov=meegkit --cov-report=xml tests/ + pytest --cov=./ --cov-report=xml tests/ - name: Upload coverage to Codecov uses: codecov/codecov-action@v1 with: diff --git a/meegkit/asr.py b/meegkit/asr.py index d32d0adc..85ead2e0 100755 --- a/meegkit/asr.py +++ b/meegkit/asr.py @@ -14,8 +14,6 @@ except ImportError: pyriemann = None -__all__ = ['ASR', 'clean_windows', 'asr_calibrate', 'asr_process'] - class ASR(): """Artifact Subspace Reconstruction. From 761d443f3c47ad58ee7b66d721f8d5ed87468543 Mon Sep 17 00:00:00 2001 From: nbara <10333715+nbara@users.noreply.github.com> Date: Wed, 11 Nov 2020 10:55:12 +0100 Subject: [PATCH 5/7] test sfreq=125 --- tests/test_asr.py | 22 +++++++++++++++++++--- 1 file changed, 19 insertions(+), 3 deletions(-) diff --git a/tests/test_asr.py b/tests/test_asr.py index 87c25ba9..b7f56d22 100644 --- a/tests/test_asr.py +++ b/tests/test_asr.py @@ -22,11 +22,18 @@ # raw = raw._data -@pytest.mark.parametrize(argnames='sfreq', argvalues=(250, 256, 2048)) +@pytest.mark.parametrize(argnames='sfreq', argvalues=(125, 250, 256, 2048)) def test_yulewalk(sfreq, show=False): """Test that my version of yulewelk works just like MATLAB's.""" # Temp fix, values are computed in matlab using yulewalk.m - if sfreq == 256: + if sfreq == 125: + a = [1, -0.983952187817050, -0.520232502560362, 0.603540557711479, + 0.116893105621457, -0.0291261609247754, -0.282359853603720, + 0.0407847933579206, 0.103437108246108] + b = [1.08742316795540, -1.83643555381637, 0.573976014496824, + 
0.361020603610170, 0.0592714561864745, 0.0767631759850725, + -0.498304757808424, 0.276872948140515, -0.00693079202803615] + elif sfreq == 256: a = [1, -1.70080396393018, 1.92328303910588, -2.08269297269299, 1.59826387425574, -1.07358541839301, 0.567971922565269, -0.188618149976820, 0.0572954115997260] @@ -175,11 +182,11 @@ def test_asr_class(method, reref, show=False): # Rereference if reref: + # Rank deficient matrix raw2 = raw - np.nanmean(raw, axis=0, keepdims=True) else: raw2 = raw.copy() - # Rank deficient matrix if reref: if method == 'riemann': with pytest.raises(ValueError, match='Add regularization'): @@ -242,6 +249,15 @@ def test_asr_class(method, reref, show=False): assert np.all(np.isreal(Y)), "output should be real-valued" assert np.all(np.isreal(Y2)), "output should be real-valued" + # Test different sampling rates + with pytest.raises(ValueError): + ASR(sfreq=60) + + ASR(sfreq=80) + ASR(sfreq=100) + ASR(sfreq=125) + ASR(Sfreq=150) + if __name__ == "__main__": # pytest.main([__file__]) # test_yulewalk(250, True) From eb7c21b4f49b45b15b270adb168c79b2ad3dd219 Mon Sep 17 00:00:00 2001 From: nbara <10333715+nbara@users.noreply.github.com> Date: Wed, 11 Nov 2020 12:26:35 +0100 Subject: [PATCH 6/7] fix exponential covariance weights --- meegkit/asr.py | 19 +++++++++---------- 1 file changed, 9 insertions(+), 10 deletions(-) diff --git a/meegkit/asr.py b/meegkit/asr.py index 85ead2e0..343308eb 100755 --- a/meegkit/asr.py +++ b/meegkit/asr.py @@ -116,7 +116,8 @@ def __init__(self, sfreq=250, cutoff=5, blocksize=100, win_len=0.5, self.min_clean_fraction = min_clean_fraction self.max_bad_chans = 0.3 self.method = method - self.memory = 1 * sfreq # smoothing window for covariances + self.memory = int(2 * sfreq) # smoothing window for covariances + self.sample_weight = np.geomspace(0.05, 1, num=self.memory + 1) self.sfreq = sfreq self.estimator = estimator @@ -232,10 +233,7 @@ def transform(self, X, y=None, **kwargs): cov = 
pyriemann.estimation.covariances(X_filt[None, ...], self.estimator)[0] - if np.sum(np.isnan(cov).flatten()) > 0: - print('ho') - - self._counter.append(X.shape[-1]) + self._counter.append(X_filt.shape[-1]) self.cov_.append(cov) # Regulate the number of covariance matrices that are stored @@ -244,19 +242,20 @@ def transform(self, X, y=None, **kwargs): self.cov_.pop(0) self._counter.pop(0) else: - self._counter[0] = self.memory + self._counter = [self.memory, ] break - # Exponential covariance weight – the most recent covariance has a + # Exponential covariance weights – the most recent covariance has a # weight of 1, while the oldest one in memory has a weight of 5% - sample_weight = np.geomspace(0.05, 1, num=self.memory + 1) - sample_weight = sample_weight[self._counter] + weights = [1, ] + for c in np.cumsum(self._counter[1:]): + weights = [self.sample_weight[-c]] + weights # Clean data, using covariances weighted by sample_weight out, self.state_ = asr_process(X, X_filt, self.state_, cov=np.stack(self.cov_), method=self.method, - sample_weight=sample_weight) + sample_weight=weights) return out From 4bbc23d53d5b62afeee8343e733a7407d8cf53e4 Mon Sep 17 00:00:00 2001 From: nbara <10333715+nbara@users.noreply.github.com> Date: Thu, 12 Nov 2020 10:28:56 +0100 Subject: [PATCH 7/7] Update test_asr.py --- tests/test_asr.py | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/tests/test_asr.py b/tests/test_asr.py index b7f56d22..6320689b 100644 --- a/tests/test_asr.py +++ b/tests/test_asr.py @@ -243,9 +243,9 @@ def test_asr_class(method, reref, show=False): plt.suptitle('incremental vs. 
bulk difference ')
         plt.show()

-    # TODO: investigate difference
-    # np.testing.assert_almost_equal(Y, Y2, decimal=4)
-    # assert np.all(np.abs(Y - Y2) < 1), np.max(np.abs(Y - Y2))  # < 1uV diff
+    # TODO: the transform() process is stochastic, so Y and Y2 are not going to
+    # be entirely identical but close enough
+    assert np.all(np.abs(Y - Y2) < 5), np.max(np.abs(Y - Y2))  # < 5uV diff
     assert np.all(np.isreal(Y)), "output should be real-valued"
     assert np.all(np.isreal(Y2)), "output should be real-valued"

@@ -259,8 +259,8 @@ def test_asr_class(method, reref, show=False):
     ASR(Sfreq=150)

 if __name__ == "__main__":
-    # pytest.main([__file__])
+    pytest.main([__file__])
     # test_yulewalk(250, True)
     # test_asr_functions(True)
-    test_asr_class(method='riemann', reref=False, show=False)
+    # test_asr_class(method='riemann', reref=False, show=True)
     # test_yulewalk_filter(16, True)