mne-tools · larsoner · Feb 2, 2024 · Nov 11, 2023 · Nov 11, 2023 · Nov 13, 2023
@@ -819,9 +819,14 @@ def _reject_setup(self, reject, flat):
         # check for invalid values
         for rej, kind in zip((reject, flat), ("Rejection", "Flat")):
             for key, val in rej.items():
-                if val is None or val < 0:
+                if callable(val):
+                    continue
+                elif val is not None and val >= 0:
+                    continue
+                else:
                     raise ValueError(
-                        '%s value must be a number >= 0, not "%s"' % (kind, val)
+                        "%s value must be a number >= 0 or a valid function,"
+                        ' not "%s"' % (kind, val)
                     )
 
         # now check to see if our rejection and flat are getting more
@@ -834,33 +839,48 @@ def _reject_setup(self, reject, flat):
             "previous ones"
         )
 
+        # Skip the stringency check below if any value in reject, flat,
+        # old_reject, or old_flat is callable (callables cannot be compared)
+        is_callable = False
+        for rej in (reject, flat, old_reject, old_flat):
+            for key, val in rej.items():
+                if callable(val):
+                    is_callable = True
+
         # copy thresholds for channel types that were used previously, but not
         # passed this time
         for key in set(old_reject) - set(reject):
             reject[key] = old_reject[key]
-        # make sure new thresholds are at least as stringent as the old ones
-        for key in reject:
-            if key in old_reject and reject[key] > old_reject[key]:
-                raise ValueError(
-                    bad_msg.format(
-                        kind="reject",
-                        key=key,
-                        new=reject[key],
-                        old=old_reject[key],
-                        op=">",
+
+        if not is_callable:
+            # make sure new thresholds are at least as stringent
+            # as the old ones
+            for key in reject:
+                if key in old_reject and reject[key] > old_reject[key]:
+                    raise ValueError(
+                        bad_msg.format(
+                            kind="reject",
+                            key=key,
+                            new=reject[key],
+                            old=old_reject[key],
+                            op=">",
+                        )
                     )
-                )
 
-        # same for flat thresholds
-        for key in set(old_flat) - set(flat):
-            flat[key] = old_flat[key]
-        for key in flat:
-            if key in old_flat and flat[key] < old_flat[key]:
-                raise ValueError(
-                    bad_msg.format(
-                        kind="flat", key=key, new=flat[key], old=old_flat[key], op="<"
+            # same for flat thresholds
+            for key in set(old_flat) - set(flat):
+                flat[key] = old_flat[key]
+            for key in flat:
+                if key in old_flat and flat[key] < old_flat[key]:
+                    raise ValueError(
+                        bad_msg.format(
+                            kind="flat",
+                            key=key,
+                            new=flat[key],
+                            old=old_flat[key],
+                            op="<",
+                        )
                     )
-                )
 
         # after validation, set parameters
         self._bad_dropped = False
@@ -3621,25 +3641,35 @@ def _is_good(
 ):
     """Test if data segment e is good according to reject and flat.
 
+    The reject and flat dictionaries can accept functions as values.
+
     If full_report=True, it will give True/False as well as a list of all
     offending channels.
     """
     bad_tuple = tuple()
     has_printed = False
     checkable = np.ones(len(ch_names), dtype=bool)
     checkable[np.array([c in ignore_chs for c in ch_names], dtype=bool)] = False
+
     for refl, f, t in zip([reject, flat], [np.greater, np.less], ["", "flat"]):
         if refl is not None:
-            for key, thresh in refl.items():
+            for key, criterion in refl.items():
                 idx = channel_type_idx[key]
                 name = key.upper()
                 if len(idx) > 0:
                     e_idx = e[idx]
-                    deltas = np.max(e_idx, axis=1) - np.min(e_idx, axis=1)
                     checkable_idx = checkable[idx]
-                    idx_deltas = np.where(
-                        np.logical_and(f(deltas, thresh), checkable_idx)
-                    )[0]
+
+                    # Check if criterion is a function and apply it
+                    if callable(criterion):
+                        idx_deltas = np.where(
+                            np.logical_and(criterion(e_idx), checkable_idx)
+                        )[0]
+                    else:
+                        deltas = np.max(e_idx, axis=1) - np.min(e_idx, axis=1)
+                        idx_deltas = np.where(
+                            np.logical_and(f(deltas, criterion), checkable_idx)
+                        )[0]
 
                     if len(idx_deltas) > 0:
                         bad_names = [ch_names[idx[i]] for i in idx_deltas]

diff --git a/mne/tests/test_epochs.py b/mne/tests/test_epochs.py
@@ -2128,6 +2128,67 @@ def test_reject_epochs(tmp_path):
     assert epochs_cleaned.flat == dict(grad=new_flat["grad"], mag=flat["mag"])
 
 
+@testing.requires_testing_data
+def test_callable_reject():
+    """Test using a callable for rejection."""
+    raw = read_raw_fif(fname_raw_testing, preload=True)
+    raw.crop(0, 5)
+    raw.del_proj()
+    chans = raw.info["ch_names"][-6:-1]
+    raw.pick(chans)
+    data = raw.get_data()
+
+    # Add some artifacts
+    new_data = data
+    new_data[0, 180:200] *= 1e7
+    new_data[0, 610:880] += 1e-3
+    edit_raw = mne.io.RawArray(new_data, raw.info)
+
+    events = mne.make_fixed_length_events(edit_raw, id=1, duration=1.0, start=0)
+    epochs = mne.Epochs(edit_raw, events, tmin=0, tmax=1, baseline=None, preload=True)
+
+    assert len(epochs) == 5
+    epochs = mne.Epochs(
+        edit_raw,
+        events,
+        tmin=0,
+        tmax=1,
+        baseline=None,
+        reject=dict(
+            eeg=lambda x: True if (np.median(x, axis=1) > 1e-3).any() else False
+        ),
+        preload=True,
+    )
+    assert epochs.drop_log[2] != ()
+
+    epochs = mne.Epochs(
+        edit_raw,
+        events,
+        tmin=0,
+        tmax=1,
+        baseline=None,
+        reject=dict(eeg=lambda x: True if (np.max(x, axis=1) > 1).any() else False),
+        preload=True,
+    )
+    assert epochs.drop_log[0] != ()
+
+    def reject_criteria(x):
+        max_condition = np.max(x, axis=1) > 1e-2
+        median_condition = np.median(x, axis=1) > 1e-4
+        return True if max_condition.any() or median_condition.any() else False
+
+    epochs = mne.Epochs(
+        edit_raw,
+        events,
+        tmin=0,
+        tmax=1,
+        baseline=None,
+        reject=dict(eeg=reject_criteria),
+        preload=True,
+    )
+    assert epochs.drop_log[0] != () and epochs.drop_log[2] != ()
+
+
 def test_preload_epochs():
     """Test preload of epochs."""
     raw, events, picks = _get_data()

diff --git a/mne/utils/docs.py b/mne/utils/docs.py
@@ -1702,11 +1702,14 @@ def _reflow_param_docstring(docstring, has_first_line=True, width=75):
 """
 
 _flat_common = """\
-    Reject epochs based on **minimum** peak-to-peak signal amplitude (PTP).
-    Valid **keys** can be any channel type present in the object. The
-    **values** are floats that set the minimum acceptable PTP. If the PTP
-    is smaller than this threshold, the epoch will be dropped. If ``None``
-    then no rejection is performed based on flatness of the signal."""
+    Reject epochs based on **minimum** peak-to-peak signal amplitude (PTP)
+    or a custom function. Valid **keys** can be any channel type present
+    in the object. If using PTP, **values** are floats that set the minimum
+    acceptable PTP. If the PTP is smaller than this threshold, the epoch
+    will be dropped. If ``None`` then no rejection is performed based on
+    flatness of the signal. If a custom function is used then ``flat`` can be
+    used to reject epochs based on any criteria (including maxima and
+    minima)."""
 
 docdict[
     "flat"
@@ -3794,8 +3797,9 @@ def _reflow_param_docstring(docstring, has_first_line=True, width=75):
 )
 
 _reject_common = """\
-    Reject epochs based on **maximum** peak-to-peak signal amplitude (PTP),
-    i.e. the absolute difference between the lowest and the highest signal
+    Reject epochs based on **maximum** peak-to-peak signal amplitude (PTP)
+    or custom functions. Peak-to-peak signal amplitude is defined as
+    the absolute difference between the lowest and the highest signal
     value. In each individual epoch, the PTP is calculated for every channel.
     If the PTP of any one channel exceeds the rejection threshold, the
     respective epoch will be dropped.
@@ -3811,10 +3815,21 @@ def _reflow_param_docstring(docstring, has_first_line=True, width=75):
                       eog=250e-6      # unit: V (EOG channels)
                       )
 
-    .. note:: Since rejection is based on a signal **difference**
-              calculated for each channel separately, applying baseline
-              correction does not affect the rejection procedure, as the
-              difference will be preserved.
+    Custom rejection criteria can also be used by passing a callable
+    as a value in the dictionary.
+
+    Example::
+
+        reject = dict(eeg=lambda x: True if (np.max(x, axis=1) >
+                      1e-3).any() else False)
+
+    .. note:: If rejection is based on a signal **difference**
+            calculated for each channel separately, applying baseline
+            correction does not affect the rejection procedure, as the
+            difference will be preserved.
+
+    .. note:: If ``reject`` is a callable, then **any** criteria can be
+            used to reject epochs (including maxima and minima).
 """
 
 docdict[

@@ -23,6 +23,8 @@
 
 import os
 
+import numpy as np
+
 import mne
 
 sample_data_folder = mne.datasets.sample.data_path()
@@ -205,8 +207,8 @@
 # %%
 # .. _`tut-reject-epochs-section`:
 #
-# Rejecting Epochs based on channel amplitude
-# ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+# Rejecting Epochs based on peak-to-peak channel amplitude
+# ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
 #
 # Besides "bad" annotations, the :class:`mne.Epochs` class constructor has
 # another means of rejecting epochs, based on signal amplitude thresholds for
@@ -328,6 +330,99 @@
 epochs.drop_bad(reject=stronger_reject_criteria)
 print(epochs.drop_log)
 
+# %%
+# .. _`tut-reject-epochs-func-section`:
+#
+# Rejecting Epochs using callables (functions)
+# ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+# Sometimes it is useful to reject epochs based on criteria other than
+# peak-to-peak amplitudes. For example, we might want to reject epochs
+# based on the maximum or minimum amplitude of a channel.
+# In this case, the :class:`mne.Epochs` class constructor also accepts
+# callables (functions) in the ``reject`` and ``flat`` parameters. This
+# allows us to define functions to reject epochs based on our desired criteria.
+#
+# Let's begin by generating epoch data with large artifacts in one EEG channel
+# in order to demonstrate the versatility of this approach.
+
+raw.crop(0, 5)
+raw.del_proj()
+chans = raw.info["ch_names"][-5:-1]
+raw.pick(chans)
+data = raw.get_data()
+
+new_data = data
+new_data[0, 180:200] *= 1e3
+new_data[0, 460:580] += 1e-3
+edit_raw = mne.io.RawArray(new_data, raw.info)
+
+# Create fixed length epochs of 1 second
+events = mne.make_fixed_length_events(edit_raw, id=1, duration=1.0, start=0)
+epochs = mne.Epochs(edit_raw, events, tmin=0, tmax=1, baseline=None)
+epochs.plot(scalings=dict(eeg=50e-5))
+
+# %%
+# As you can see, we have two large artifacts in the first channel: one large
+# spike in amplitude and one large increase in amplitude.
+#
+# Let's try to reject the epoch containing the spike in amplitude based on the
+# maximum amplitude of the first channel.
+
+epochs = mne.Epochs(
+    edit_raw,
+    events,
+    tmin=0,
+    tmax=1,
+    baseline=None,
+    reject=dict(eeg=lambda x: True if (np.max(x, axis=1) > 1e-2).any() else False),
+    preload=True,
+)
+epochs.plot(scalings=dict(eeg=50e-5))
+
+# %%
+# Here, the epoch containing the spike in amplitude was rejected for having a
+# maximum amplitude greater than 1e-2 Volts. Notice the use of the ``any()``
+# method to check if any of the channels exceeded the threshold. We could
+# have also used the ``all()`` method to check if all channels exceeded the
+# threshold.
+#
+# Next, let's try to reject the epoch containing the increase in amplitude
+# using the median.
+
+epochs = mne.Epochs(
+    edit_raw,
+    events,
+    tmin=0,
+    tmax=1,
+    baseline=None,
+    reject=dict(eeg=lambda x: True if (np.median(x, axis=1) > 1e-4).any() else False),
+    preload=True,
+)
+epochs.plot(scalings=dict(eeg=50e-5))
+
+# %%
+# Finally, let's try to reject both epochs using a combination of the maximum
+# and median. We'll define a custom function and use boolean operators to
+# combine the two criteria.
+
+
+def reject_criteria(x):
+    max_condition = np.max(x, axis=1) > 1e-2
+    median_condition = np.median(x, axis=1) > 1e-4
+    return True if max_condition.any() or median_condition.any() else False
+
+
+epochs = mne.Epochs(
+    edit_raw,
+    events,
+    tmin=0,
+    tmax=1,
+    baseline=None,
+    reject=dict(eeg=reject_criteria),
+    preload=True,
+)
+epochs.plot(events=True)
+
 # %%
 # Note that a complementary Python module, the `autoreject package`_, uses
 # machine learning to find optimal rejection criteria, and is designed to