From 38d51c3358efb2d8f4d12fdb1a2e533ef31c08ae Mon Sep 17 00:00:00 2001
From: Miles Wells <k1o0@5tk.co>
Date: Mon, 11 Dec 2023 17:02:29 +0200
Subject: [PATCH 1/5] WIP

---
 ibllib/qc/mesoscope.py | 64 ++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 64 insertions(+)
 create mode 100644 ibllib/qc/mesoscope.py

diff --git a/ibllib/qc/mesoscope.py b/ibllib/qc/mesoscope.py
new file mode 100644
index 000000000..6193cbf23
--- /dev/null
+++ b/ibllib/qc/mesoscope.py
@@ -0,0 +1,64 @@
+"""Mesoscope quality control.
+
+This module runs a list of quality control metrics on the extracted imaging and cell detection
+data.
+"""
+import logging
+from inspect import getmembers, isfunction
+
+from . import base
+
+_log = logging.getLogger(__name__)
+
+
+class MesoscopeQC(base.QC):
+    """A class for computing camera QC metrics."""
+
+    def run(self, update: bool = False, **kwargs) -> (str, dict):
+        """
+        Run mesoscope QC checks and return outcome.
+
+        Parameters
+        ----------
+        update : bool
+            If true, updates the session QC fields on Alyx.
+
+        Returns
+        -------
+        str
+            The overall outcome.
+        dict
+            A map of checks and their outcomes.
+        """
+        _log.info(f'Computing QC outcome for session {self.eid}')
+
+        namespace = 'mesoscope'
+        if all(x is None for x in self.data.values()):
+            self.load_data(**kwargs)
+        if self.data['frame_samples'] is None or self.data['timestamps'] is None:
+            return 'NOT_SET', {}
+        if self.data['timestamps'].shape[0] == 0:
+            _log.error(f'No timestamps for {self.label} camera; setting outcome to CRITICAL')
+            return 'CRITICAL', {}
+
+        def is_metric(x):
+            return isfunction(x) and x.__name__.startswith('check_')
+
+        checks = getmembers(self.__class__, is_metric)
+        self.metrics = {f'_{namespace}_' + k[6:]: fn(self) for k, fn in checks}
+
+        values = [x if isinstance(x, str) else x[0] for x in self.metrics.values()]
+        code = max(base.CRITERIA[x] for x in values)
+        outcome = next(k for k, v in base.CRITERIA.items() if v == code)
+
+        if update:
+            extended = {
+                k: 'NOT_SET' if v is None else v
+                for k, v in self.metrics.items()
+            }
+            self.update_extended_qc(extended)
+            self.update(outcome, namespace)
+        return outcome, self.metrics
+
+    def check_data_lengths(self, **kwargs):
+        return 'NOT_SET'

From 839983a643c4e08da8bedcb8cceb48149a1bd724 Mon Sep 17 00:00:00 2001
From: Miles Wells <k1o0@5tk.co>
Date: Thu, 19 Dec 2024 15:14:58 +0200
Subject: [PATCH 2/5] ROI QC metrics

---
 ibllib/pipes/mesoscope_tasks.py |   2 +-
 ibllib/qc/mesoscope.py          | 121 ++++++++++++++++++++++++++++++++
 2 files changed, 122 insertions(+), 1 deletion(-)

diff --git a/ibllib/pipes/mesoscope_tasks.py b/ibllib/pipes/mesoscope_tasks.py
index 419cbc4fe..9bb0445d3 100644
--- a/ibllib/pipes/mesoscope_tasks.py
+++ b/ibllib/pipes/mesoscope_tasks.py
@@ -503,7 +503,7 @@ def _consolidate_exptQC(exptQC):
         qc_labels = ['ok']
         frame_qc = []
         for e in exptQC:
-            assert e.keys() >= set(['frameQC_names', 'frameQC_frames'])
+            assert e.keys() >= {'frameQC_names', 'frameQC_frames'}
             # Initialize an NaN array the same size of frameQC_frames to fill with new enum values
             frames = np.full(e['frameQC_frames'].shape, fill_value=np.nan)
             # May be numpy array of str or a single str, in both cases we cast to list of str
diff --git a/ibllib/qc/mesoscope.py b/ibllib/qc/mesoscope.py
index 6193cbf23..e140486d1 100644
--- a/ibllib/qc/mesoscope.py
+++ b/ibllib/qc/mesoscope.py
@@ -5,12 +5,129 @@
 """
 import logging
 from inspect import getmembers, isfunction
+import unittest
+from pathlib import Path
+
+import numpy as np
+import scipy.stats
 
 from . import base
 
 _log = logging.getLogger(__name__)
 
 
+def get_neural_quality_metrics(F, Fneu, badframes=None, iscell=None, F0_percentile=20, neuropil_factor=.7, **kwargs):
+    """Compute neural quality metrics based on raw fluorescence traces.
+
+    Parameters
+    ----------
+    F : numpy.array
+        Raw fluorescence trace (nTimepoints by nROIs), e.g. mpci.ROIActivityF.
+    Fneu : numpy.array
+        Raw neuropil trace (nTimepoints by nROIs), e.g. mpci.ROINeuropilActivityF.
+    badframes : numpy.array
+        Boolean array, true for frames that should be excluded (default = all false).
+    iscell : numpy.array
+        Boolean array with true for cells, and false for not cells (default = all true).
+    F0_percentile : int
+        Percentile to be used for computing baseline fluorescence F0 (default = 20).
+    neuropil_factor : float
+        Factor to multiply neuropil with to get neuropil-corrected trace (default = 0.7).
+        Must be between 0 and 1.
+    times : numpy.array
+        An array of frame times used to infer the frame rate, e.g. mpci.times.
+    frame_rate : float
+        The known frame rate of acquisition in Hz.  This value takes precedence when times
+        also passed in. If neither times nor frame_rate passed, defaults to 7 Hz.
+
+    Returns
+    -------
+    dict
+        A dictionary with the following keys:
+            noise_level: standardized shot noise level
+            mean: time-averaged raw fluorescence (proxy for overall brightness)
+            std: standard deviation of neuropil-corrected activity
+            skew: skewness of neuropil-corrected activity
+        Each averaged across the ROIs selected by iscell.
+    numpy.array
+        A structured numpy array with the fields noise_level, mean, std, and skew. One value
+        per ROI.
+    """
+    if 'frame_rate' in kwargs:
+        if (frame_rate := kwargs['frame_rate']) <= 0:
+            raise ValueError('frame_rate must be positive')
+        _log.info('Frame rate: %.2f Hz', frame_rate)
+    elif 'times' in kwargs:
+        frame_rate = 1 / np.median(np.diff(kwargs['times']))
+        _log.info('Inferred frame rate of %.2f Hz from frame times', frame_rate)
+    else:
+        frame_rate = 7
+        _log.warning('Assuming frame rate of %.2f Hz', frame_rate)
+    if badframes is None:
+        badframes = np.zeros(F.shape[0], dtype=bool)
+    elif not isinstance(badframes, np.array):
+        raise TypeError(f'expected `badframes` to by numpy array, got `{type(badframes)}` instead')
+    if iscell is None:
+        iscell = np.ones(F.shape[0], dtype=bool)
+    if neuropil_factor <= 0 or neuropil_factor > 1:
+        raise ValueError('neuropil_factor must be between zero and one')
+
+    # only take the good frames
+    F = F[~badframes, :]
+    Fneu = Fneu[~badframes, :]
+
+    # F_npc is neuropil corrected trace
+    F_npc = F - neuropil_factor * Fneu
+
+    # dFF is deltaF / F0 in %, i.e. baseline-normalized fluorescence trace
+    if F0_percentile is None:
+        dFF = F
+    else:
+        F0 = np.percentile(F, F0_percentile, axis=0)  # F0 is some percentile of full trace
+        F0_ = np.tile(F0, (F.shape[0], 1))
+        dFF = (F - F0_) / F0_ * 100
+
+    # compute noise level
+    noise_levels = np.nanmedian(np.abs(np.diff(dFF, axis=0)), axis=0) / np.sqrt(frame_rate)  # Rupprecht et al. 2021
+
+    # compute time-averaged raw fluorescence (proxy for overall brightness)
+    means = np.mean(F, axis=0)
+
+    # compute standard deviation of neuropil-corrected activity
+    stds = np.std(F_npc, axis=0, ddof=0)
+
+    # compute skewness of neuropil-corrected activity
+    skews = scipy.stats.skew(F_npc, axis=0, bias=True)
+
+    metrics = {'noise_level': noise_levels, 'mean': means, 'std': stds, 'skew': skews}
+
+    # return all the neural quality metrics in a struct
+    fov_metrics = np.rec.fromarrays(metrics.values(), dtype=np.dtype([(k, F.dtype) for k in metrics]))
+
+    # return all the FOV-wide mean quality metrics in a struct
+    neural_metrics = {k: np.nanmean(v[iscell]) for k, v in metrics.items()}
+    return neural_metrics, fov_metrics
+
+
+class TestQM(unittest.TestCase):
+    def setUp(self):
+        self.data_path = Path(r'E:\integration\mesoscope\SP037\2023-03-23\002\alf\suite2p\plane2')
+
+    def test_neural_qm(self):
+        F = np.load(self.data_path / 'F.npy').T
+        Fneu = np.load(self.data_path / 'Fneu.npy').T
+        iscell = np.load(self.data_path / 'iscell.npy')
+        neural_metrics, fov_metrics = get_neural_quality_metrics(F, Fneu, iscell=iscell[:, 0].astype(bool))
+        expected = {'noise_level', 'mean', 'std', 'skew'}
+        self.assertCountEqual(expected, neural_metrics)
+        np.testing.assert_approx_equal(neural_metrics['noise_level'], 3.8925, significant=5)
+        np.testing.assert_approx_equal(neural_metrics['mean'], 983.0024)
+        np.testing.assert_approx_equal(neural_metrics['std'], 120.6435)
+        np.testing.assert_approx_equal(neural_metrics['skew'], 1.0478, significant=5)
+        self.assertCountEqual(expected, fov_metrics.dtype.names)
+        self.assertTrue(all(fov_metrics[x].size == F.shape[1] for x in expected))
+
+
 class MesoscopeQC(base.QC):
     """A class for computing camera QC metrics."""
 
@@ -62,3 +179,7 @@ def is_metric(x):
 
     def check_data_lengths(self, **kwargs):
         return 'NOT_SET'
+
+
+if __name__ == '__main__':
+    unittest.main()

From 136f7cfae6dee54f59bb3613bf6768e08cc329b3 Mon Sep 17 00:00:00 2001
From: Miles Wells <k1o0@5tk.co>
Date: Tue, 18 Mar 2025 13:11:39 +0200
Subject: [PATCH 3/5] Boilerplate QC

---
 ibllib/qc/mesoscope.py | 99 +++++++++++++++++++++++++++++++++++++-----
 1 file changed, 88 insertions(+), 11 deletions(-)

diff --git a/ibllib/qc/mesoscope.py b/ibllib/qc/mesoscope.py
index e140486d1..a768ad282 100644
--- a/ibllib/qc/mesoscope.py
+++ b/ibllib/qc/mesoscope.py
@@ -10,6 +10,7 @@
 
 import numpy as np
 import scipy.stats
+from one.alf.spec import is_uuid
 
 from . import base
 
@@ -127,11 +128,27 @@ def test_neural_qm(self):
         self.assertCountEqual(expected, fov_metrics.dtype.names)
         self.assertTrue(all(fov_metrics[x].size == F.shape[1] for x in expected))
 
+    def test_qc_class(self):
+        ...
+
 
 class MesoscopeQC(base.QC):
-    """A class for computing camera QC metrics."""
+    """A class for computing mesoscope QC FOV metrics."""
+
+    def _confirm_endpoint_id(self, endpoint_id):
+        """Confirm the endpoint ID and set the name attribute.
 
-    def run(self, update: bool = False, **kwargs) -> (str, dict):
+        If the endpoint ID is a UUID, the name attribute is set to the name of the FOV from Alyx.
+        Otherwise the name attribute is set to the endpoint ID (assumed to be either FOV_XX or planeX).
+        """
+        if not is_uuid(endpoint_id, versions=(4,)):
+            self.log.debug('Offline mode; skipping endpoint_id check')
+            self.name = endpoint_id
+            return
+        super()._confirm_endpoint_id(endpoint_id)
+        self.name = self.one.alyx.rest('field-of-views', 'read', id=endpoint_id)['name']
+
+    def run(self, update: bool = False, **kwargs):
         """
         Run mesoscope QC checks and return outcome.
 
@@ -147,16 +164,11 @@ def run(self, update: bool = False, **kwargs) -> (str, dict):
         dict
             A map of checks and their outcomes.
         """
-        _log.info(f'Computing QC outcome for session {self.eid}')
+        _log.info(f'Computing QC outcome for FOV {self.eid}')
 
         namespace = 'mesoscope'
-        if all(x is None for x in self.data.values()):
+        if not getattr(self, 'data', {}):
             self.load_data(**kwargs)
-        if self.data['frame_samples'] is None or self.data['timestamps'] is None:
-            return 'NOT_SET', {}
-        if self.data['timestamps'].shape[0] == 0:
-            _log.error(f'No timestamps for {self.label} camera; setting outcome to CRITICAL')
-            return 'CRITICAL', {}
 
         def is_metric(x):
             return isfunction(x) and x.__name__.startswith('check_')
@@ -177,8 +189,73 @@ def is_metric(x):
             self.update(outcome, namespace)
         return outcome, self.metrics
 
-    def check_data_lengths(self, **kwargs):
-        return 'NOT_SET'
+    def load_data(self):
+        """Load the data required for QC checks."""
+        self.data = {}
+        if self.name.startswith('FOV_'):
+            # Load mpci objects
+            alf_path = self.session_path.joinpath('alf', self.eid)
+            self.data['F'] = np.load(alf_path.joinpath('mpci.ROIActivityF.npy')).T
+            self.data['Fneu'] = np.load(alf_path.joinpath('mpci.ROINeuropilActivityF.npy')).T
+            self.data['iscell'] = np.load(alf_path.joinpath('mpciROIs.mpciROITypes.npy'))
+            self.data['badframes'] = np.load(alf_path.joinpath('mpci.badFrames.npy'))
+            s2pdata = np.load(alf_path.joinpath('_suite2p_ROIData.raw.zip'), allow_pickle=True)  # lazy load from zip
+            self.data['ops'] = s2pdata['ops'].item()
+            self.data['times'] = np.load(alf_path.joinpath('mpci.times.npy'))
+        elif self.name.startswith('plane'):
+            # Load suite2p objects
+            alf_path = self.session_path.joinpath('suite2p', self.eid)
+            self.data['F'] = np.load(alf_path.joinpath('F.npy'))
+            self.data['Fneu'] = np.load(alf_path.joinpath('Fneu.npy'))
+            self.data['iscell'] = np.load(alf_path.joinpath('iscell.npy'))
+            self.data['badframes'] = np.load(alf_path.joinpath('mpci.badFrames.npy'))
+            self.data['ops'] = np.load(alf_path.joinpath('ops.npy'), allow_pickle=True).item()
+            self.data['times'] = None
+        else:
+            raise ValueError(f'Invalid session identifier: {self.eid}')
+
+    def check_neural_quality(self, **kwargs):
+        """Check the neural quality metrics."""
+        neural_metrics, fov_metrics = get_neural_quality_metrics(**self.data, **kwargs)
+        # TODO Apply thresholds
+        raise NotImplementedError
+
+    @staticmethod
+    def qc_session(eid, one=None, **kwargs):
+        """Run mesoscope QC checks on a session.
+
+        This instantiates a MesoscopeQC object and runs the checks for each FOV in the session.
+        It's not ideal to have one QC object per FOV - this could also be a single class that updates
+        both the session endpoint and the FOV endpoints.
+
+        The QC may be run on a local session before the suite2p outputs have been renamed to ALF format,
+        however to update the FOV endpoint, this relies on the MesoscopeFOV task having been run, and for the
+        data, the MesoscopePreprocess task.
+        """
+        session_qc = base.QC(eid, one=one)
+        one = session_qc.one
+        remote = session_qc.one and not session_qc.one.offline
+        if remote:
+            collections = session_qc.one.list_collections(eid, collection='alf/FOV_??')
+            collections = sorted(map(session_qc.session_path.joinpath, collections))
+            FOVs = one.alyx.rest('fields-of-view', 'list', session=session_qc.eid)
+            for collection in collections:
+                endpoint_id = next((x['id'] for x in FOVs if x['name'] == collection.name), None)
+                if not endpoint_id:
+                    _log.warning(f'No Alyx record for FOV {collection.name}')
+                    continue
+                qc = MesoscopeQC(endpoint_id, one=one, endpoint='fields-of-view')
+                qc.session_path = session_qc.session_path
+                outcomes, extended = qc.run(update=False)
+        else:
+            collections = sorted(session_qc.session_path.glob('alf/FOV_??'))
+            if not collections:
+                collections = sorted(session_qc.session_path.glob('suite2p/plane*'))
+            for collection in collections:
+                qc = MesoscopeQC(collection.name, one=one, endpoint='fields-of-view')
+                qc.session_path = session_qc.session_path
+                outcomes, extended = qc.run(update=False)
+                # TODO Log or store outcomes for each FOV
 
 
 if __name__ == '__main__':

From 6e2a22b5ccb95259f1b1c0e6a6e73ba3ae544c04 Mon Sep 17 00:00:00 2001
From: Mayo Faulkner <mayo.faulkner@ucl.ac.uk>
Date: Wed, 2 Apr 2025 16:40:24 +0100
Subject: [PATCH 4/5] mesoscope qc updates

---
 ibllib/pipes/dynamic_pipeline.py     |   3 +
 ibllib/pipes/mesoscope_tasks.py      |  44 +++++++
 ibllib/qc/mesoscope.py               | 179 ++++++++++++++++++++++++---
 ibllib/tests/qc/test_mesoscope_qc.py | 174 ++++++++++++++++++++++++++
 4 files changed, 383 insertions(+), 17 deletions(-)
 create mode 100644 ibllib/tests/qc/test_mesoscope_qc.py

diff --git a/ibllib/pipes/dynamic_pipeline.py b/ibllib/pipes/dynamic_pipeline.py
index a7f64e8e4..a17257247 100644
--- a/ibllib/pipes/dynamic_pipeline.py
+++ b/ibllib/pipes/dynamic_pipeline.py
@@ -586,6 +586,9 @@ def make_pipeline(session_path, **pkwargs):
             **kwargs, **mscope_kwargs, **sync_kwargs)
         tasks['MesoscopeCompress'] = type('MesoscopeCompress', (mscope_tasks.MesoscopeCompress,), {})(
             **kwargs, **mscope_kwargs, parents=[tasks['MesoscopePreprocess']])
+        # TODO update with relevant parent dependencies once QC finalised
+        tasks['MesoscopeQC'] = type('MesoscopeQC', (mscope_tasks.MesoscopeQC,), {})(
+            **kwargs, **mscope_kwargs, parents=[tasks['MesoscopePreprocess'], tasks['MesoscopeSync']])
 
     if 'neurophotometrics' in devices:
         # {'collection': 'raw_photometry_data', 'datetime': '2024-09-18T16:43:55.207000',
diff --git a/ibllib/pipes/mesoscope_tasks.py b/ibllib/pipes/mesoscope_tasks.py
index 9bb0445d3..be08e5336 100644
--- a/ibllib/pipes/mesoscope_tasks.py
+++ b/ibllib/pipes/mesoscope_tasks.py
@@ -40,6 +40,7 @@
 from ibllib.pipes import base_tasks
 from ibllib.oneibl.data_handlers import ExpectedDataset, dataset_from_name
 from ibllib.io.extractors import mesoscope
+import ibllib.qc.mesoscope as mesoQC
 
 
 _logger = logging.getLogger(__name__)
@@ -1372,6 +1373,49 @@ def project_mlapdv(self, meta, atlas=None):
         return mlapdv, location_id
 
 
+class MesoscopeQC(base_tasks.MesoscopeTask):
+    """Run the mesoscope QC checks on each FOV of a session and optionally update the dataset QC in Alyx."""
+
+    priority = 40
+    job_size = 'small'
+
+    @property
+    def signature(self):
+        signature = {
+            'input_files': [('mpci.ROIActivityF.npy', 'alf/FOV*', True),
+                            ('mpci.ROINeuropilActivityF.npy', 'alf/FOV*', True),
+                            ('mpci.ROIActivityDeconvolved.npy', 'alf/FOV*', True),
+                            ('mpci.badFrames.npy', 'alf/FOV*', True),
+                            ('mpci.mpciFrameQC.npy', 'alf/FOV*', True),
+                            ('mpciFrameQC.names.tsv', 'alf/FOV*', True),
+                            ('mpciMeanImage.images.npy', 'alf/FOV*', True),
+                            ('mpciROIs.stackPos.npy', 'alf/FOV*', True),
+                            ('mpciROIs.mpciROITypes.npy', 'alf/FOV*', True),
+                            ('mpciROIs.cellClassifier.npy', 'alf/FOV*', True),
+                            ('mpciROIs.uuids.csv', 'alf/FOV*', True),
+                            ('mpciROITypes.names.tsv', 'alf/FOV*', True),
+                            ('mpciROIs.masks.sparse_npz', 'alf/FOV*', True),
+                            ('mpciROIs.neuropilMasks.sparse_npz', 'alf/FOV*', True),
+                            ('mpci.times.npy', 'alf/FOV*', True),
+                            ('mpciStack.timeshift.npy', 'alf/FOV*', True)],
+            'output_files': []
+        }
+        return signature
+
+    def _run(self, **kwargs):
+        """Run the FOV QC; requires an online ONE instance. Pass update=False to skip the Alyx updates."""
+        assert self.eid
+        assert self.one and not self.one.offline
+
+        update = kwargs.pop('update', True)
+        outcome = mesoQC.MesoscopeQC.qc_session(self.eid, one=self.one, update=update, **kwargs)
+
+        if update:
+            mesoQC.update_dataset_qc_for_session(self.eid, outcome, [],
+                                                 self.one, override=False)
+        return []
+
+
 def surface_normal(triangle):
     """
     Calculate the surface normal unit vector of one or more triangles.
diff --git a/ibllib/qc/mesoscope.py b/ibllib/qc/mesoscope.py
index a768ad282..e4dcaf3f7 100644
--- a/ibllib/qc/mesoscope.py
+++ b/ibllib/qc/mesoscope.py
@@ -4,12 +4,15 @@
 data.
 """
 import logging
+from collections import defaultdict
 from inspect import getmembers, isfunction
 import unittest
-from pathlib import Path
+from pathlib import Path, PurePosixPath
+from functools import wraps
 
 import numpy as np
 import scipy.stats
+from one.alf import spec
 from one.alf.spec import is_uuid
 
 from . import base
@@ -66,7 +69,7 @@ def get_neural_quality_metrics(F, Fneu, badframes=None, iscell=None, F0_percenti
         _log.warning('Assuming frame rate of %.2f Hz', frame_rate)
     if badframes is None:
         badframes = np.zeros(F.shape[0], dtype=bool)
-    elif not isinstance(badframes, np.array):
+    elif not isinstance(badframes, np.ndarray):
         raise TypeError(f'expected `badframes` to by numpy array, got `{type(badframes)}` instead')
     if iscell is None:
         iscell = np.ones(F.shape[0], dtype=bool)
@@ -128,8 +131,21 @@ def test_neural_qm(self):
         self.assertCountEqual(expected, fov_metrics.dtype.names)
         self.assertTrue(all(fov_metrics[x].size == F.shape[1] for x in expected))
 
-    def test_qc_class(self):
-        ...
+
+def return_qc_datasets(datasets):
+    """
+    Decorator that allows a function to return a predefined list of dataset names
+    when the `only_dsets` keyword argument is set to True.
+    """
+    def decorator(func):
+        @wraps(func)
+        def wrapper(*args, **kwargs):
+            only_dsets = kwargs.pop('only_dsets', False)
+            if only_dsets:
+                return datasets
+            return func(*args, **kwargs)
+        return wrapper
+    return decorator
 
 
 class MesoscopeQC(base.QC):
@@ -139,11 +155,12 @@ def _confirm_endpoint_id(self, endpoint_id):
         """Confirm the endpoint ID and set the name attribute.
 
         If the endpoint ID is a UUID, the name attribute is set to the name of the FOV from Alyx.
-        Otherwise the name attribute is set to the endpoint ID (assumed to be either FOV_XX or planeX).
+        Otherwise, the name attribute is set to the endpoint ID (assumed to be either FOV_XX or planeX).
         """
         if not is_uuid(endpoint_id, versions=(4,)):
             self.log.debug('Offline mode; skipping endpoint_id check')
             self.name = endpoint_id
+            self.eid = None
             return
         super()._confirm_endpoint_id(endpoint_id)
         self.name = self.one.alyx.rest('field-of-views', 'read', id=endpoint_id)['name']
@@ -163,6 +180,8 @@ def run(self, update: bool = False, **kwargs):
             The overall outcome.
         dict
             A map of checks and their outcomes.
+        dict
+            A dict of datasets and their outcomes
         """
         _log.info(f'Computing QC outcome for FOV {self.eid}')
 
@@ -174,11 +193,21 @@ def is_metric(x):
             return isfunction(x) and x.__name__.startswith('check_')
 
         checks = getmembers(self.__class__, is_metric)
+
         self.metrics = {f'_{namespace}_' + k[6:]: fn(self) for k, fn in checks}
+        self.datasets = {f'_{namespace}_' + k[6:]: fn(self, only_dsets=True) for k, fn in checks}
 
-        values = [x if isinstance(x, str) else x[0] for x in self.metrics.values()]
-        code = max(base.CRITERIA[x] for x in values)
-        outcome = next(k for k, v in base.CRITERIA.items() if v == code)
+        values = [x if isinstance(x, spec.QC) else x[0] for x in self.metrics.values()]
+        outcome = self.overall_outcome(values)
+
+        # For each dataset get a list of qc values from relevant qc tests
+        datasets = defaultdict(list)
+        for check, dsets in self.datasets.items():
+            qc_val = self.metrics[check] if isinstance(self.metrics[check], spec.QC) else self.metrics[check][0]
+            for dset in dsets:
+                datasets[dset].append(qc_val)
+        # Compute the final qc for each dataset, takes the worst value
+        dataset_qc = {k: self.overall_outcome(v) for k, v in datasets.items()}
 
         if update:
             extended = {
@@ -187,16 +216,17 @@ def is_metric(x):
             }
             self.update_extended_qc(extended)
             self.update(outcome, namespace)
-        return outcome, self.metrics
+
+        return outcome, self.metrics, dataset_qc
 
     def load_data(self):
         """Load the data required for QC checks."""
         self.data = {}
         if self.name.startswith('FOV_'):
             # Load mpci objects
-            alf_path = self.session_path.joinpath('alf', self.eid)
-            self.data['F'] = np.load(alf_path.joinpath('mpci.ROIActivityF.npy')).T
-            self.data['Fneu'] = np.load(alf_path.joinpath('mpci.ROINeuropilActivityF.npy')).T
+            alf_path = self.session_path.joinpath('alf', self.name)
+            self.data['F'] = np.load(alf_path.joinpath('mpci.ROIActivityF.npy'))
+            self.data['Fneu'] = np.load(alf_path.joinpath('mpci.ROINeuropilActivityF.npy'))
             self.data['iscell'] = np.load(alf_path.joinpath('mpciROIs.mpciROITypes.npy'))
             self.data['badframes'] = np.load(alf_path.joinpath('mpci.badFrames.npy'))
             s2pdata = np.load(alf_path.joinpath('_suite2p_ROIData.raw.zip'), allow_pickle=True)  # lazy load from zip
@@ -204,7 +234,7 @@ def load_data(self):
             self.data['times'] = np.load(alf_path.joinpath('mpci.times.npy'))
         elif self.name.startswith('plane'):
             # Load suite2p objects
-            alf_path = self.session_path.joinpath('suite2p', self.eid)
+            alf_path = self.session_path.joinpath('suite2p', self.name)
             self.data['F'] = np.load(alf_path.joinpath('F.npy'))
             self.data['Fneu'] = np.load(alf_path.joinpath('Fneu.npy'))
             self.data['iscell'] = np.load(alf_path.joinpath('iscell.npy'))
@@ -214,11 +244,26 @@ def load_data(self):
         else:
             raise ValueError(f'Invalid session identifier: {self.eid}')
 
+    @return_qc_datasets(['mpci.ROIActivityF.npy', 'mpci.ROINeuropilActivityF.npy', 'mpciROIs.mpciROITypes.npy',
+                         'mpci.times.npy'])
     def check_neural_quality(self, **kwargs):
         """Check the neural quality metrics."""
         neural_metrics, fov_metrics = get_neural_quality_metrics(**self.data, **kwargs)
+
         # TODO Apply thresholds
-        raise NotImplementedError
+        return spec.QC.WARNING, neural_metrics  # Don't return fov_metric as this is one per cell which is large
+        # raise NotImplementedError
+
+    @return_qc_datasets(['mpci.times.npy'])
+    def check_timestamps_consistency(self, **kwargs):
+        """Check the timestamps are the same length as the fluorescence data"""
+
+        if self.data['times'] is None:
+            return spec.QC.NOT_SET
+
+        metrics = spec.QC.PASS if self.data['times'].size == self.data['F'].shape[0] else spec.QC.FAIL
+
+        return metrics
 
     @staticmethod
     def qc_session(eid, one=None, **kwargs):
@@ -232,9 +277,11 @@ def qc_session(eid, one=None, **kwargs):
         however to update the FOV endpoint, this relies on the MesoscopeFOV task having been run, and for the
         data, the MesoscopePreprocess task.
         """
+        update = kwargs.pop('update', False)
         session_qc = base.QC(eid, one=one)
         one = session_qc.one
         remote = session_qc.one and not session_qc.one.offline
+        fov_qcs = dict()
         if remote:
             collections = session_qc.one.list_collections(eid, collection='alf/FOV_??')
             collections = sorted(map(session_qc.session_path.joinpath, collections))
@@ -246,7 +293,7 @@ def qc_session(eid, one=None, **kwargs):
                     continue
                 qc = MesoscopeQC(endpoint_id, one=one, endpoint='fields-of-view')
                 qc.session_path = session_qc.session_path
-                outcomes, extended = qc.run(update=False)
+                fov_qcs[f'alf/{collection.name}'] = qc.run(update=update)
         else:
             collections = sorted(session_qc.session_path.glob('alf/FOV_??'))
             if not collections:
@@ -254,8 +301,106 @@ def qc_session(eid, one=None, **kwargs):
             for collection in collections:
                 qc = MesoscopeQC(collection.name, one=one, endpoint='fields-of-view')
                 qc.session_path = session_qc.session_path
-                outcomes, extended = qc.run(update=False)
-                # TODO Log or store outcomes for each FOV
+                fov_qcs[f'alf/{collection.name}'] = qc.run(update=update)
+
+        # TODO Log or store outcomes for each FOV
+        return fov_qcs
+
+
+def update_dataset_qc_for_session(eid, qc, registered_datasets, one, override=False):
+    """
+    Update QC values for individual datasets associated to a session
+
+    Parameters
+    ----------
+    eid: str or UUID
+        The session identifier
+    qc : dict
+        Output of MesoscopeQC.qc_session: a map of collection to the (outcome, metrics, dataset_qc) of each FOV
+    registered_datasets : list of dict
+        A list of Alyx dataset records.
+    one : one.api.OneAlyx
+        An online instance of ONE.
+    override : bool
+        If True the QC field is updated even if new value is better than previous.
+
+    Returns
+    -------
+    dict of lists
+        For each collection in the qc returns a list of associated datasets that had their qc updated
+    """
+    datasets = {}
+    for collection in qc.keys():
+        reg_dsets = [d for d in registered_datasets if d['collection'] == collection]
+        dsets = update_dataset_qc_for_collection(eid, collection, qc[collection][2], reg_dsets, one, override=override)
+        datasets[collection] = dsets
+
+    return datasets
+
+
+def update_dataset_qc_for_collection(eid, collection, dataset_qc, registered_datasets, one, override=False):
+    """
+    Update QC values for individual datasets associated to a collection (normally 'alf/FOV_??')
+
+    Parameters
+    ----------
+    eid: str or UUID
+        The session identifier
+    collection: str
+        Collection that the datasets belong to. Assumes the collection is the same for all datasets provided in
+        registered_datasets and dataset_qc.
+    dataset_qc : dict
+        A dictionary containing dataset name as keys and the associated qc as values
+    registered_datasets : list of dict
+        A list of Alyx dataset records.
+    one : one.api.OneAlyx
+        An online instance of ONE.
+    override : bool
+        If True the QC field is updated even if new value is better than previous.
+
+    Returns
+    -------
+    list of dict
+        The registered datasets plus any records fetched from Alyx, with the 'qc' field set on those updated.
+    """
+
+    datasets = registered_datasets.copy()
+
+    # Create map of dataset name, sans extension, to dataset id
+    stem2id = {PurePosixPath(dset['name']).stem: dset.get('id') for dset in registered_datasets}
+    # Ensure dataset stems are unique
+    assert len(stem2id) == len(registered_datasets), 'ambiguous dataset names'
+
+    # If the dataset that we are updating is not part of the registered datasets we need to fetch the dataset info
+    extra_dsets = [k for k in dataset_qc if PurePosixPath(k).stem not in stem2id.keys()]
+    for extra in extra_dsets:
+        dset = one.alyx.rest('datasets', 'list', session=eid, name=extra, collection=collection)
+        if len(dset) == 0:
+            # If the dataset doesn't exist we continue
+            _log.debug('dataset %s not registered, skipping', extra)
+            continue
+        if len(dset) > 0:
+            # The query returns a list of records; keep the one flagged as the default dataset
+            dset = next(d for d in dset if d['default_dataset'])
+
+        dset['id'] = dset['url'][-36:]
+        stem2id[PurePosixPath(dset['name']).stem] = dset['id']
+
+        datasets.append(dset)
+
+    # Work over map of dataset name to outcome and update the dataset qc
+    for name, outcome in dataset_qc.items():
+        # Check if dataset was registered to Alyx
+        if not (did := stem2id.get(PurePosixPath(name).stem)):
+            _log.debug('dataset %s not registered, skipping', name)
+            continue
+        # Update the dataset QC value on Alyx
+        if outcome > spec.QC.NOT_SET or override:
+            dset_qc = base.QC(did, one=one, log=_log, endpoint='datasets')
+            dset = next(x for x in datasets if did == x.get('id'))
+            dset['qc'] = dset_qc.update(outcome, namespace='', override=override).name
+
+    return datasets
 
 
 if __name__ == '__main__':
diff --git a/ibllib/tests/qc/test_mesoscope_qc.py b/ibllib/tests/qc/test_mesoscope_qc.py
new file mode 100644
index 000000000..c83988e31
--- /dev/null
+++ b/ibllib/tests/qc/test_mesoscope_qc.py
@@ -0,0 +1,174 @@
+import unittest
+from unittest import mock
+from ibllib.qc.mesoscope import MesoscopeQC, update_dataset_qc_for_collection
+import numpy as np
+from one.alf import spec
+from pathlib import Path
+from uuid import uuid4
+
+
+class TestMesoscopeQC(unittest.TestCase):
+    """Tests for the MesoscopeQC checks and run method, using a mocked ONE instance."""
+    def setUp(self):
+        one = mock.MagicMock()
+        self.qc = MesoscopeQC('FOV_00', one=one, endpoint='fields-of-view')
+        self.qc.load_data = mock.MagicMock()  # replace load_data with a mock; the tests assign self.qc.data directly
+
+    def test_only_dset(self):  # with only_dsets=True the check returns its list of dataset names
+        out = self.qc.check_timestamps_consistency(only_dsets=True)
+        self.assertEqual(out, ['mpci.times.npy'])
+
+    def test_check_timestamps_pass(self):  # F has 10 rows and there are 10 timestamps -> PASS
+        self.qc.data = {'F': np.ones((10, 3)), 'times': np.ones(10)}
+        out = self.qc.check_timestamps_consistency()
+        self.assertEqual(out, spec.QC.PASS)
+
+    def test_check_timestamps_fail(self):  # F has 10 rows but there are only 8 timestamps -> FAIL
+        self.qc.data = {'F': np.ones((10, 3)), 'times': np.ones(8)}
+        out = self.qc.check_timestamps_consistency()
+        self.assertEqual(out, spec.QC.FAIL)
+
+    @mock.patch('ibllib.qc.mesoscope.get_neural_quality_metrics')
+    def test_run(self, mock_neural_quality_metrics):
+        # F has 10 rows but only 8 timestamps are provided, so check_timestamps_consistency will fail
+        self.qc.data = {'F': np.ones((10, 3)), 'times': np.ones(8)}
+
+        # TODO change once actual thresholds are being applied
+        mock_neural_quality_metrics.return_value = {}, {}  # stands in for (neural_metrics, fov_metrics)
+
+        out, metrics, dsets = self.qc.run()
+
+        # TODO change if dependent on other qc tests
+        self.assertEqual(out, spec.QC.FAIL)
+        self.assertEqual(len(dsets), 4)
+        # TODO update datasets as necessary with checks
+        for name in ['mpci.ROIActivityF.npy', 'mpci.ROINeuropilActivityF.npy', 'mpciROIs.mpciROITypes.npy']:
+            self.assertEqual(dsets.get(name), spec.QC.WARNING)
+
+        # Make sure for the mpci.times we get the worst of the qc values available
+        self.assertEqual(dsets['mpci.times.npy'], spec.QC.FAIL)
+
+
+class TestMesoscopeSessionQC(unittest.TestCase):
+    """Tests for MesoscopeQC.qc_session with MesoscopeQC.run and the update methods mocked."""
+    def setUp(self):
+        self.one = mock.MagicMock()
+        self.one.offline = False  # set explicitly: an auto-created MagicMock attribute would be truthy
+
+    @mock.patch('ibllib.qc.base.QC.update')
+    @mock.patch('ibllib.qc.mesoscope.MesoscopeQC.update')
+    @mock.patch('ibllib.qc.mesoscope.MesoscopeQC.run')  # innermost patch -> first mock argument (meso_qc)
+    def test_session_qc(self, meso_qc, meso_update, base_update):
+        """Test that qc_session returns one entry per FOV collection, keyed by collection name."""
+        names = [{'name': 'FOV_00'}, {'name': 'FOV_01'}, {'name': 'FOV_02'}]  # consumed in order by 'read' requests
+
+        def rest_function(*args, **kwargs):
+            # The second positional argument of one.alyx.rest is the REST action
+            method = args[1]
+            if method == 'list':
+                return [{'id': str(uuid4()), 'name': 'FOV_00'}, {'id': str(uuid4()), 'name': 'FOV_01'},
+                        {'id': str(uuid4()), 'name': 'FOV_02'},]
+            elif method == 'read':
+                return names.pop(0)
+            else:
+                return None
+        # NOTE(review): return_value (not side_effect) makes each patched update return the lambda itself - confirm intent
+        base_update.return_value = lambda *args, **kwargs: {'qc': spec.QC.NOT_SET.name,
+                                                            'json': {'extended_qc': None}}
+        meso_update.return_value = lambda *args, **kwargs: {'qc': spec.QC.NOT_SET.name,
+                                                            'json': {'extended_qc': None}}
+        meso_qc.side_effect = [(spec.QC.PASS, {}, []), (spec.QC.WARNING, {}, []), (spec.QC.WARNING, {}, [])]
+
+        self.one.list_collections.return_value = ['alf/FOV_00', 'alf/FOV_01', 'alf/FOV_02']
+        self.one.alyx.rest.side_effect = rest_function
+        self.one.eid2path.return_value = Path('/mnt/s0/Data/Subjects/SP054/2022-03-23/001')
+
+        out = MesoscopeQC.qc_session(str(uuid4()), self.one)
+        self.assertEqual(len(out), 3)
+        self.assertEqual(list(out.keys()), ['alf/FOV_00', 'alf/FOV_01', 'alf/FOV_02'])
+        self.assertEqual(out['alf/FOV_00'][0], spec.QC.PASS)  # first element of each entry is the mocked run outcome
+        self.assertEqual(out['alf/FOV_01'][0], spec.QC.WARNING)
+        self.assertEqual(out['alf/FOV_02'][0], spec.QC.WARNING)
+
+
+class TestDatasetQC(unittest.TestCase):
+    """Tests for update_dataset_qc_for_collection using a mocked ONE instance."""
+    def setUp(self):
+        """Create the mocked ONE instance, the canned REST responses and the dataset QC map."""
+        self.one = mock.MagicMock()
+
+        self.list_datasets = [  # responses handed out, in order, to successive 'list' requests
+            [{'name': 'mpci.ROIActivityF.npy', 'qc': 'NOT_SET', 'url': f'lala/{str(uuid4())}', 'default_dataset': True}],
+            [{'name': 'mpci.ROINeuropilActivityF.npy', 'qc': 'NOT_SET', 'url': f'lala/{str(uuid4())}', 'default_dataset': True}],
+            [], []  # empty responses, i.e. no matching dataset was found
+        ]
+
+        self.dataset_qc = {  # map of dataset name to the QC outcome to apply
+            'mpci.ROIActivityF.npy': spec.QC.WARNING,
+            'mpci.ROINeuropilActivityF.npy': spec.QC.PASS,
+            'mpciROIs.mpciROITypes.npy': spec.QC.WARNING,
+            'mpci.times.npy': spec.QC.PASS,
+        }
+
+        self.registered_datasets = [  # dataset records that already carry an 'id'
+            {'name': 'mpci.times.npy', 'qc': 'NOT_SET', 'id': str(uuid4()), 'default_dataset': True},
+            {'name': 'mpciROIs.mpciROITypes.npy', 'qc': 'NOT_SET', 'id': str(uuid4()), 'default_dataset': True},
+        ]
+
+    def test_update_dataset_qc(self):
+        """Test mesoscope.update_dataset_qc_for_collection function."""
+
+        def rest_function(*args, **kwargs):
+            # The second positional argument of one.alyx.rest is the REST action
+            method = args[1]
+            if method == 'list':
+                return list_datasets.pop(0)  # hand out the next canned response
+            elif method == 'partial_update':
+                return kwargs.get('data')  # echo back the payload that was passed in
+            else:
+                return None
+
+        self.one.alyx.rest.side_effect = rest_function
+        self.one.offline = False
+
+        # Test when no registered datasets, original dataset qc is NOT_SET and override=False
+        self.one.alyx.get.side_effect = lambda *args, **kwargs: {'qc': spec.QC.NOT_SET.name, 'json': {'extended_qc': None}}
+        list_datasets = self.list_datasets.copy()  # shallow copy, so pop() leaves self.list_datasets intact
+        out = update_dataset_qc_for_collection(str(uuid4()), 'alf/FOV_00',
+                                               self.dataset_qc, [], self.one, override=False)
+        self.assertEqual(len(out), 2)
+        self.assertEqual(next(o for o in out if o['name'] == 'mpci.ROIActivityF.npy')['qc'], spec.QC.WARNING.name)
+        self.assertEqual(next(o for o in out if o['name'] == 'mpci.ROINeuropilActivityF.npy')['qc'], spec.QC.PASS.name)
+
+        # Test when no registered datasets, original dataset qc is FAIL and override=False
+        self.one.reset_mock()
+        self.one.alyx.get.side_effect = lambda *args, **kwargs: {'qc': spec.QC.FAIL.name, 'json': {'extended_qc': None}}
+        list_datasets = self.list_datasets.copy()
+        out = update_dataset_qc_for_collection(str(uuid4()), 'alf/FOV_00',
+                                               self.dataset_qc, [], self.one, override=False)
+        self.assertEqual(len(out), 2)
+        self.assertEqual(next(o for o in out if o['name'] == 'mpci.ROIActivityF.npy')['qc'], spec.QC.FAIL.name)
+        self.assertEqual(next(o for o in out if o['name'] == 'mpci.ROINeuropilActivityF.npy')['qc'], spec.QC.FAIL.name)
+
+        # Test when no registered datasets, original dataset qc is FAIL and override=True
+        self.one.reset_mock()
+        self.one.alyx.get.side_effect = lambda *args, **kwargs: {'qc': spec.QC.FAIL.name, 'json': {'extended_qc': None}}
+        list_datasets = self.list_datasets.copy()
+        out = update_dataset_qc_for_collection(str(uuid4()), 'alf/FOV_00',
+                                               self.dataset_qc, [], self.one, override=True)
+        self.assertEqual(len(out), 2)
+        self.assertEqual(next(o for o in out if o['name'] == 'mpci.ROIActivityF.npy')['qc'], spec.QC.WARNING.name)
+        self.assertEqual(next(o for o in out if o['name'] == 'mpci.ROINeuropilActivityF.npy')['qc'], spec.QC.PASS.name)
+
+        # Test when passing registered datasets
+        self.one.reset_mock()
+        self.one.alyx.get.side_effect = lambda *args, **kwargs: {'qc': spec.QC.NOT_SET.name,
+                                                                 'json': {'extended_qc': None}}
+        list_datasets = self.list_datasets.copy()[0:2]  # responses for the two datasets absent from registered_datasets
+        out = update_dataset_qc_for_collection(str(uuid4()), 'alf/FOV_00',
+                                               self.dataset_qc, self.registered_datasets, self.one, override=True)
+        self.assertEqual(len(out), 4)
+
+
+if __name__ == '__main__':
+    unittest.main(exit=False, verbosity=2)  # exit=False: report results without calling sys.exit()

From 0a47c17696fcc0c2ad9bebb2a2b8da374f962884 Mon Sep 17 00:00:00 2001
From: Mayo Faulkner <mayo.faulkner@ucl.ac.uk>
Date: Thu, 3 Apr 2025 09:16:04 +0100
Subject: [PATCH 5/5] update qc to not set

---
 ibllib/qc/mesoscope.py               | 3 +--
 ibllib/tests/qc/test_mesoscope_qc.py | 2 +-
 2 files changed, 2 insertions(+), 3 deletions(-)

diff --git a/ibllib/qc/mesoscope.py b/ibllib/qc/mesoscope.py
index e4dcaf3f7..49a5ac8b5 100644
--- a/ibllib/qc/mesoscope.py
+++ b/ibllib/qc/mesoscope.py
@@ -251,8 +251,7 @@ def check_neural_quality(self, **kwargs):
         neural_metrics, fov_metrics = get_neural_quality_metrics(**self.data, **kwargs)
 
         # TODO Apply thresholds
-        return spec.QC.WARNING, neural_metrics  # Don't return fov_metric as this is one per cell which is large
-        # raise NotImplementedError
+        return spec.QC.NOT_SET, neural_metrics  # Don't return fov_metric as this is one per cell which is large
 
     @return_qc_datasets(['mpci.times.npy'])
     def check_timestamps_consistency(self, **kwargs):
diff --git a/ibllib/tests/qc/test_mesoscope_qc.py b/ibllib/tests/qc/test_mesoscope_qc.py
index c83988e31..bb4b46fcd 100644
--- a/ibllib/tests/qc/test_mesoscope_qc.py
+++ b/ibllib/tests/qc/test_mesoscope_qc.py
@@ -43,7 +43,7 @@ def test_run(self, mock_neural_quality_metrics):
         self.assertEqual(len(dsets), 4)
         # TODO update datasets as necessary with checks
         for name in ['mpci.ROIActivityF.npy', 'mpci.ROINeuropilActivityF.npy', 'mpciROIs.mpciROITypes.npy']:
-            self.assertEqual(dsets.get(name), spec.QC.WARNING)
+            self.assertEqual(dsets.get(name), spec.QC.NOT_SET)
 
         # Make sure for the mpci.times we get the worst of the qc values available
         self.assertEqual(dsets['mpci.times.npy'], spec.QC.FAIL)