Coverage for ibllib/qc/base.py: 93%

1import logging (empty)

2from abc import abstractmethod (empty)

3from pathlib import Path (empty)

4from itertools import chain (empty)

6import numpy as np (empty)

7from one.api import ONE (empty)

8from one.alf import spec (empty)

#: dict: custom sign off categories. Maps a device name to the list of sub-keys that
#: `sign_off_dict` expands into one sign-off entry each for that device.
SIGN_OFF_CATEGORIES = {
    'neuropixel': [
        'raw',
        'spike_sorting',
        'alignment',
    ],
}

class QC:
    """A base class for data quality control.

    An instance is bound to one Alyx record (by default a session) and keeps a local
    copy of that record's QC outcome in sync with the remote 'qc' and 'extended_qc'
    fields.  For endpoints whose records have no dedicated 'qc' field, the QC is stored
    inside the record's 'json' field instead (``self.json`` is True in that case).

    Note that `run` and `load_data` are decorated with `abstractmethod`, but because this
    class does not derive from `abc.ABC` the decorators are not enforced at instantiation.
    """

    def __init__(self, endpoint_id, one=None, log=None, endpoint='sessions'):
        """
        Bind the QC object to an Alyx record and fetch its current QC outcome.

        :param endpoint_id: Eid for endpoint. If using sessions can also be a session path
        :param one: An ONE instance for fetching and setting the QC on Alyx. If None (or
         otherwise falsy) a new ONE instance is created
        :param log: A logging.Logger instance, if None the logger named after this module
         is used
        :param endpoint: The endpoint name to apply qc to. Default is 'sessions'
        :raises ValueError: the endpoint id is not a valid session path / uuid, or no
         record was found for it on the given endpoint
        """
        self.one = one or ONE()
        self.log = log or logging.getLogger(__name__)
        self.endpoint = endpoint
        if endpoint == 'sessions':
            self._set_eid_or_path(endpoint_id)
            # Session records carry dedicated qc and extended_qc fields
            self.json = False
        else:
            # Sets self.eid and self.json after checking the record exists
            self._confirm_endpoint_id(endpoint_id)

        # Ensure outcome attribute matches Alyx record
        updatable = self.eid and self.one and not self.one.offline
        if updatable:
            # NOT_SET with an empty namespace: the remote value is only read back here,
            # unless the update call below finds something lower than NOT_SET
            self._outcome = self.update('NOT_SET', namespace='')
        else:
            self._outcome = spec.QC.NOT_SET
        self.log.debug(f'Current QC status is {self.outcome}')

    @abstractmethod
    def run(self):
        """Run the QC tests and return the outcome.

        :return: One of "CRITICAL", "FAIL", "WARNING" or "PASS"
        """
        pass

    @abstractmethod
    def load_data(self):
        """Load the data required to compute the QC.

        Subclasses may implement this for loading raw data.
        """
        pass

    @property
    def outcome(self):
        """one.alf.spec.QC: The overall session outcome."""
        return self._outcome

    @outcome.setter
    def outcome(self, value):
        """Set the outcome, but only if `value` is greater (worse) than the current one."""
        value = spec.QC.validate(value)  # ensure valid enum
        if self._outcome < value:
            self._outcome = value

    @staticmethod
    def overall_outcome(outcomes: iter, agg=max) -> 'spec.QC':
        """
        Given an iterable of QC outcomes, returns the overall (i.e. worst) outcome.

        None and NaN entries are ignored; every remaining entry is passed through
        `spec.QC.validate` before aggregation.

        Example:
          QC.overall_outcome(['PASS', 'NOT_SET', None, 'FAIL'])  # Returns the FAIL outcome

        Parameters
        ----------
        outcomes : iterable of one.alf.spec.QC, str or int
            An iterable of QC outcomes.
        agg : function
            Outcome code aggregate function, default is max (i.e. worst).

        Returns
        -------
        one.alf.spec.QC
            The overall outcome.

        Raises
        ------
        ValueError
            With the default `agg`, when no outcome remains after None/NaN removal
            (`max` of an empty iterable).
        """
        def _is_missing(value):
            # `np.NaN` no longer exists in NumPy >= 2.0, and a membership test against
            # (None, nan) only catches the np.nan singleton itself; test by value instead
            if value is None:
                return True
            return isinstance(value, (float, np.floating)) and bool(np.isnan(value))

        valid = (x for x in outcomes if not _is_missing(x))
        return agg(map(spec.QC.validate, valid))

    def _set_eid_or_path(self, session_path_or_eid):
        """Parse a given eID or session path.

        If a session UUID is given, resolves and stores the local path and vice versa.
        Sets `self.eid` and `self.session_path`.

        :param session_path_or_eid: A session eid or path
        :raises ValueError: the input is neither a uuid string nor a session path
        """
        self.eid = None
        if spec.is_uuid_string(str(session_path_or_eid)):
            self.eid = session_path_or_eid
            # Try to set session_path if data is found locally
            self.session_path = self.one.eid2path(self.eid)
        elif spec.is_session_path(session_path_or_eid):
            self.session_path = Path(session_path_or_eid)
            if self.one is not None:
                self.eid = self.one.path2eid(self.session_path)
                if not self.eid:
                    self.log.warning('Failed to determine eID from session path')
        else:
            self.log.error('Cannot run QC: an experiment uuid or session path is required')
            raise ValueError("'session' must be a valid session path or uuid")

    def _confirm_endpoint_id(self, endpoint_id):
        """Check the record exists on the endpoint and prepare its JSON field for QC.

        Sets `self.eid`, and sets `self.json` to True when the record has no 'qc' field of
        its own.  When the record lacks a 'qc' and/or 'extended_qc' field, default values
        for the missing ones are written to the record's 'json' field, unless that field
        already holds a QC value.

        :param endpoint_id: The uuid of the record on `self.endpoint`
        :raises ValueError: no record was returned for the given id
        """
        # Have as read for now since 'list' isn't working
        target_obj = self.one.alyx.get(f'/{self.endpoint}/{endpoint_id}', clobber=True) or None
        if not target_obj:
            self.log.error('Cannot run QC: endpoint id is not recognised')
            raise ValueError("'endpoint_id' must be a valid uuid")

        self.json = 'qc' not in target_obj
        self.eid = endpoint_id

        # Defaults for whichever QC fields the record does not natively provide
        default_data = {}
        if self.json:
            default_data['qc'] = 'NOT_SET'
        if 'extended_qc' not in target_obj:
            default_data['extended_qc'] = {}
        if not default_data:
            return  # No need to set up JSON for QC

        json_field = target_obj.get('json')
        if not json_field or (self.json and not json_field.get('qc', None)):
            self.one.alyx.json_field_update(endpoint=self.endpoint, uuid=self.eid,
                                            field_name='json', data=default_data)

    def update(self, outcome=None, namespace='experimenter', override=False):
        """Update the qc field in Alyx.

        Updates the 'qc' field in Alyx if the new QC outcome is worse than the current value.

        Parameters
        ----------
        outcome : str, int, one.alf.spec.QC
            A QC outcome; one of "CRITICAL", "FAIL", "WARNING", "PASS" or "NOT_SET".
            If None, the instance's current outcome is used.
        namespace : str
            The extended QC key specifying the type of QC associated with the outcome.
            If empty, nothing is recorded in the extended QC.
        override : bool
            If True the QC field is updated even if new value is better than previous.

        Returns
        -------
        one.alf.spec.QC
            The current QC outcome on Alyx. None is returned when ONE is in offline mode,
            in which case nothing is updated.

        Example
        -------
        >>> qc = QC('path/to/session')
        >>> qc.update('PASS')  # Update current QC field to 'PASS' if not set
        """
        assert self.one, 'instance of one should be provided'
        if self.one.offline:
            self.log.warning('Running on OneOffline instance, unable to update remote QC')
            return
        outcome = spec.QC.validate(self.outcome if outcome is None else outcome)
        assert self.eid, 'Unable to update Alyx; eID not set'
        if namespace:  # Record in extended qc
            self.update_extended_qc({namespace: outcome.name})
        details = self.one.alyx.get(f'/{self.endpoint}/{self.eid}', clobber=True)
        current_status = (details['json'] if self.json else details)['qc']
        current_status = spec.QC.validate(current_status)

        if current_status < outcome or override:
            if self.json:
                # QC lives inside the record's JSON field
                r = self.one.alyx.json_field_update(endpoint=self.endpoint, uuid=self.eid,
                                                    field_name='json', data={'qc': outcome.name})
            else:
                r = self.one.alyx.rest(self.endpoint, 'partial_update', id=self.eid,
                                       data={'qc': outcome.name})

            current_status = spec.QC.validate(r['qc'])
            assert current_status == outcome, 'Failed to update session QC'
            self.log.info(f'QC field successfully updated to {outcome.name} for {self.endpoint[:-1]} '
                          f'{self.eid}')
        self._outcome = current_status
        return self.outcome

    def update_extended_qc(self, data):
        """Update the extended_qc field in Alyx.

        Subclasses should chain a call to this.

        NaN values are replaced with None before upload.  Note that the replacement is
        made in place, i.e. the dict passed in by the caller is modified.

        :param data: a dict of qc tests and their outcomes, typically a value between 0. and 1.
        :return: the updated extended_qc field (the value returned by Alyx), or None when
         ONE is in offline mode
        """
        assert self.eid, 'Unable to update Alyx; eID not set'
        assert self.one, 'instance of one should be provided'
        if self.one.offline:
            self.log.warning('Running on OneOffline instance, unable to update remote QC')
            return

        # Ensure None instead of NaNs
        for k, v in data.items():
            if v is None or isinstance(v, str):
                continue
            if isinstance(v, tuple):
                # None elements are kept as they are: np.isnan(None) raises a TypeError
                data[k] = tuple(
                    None if i is None or (not isinstance(i, str) and np.isnan(i)) else i
                    for i in v)
            else:
                data[k] = None if np.isnan(v).all() else v

        details = self.one.alyx.get(f'/{self.endpoint}/{self.eid}', clobber=True)
        if 'extended_qc' not in details:
            # No dedicated field: the extended QC is kept within the record's JSON field.
            # Tolerate a JSON field that is empty or that has no extended QC yet.
            extended_qc = (details.get('json') or {}).get('extended_qc') or {}
            extended_qc.update(data)
            extended_qc_dict = {'extended_qc': extended_qc}
            out = self.one.alyx.json_field_update(
                endpoint=self.endpoint, uuid=self.eid, field_name='json', data=extended_qc_dict)
        else:
            extended_qc = details['extended_qc'] or {}
            extended_qc.update(data)
            out = self.one.alyx.json_field_update(
                endpoint=self.endpoint, uuid=self.eid, field_name='extended_qc', data=extended_qc)

        self.log.info(f'Extended QC field successfully updated for {self.endpoint[:-1]} '
                      f'{self.eid}')
        return out

    def compute_outcome_from_extended_qc(self) -> 'spec.QC':
        """Return the session outcome computed from aggregating the extended QC.

        Extended QC keys beginning with an underscore are excluded from the aggregate.
        When the record's extended QC is empty or unset, or contains only underscore keys,
        NOT_SET is returned.
        """
        details = self.one.alyx.get(f'/{self.endpoint}/{self.eid}', clobber=True)
        extended_qc = details['json']['extended_qc'] if self.json else details['extended_qc']
        # The fallback must apply to the dict itself: None has no .items() to call
        outcomes = [v for k, v in (extended_qc or {}).items() if not k.startswith('_')]
        if not outcomes:
            return spec.QC.NOT_SET
        return self.overall_outcome(outcomes)

227

228

def sign_off_dict(exp_dec, sign_off_categories=None):
    """
    Build the sign off checklist for an experiment description.

    One key is created per device and per task protocol found in the provided experiment
    description.  Every key is prefixed with an underscore and maps to None.

    Parameters
    ----------
    exp_dec : dict
        A loaded experiment description file.
    sign_off_categories : dict of list
        A dictionary of custom JSON keys for a given device in the acquisition description
        file. When None or empty, the module-level SIGN_OFF_CATEGORIES is used.

    Returns
    -------
    dict of dict
        The sign off dictionary with the main key 'sign_off_checklist' containing keys for
        each device and task protocol.

    Raises
    ------
    AssertionError
        If the value of a 'devices' entry is not a non-empty dict.
    """
    # NB: each entry under 'devices' is expected to be a dict of dicts,
    # e.g. {'devices': {'DAQ_1': {'device_1': {}, 'device_2': {}},}
    categories = sign_off_categories or SIGN_OFF_CATEGORIES
    checklist = set()
    for device, settings in exp_dec.get('devices', {}).items():
        assert isinstance(settings, dict) and settings
        # A device with custom categories gets one key stem per category
        if device in categories:
            stems = [f'{device}_{category}' for category in categories[device]]
        else:
            stems = [device]
        if list(settings) == [device]:
            # Sole sub-device shares the device's name: no sub-device suffix
            checklist.update(stems)
        else:
            checklist.update(f'{stem}_{name}' for name in settings for stem in stems)

    # One key per task protocol, suffixed with its zero-padded position
    protocols = chain.from_iterable(map(dict.keys, exp_dec.get('tasks', [])))
    for index, protocol in enumerate(protocols):
        checklist.add(f'{protocol}_{index:02}')

    return {'sign_off_checklist': {f'_{key}': None for key in checklist}}