dreyevr_recording_analyzer/ibmm.py at main · HARPLab/dreyevr_recording_analyzer · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
#!/usr/bin/env python

import collections
import collections.abc

import numpy as np
import pandas as pd
import sklearn.metrics.pairwise
import sklearn.mixture

class Options(collections.abc.Mapping):
    """
    Dict-like view over the attributes named in a subclass's ``__slots__``.

    Subclasses list their option names in ``__slots__`` and assign them in
    ``__init__``. Instances can then be read and written by key, iterated,
    converted with ``dict(opts)`` and expanded with ``**opts``.

    The base class is ``collections.abc.Mapping``; the old ``collections.Mapping``
    alias no longer exists on Python 3.10+.
    """

    @classmethod
    def keys(cls):
        """Return the option names (the class's ``__slots__``)."""
        return cls.__slots__

    def __getitem__(self, key):
        # NOTE(review): an unknown key surfaces as AttributeError (from getattr),
        # not KeyError.
        return getattr(self, key)

    def __setitem__(self, key, val):
        setattr(self, key, val)

    @classmethod
    def __iter__(cls):
        return iter(cls.__slots__)

    @classmethod
    def __len__(cls):
        return len(cls.__slots__)

    def __repr__(self):
        return '{}({})'.format(self.__class__.__name__, dict(self))

class EyeClassifier:
    LABEL_FIX = 0
    LABEL_SAC = 1
    LABEL_NOISE = -1

    def __init__(self, **kwargs):
        """
        Create the (still unfitted) mixture models.

        Arguments:
        kwargs -- forwarded unchanged to every sklearn.mixture.BayesianGaussianMixture that is built
        """
        def new_mixture():
            # One two-component model; the label order of the components is decided in fit()
            return sklearn.mixture.BayesianGaussianMixture(
                n_components=2,
                weight_concentration_prior_type='dirichlet_distribution',
                **kwargs)

        # One model per eye, plus one for the world frame; labels stay None until fit()
        self.eye_models = (new_mixture(), new_mixture())
        self.eye_labels = None
        self.world_model = new_mixture()
        self.world_labels = None

    class PreprocessOptions(Options):
        """
        Option bundle for preprocessing: 'dist_method', 'conf_threshold' and 'smoothing'.

        Missing, None or empty 'dist_method'/'smoothing' fall back to 'vector' and 'none'.
        'conf_threshold' falls back to 0.8 only when missing or None, so an explicit
        threshold of 0 (accept every sample) is kept.
        """
        __slots__ = ('dist_method', 'conf_threshold', 'smoothing')
        __ros_name__ = 'preprocess_options'
        def __init__(self, **kwargs):
            self.dist_method = kwargs.get('dist_method') or 'vector'
            # Do not use `or` here: 0 is a valid threshold but is falsy
            conf_threshold = kwargs.get('conf_threshold')
            self.conf_threshold = 0.8 if conf_threshold is None else conf_threshold
            self.smoothing = kwargs.get('smoothing') or 'none'

    @staticmethod
    def preprocess(data, dist_method='vector', conf_thresh=0.8, smoothing='none'):
        """
        Preprocess input x/y positions to get pairwise distances and remove low-confidence values

        Keyword arguments:
        data -- Input pandas-style dataframe with columns 'timestamp', 'confidence', 'x', 'y', optionally 'z' (ignored if method is 'euclidean', used if method is 'vector' and set to 1.0 if missing)
        dist_method -- 'vector' (compute angle between eye rays) or 'euclidean' (compute euclidean distance)
        conf_threshold -- valid confidence to accept
        smoothing -- preprocessing of signal to smooth values, options currently only include 'none'

        Returns:
        a pandas dataframe with columns 'timestamp', 'velocity' (which may be nan, corresponding to noise)
        """
        # Validate arguments
        DIST_METHOD_VECTOR = 'vector'
        DIST_METHOD_EUC = 'euclidean'
        DIST_METHODS = [DIST_METHOD_VECTOR, DIST_METHOD_EUC]
        if dist_method not in DIST_METHODS:
            raise ValueError('Unrecognized distance method {}, must be one of {}'.format(dist_method, DIST_METHODS))

        SMOOTHING_NONE = 'none'
        SMOOTHINGS = [SMOOTHING_NONE]
        if smoothing not in SMOOTHINGS:
            raise ValueError('Unrecognized smoothing method {}, must be one of {}'.format(smoothing, SMOOTHINGS))

        if np.any(np.diff(data['timestamp']) <= 0.):
            raise ValueError('Timestamps identical or out of sequence')

        # Data extraction
        if 'z' in data.columns and dist_method == DIST_METHOD_VECTOR:
            pos = data.loc[:, ['x','y','z']].values
        elif dist_method == DIST_METHOD_VECTOR:
            pos = np.hstack( (data.loc[:, ['x','y']].values, np.ones( (len(data), 1) )) )
        elif dist_method == DIST_METHOD_EUC:
            pos = data.loc[:, ['x','y']].values
        else:
            raise RuntimeError("unreachable")

        # fail if no data
        if pos.shape[0] < 2:
            return pd.DataFrame({'timestamp': data.timestamp, 'velocity': np.full(pos.shape[0], np.nan)})

        # TODO: smoothing


        # Compute velocity
        if dist_method == DIST_METHOD_VECTOR:
            sdist = sklearn.metrics.pairwise.paired_cosine_distances(pos[1:,:], pos[:-1,:])
            # Clamp to handle numeric errors
            sdist[sdist > 1.] = 1.
            sdist[sdist < -1.] = -1.
            dist = np.arcsin(sdist)
        elif dist_method == DIST_METHOD_EUC:
            dist = sklearn.metrics.pairwise.paired_euclidean_distances(pos[1:,:], pos[:-1,:])
        else:
            raise RuntimeError("unreachable")
        dt = np.diff(data['timestamp'].values)

        veloc = dist / dt

        # Remove low-confidence values
        veloc[ np.logical_or(data.confidence.values[1:] < conf_thresh,
                             data.confidence.values[:-1] < conf_thresh) ] = np.nan
        # add a nan value at the beginning so the data point count remains the same
        veloc = np.concatenate( ([np.nan], veloc) )

        return pd.DataFrame({'timestamp': data['timestamp'], 'velocity': veloc}, index=data.index)

    @staticmethod
    def _fit(model, data):
        model.fit(data.loc[np.logical_not(pd.isnull(data['velocity'])), 'velocity'].values.reshape(-1,1))

    def fit(self, eyes=None, world=None):
        """
        Fit the bayesian mixture models for each eye.

        Arguments:
        eyes -- An iterable of length 1 or 2, including preprocessed data (in the format output by preprocess() ), of eye positions
        world -- Preprocessed world positions
        """
        if eyes is not None:
            if len(eyes) > 0:
                EyeClassifier._fit(self.eye_models[0], eyes[0])
                if self.eye_models[0].means_[0] < self.eye_models[0].means_[1]:
                    self.eye_labels = [np.array([EyeClassifier.LABEL_FIX, EyeClassifier.LABEL_SAC])]
                else:
                    self.eye_labels = [np.array([EyeClassifier.LABEL_SAC, EyeClassifier.LABEL_FIX])]
            if len(eyes) > 1:
                EyeClassifier._fit(self.eye_models[1], eyes[1])
                if self.eye_models[1].means_[0] < self.eye_models[1].means_[1]:
                    self.eye_labels.append(np.array([EyeClassifier.LABEL_FIX, EyeClassifier.LABEL_SAC]))
                else:
                    self.eye_labels.append(np.array([EyeClassifier.LABEL_SAC, EyeClassifier.LABEL_FIX]))

        if world is not None:
            EyeClassifier._fit(self.world_model, world)
            if self.world_model.means_[0] < self.world_model.means_[1]:
                self.world_labels = np.array([EyeClassifier.LABEL_FIX, EyeClassifier.LABEL_SAC])
            else:
                self.world_labels = np.array([EyeClassifier.LABEL_SAC, EyeClassifier.LABEL_FIX])

    @staticmethod
    def _predict(model, model_labels, data):
        labels = np.ones(len(data), dtype=np.int8)*EyeClassifier.LABEL_NOISE
        valid_mask = np.logical_not(pd.isnull(data['velocity']))
        if np.any(valid_mask):
            labels[valid_mask] = model_labels[model.predict(data.loc[valid_mask, 'velocity'].values.reshape(-1,1))]
        return labels

    @staticmethod
    def postprocess(labels, noise_only=True):
        """
        Post-process label assignments to clean up noise related stuff.

        For now, all this does is finds sequences ABA where B != A, A != noise, and converts them to AAA.

        This could be more sophisticated someday.
        """
        if len(labels) <= 2:
            # not enough context to fix anything
            return labels

        if noise_only:
            labels_to_fix = np.logical_and(
                np.logical_and(labels[0:-2] == labels[2:], labels[1:-1] == EyeClassifier.LABEL_NOISE),
                labels[0:-2] != EyeClassifier.LABEL_NOISE)
        else:
            labels_to_fix = np.logical_and(
                np.logical_and(labels[0:-2] == labels[2:], labels[1:-1] != labels[0:-2] ),
                labels[0:-2] != EyeClassifier.LABEL_NOISE)
        indices = np.flatnonzero(labels_to_fix)
        labels[indices+1] = labels[indices]
        return labels

    @staticmethod
    def _fuse_local(cur_labels):
        ct_sac = np.count_nonzero(cur_labels == EyeClassifier.LABEL_SAC)
        ct_fix = np.count_nonzero(cur_labels == EyeClassifier.LABEL_FIX)

        ct_nse = np.count_nonzero(cur_labels == EyeClassifier.LABEL_NOISE)

        if ct_sac > 0:
            lbl = EyeClassifier.LABEL_SAC
        elif ct_fix > 0:
            lbl = EyeClassifier.LABEL_FIX
        elif len(cur_labels) == 0:
            # no data at all, so just hold from the last one
            # likely we're sampling faster than the actual data we have
            lbl = None
        else:
            lbl = EyeClassifier.LABEL_NOISE

        return lbl, {'ct_sac': ct_sac, 'ct_nse': ct_nse, 'ct_fix': ct_fix}

    @staticmethod
    def fuse(labels, ts=None, dt=None):
        """
        Fuse different label sets to come to an agreement.

        Algorithm, roughly:
            For each period n*dt - (n+1)*dt:
                Find labels from each set within the period
                Result label = majority vote among SAC, FIX; NSE if all are noise; break ties as SAC

        Arguments:
        labels -- Iterable of pandas-style dataframe with columns 'timestamp' and 'label'
        ts -- list of timestamps to sample at, or None to use automatic samples from dt
        dt -- sampling period to use, if ts is None

        Returns:
        pandas DataFrame with columns:
            timestamp -- ts or times generated from dt
            label -- the fused labels
        """
        if ts is None and dt is not None:
            ts = np.arange( labels.timestamp.values[0], labels.timestamp.values[-1], dt)
            if ts[-1] < labels.timestamp.values[-1]:
                ts = np.hstack((ts, labels.timestamp.values[-1]))
        if ts is not None:
            fused_labels = np.full(ts.shape, EyeClassifier.LABEL_NOISE, dtype=np.int8)
            cts_sac = np.zeros(ts.shape, dtype=np.int8)
            cts_fix = np.zeros(ts.shape, dtype=np.int8)
            cts_nse = np.zeros(ts.shape, dtype=np.int8)
            for idx in range(ts.size):
                tprev = ts[idx]
                tnext = ts[idx+1] if idx < ts.size-1 else np.inf
                cur_labels = labels[np.logical_and(labels.timestamp >= tprev, labels.timestamp < tnext)]

                label, cts = EyeClassifier._fuse_local(cur_labels)

                cts_sac[idx] = cts['ct_sac']
                cts_fix[idx] = cts['ct_fix']
                cts_nse[idx] = cts['ct_nse']

                if label is not None:
                    fused_labels[idx] = label
                elif idx > 0:
                    fused_labels[idx] = fused_labels[idx-1]
        else:
            sorted_idx = np.argsort(labels.timestamp.values)
            ts = labels.timestamp.values[sorted_idx]
            fused_labels = labels.label.values[sorted_idx]
            cts_fix = (fused_labels == EyeClassifier.LABEL_FIX).astype(np.int8)
            cts_sac = (fused_labels == EyeClassifier.LABEL_SAC).astype(np.int8)
            cts_nse = (fused_labels == EyeClassifier.LABEL_NOISE).astype(np.int8)

        # Fix length-one holes
        fused_labels = EyeClassifier.postprocess(fused_labels)

        data = pd.DataFrame({'timestamp': ts, 'label': fused_labels,
                             'count_fix': cts_fix,
                             'count_sac': cts_sac,
                             'count_nse': cts_nse})
        data.index.name = 'id'
        return data


    def predict(self, eyes=None, world=None, ts=None, dt=None, fuse=True):
        """
        Predict labels from a collection of data.

        First predicts the labels for each type of data from the internal model. Then fuses the data, as described in fuse().

        Arguments:
        eyes -- 1- or 2-length iterable of eye data, in the format output by preprocess() above, or None
        world -- Eye data in the world frame, in the format output by preprocess() above, or None
        ts -- Timestamps to use, or None. See fuse() for logic.
        dt -- Time period to use, or None. See fuse() for logic.

        Returns:
        Tuple of (fused_data, iterable of labels found)
        """
        data_to_fuse = []
        if eyes is not None:
            if len(eyes) > 0:
                labels0 = EyeClassifier._predict(self.eye_models[0], self.eye_labels[0], eyes[0])
                labels0 = EyeClassifier.postprocess(labels0)
                data_to_fuse.append(pd.DataFrame({'timestamp': eyes[0].timestamp, 'label': labels0, 'source': 'eye0'}))
            if len(eyes) > 1:
                labels1 = EyeClassifier._predict(self.eye_models[1], self.eye_labels[1], eyes[1])
                labels1 = EyeClassifier.postprocess(labels1)
                data_to_fuse.append(pd.DataFrame({'timestamp': eyes[1].timestamp, 'label': labels1, 'source': 'eye1'}))

        if world is not None:
            labelsw = EyeClassifier._predict(self.world_model, self.world_labels, world)
            labelsw = EyeClassifier.postprocess(labelsw)
            data_to_fuse.append(pd.DataFrame({'timestamp': world.timestamp, 'label': labelsw, 'source': 'world'}))
        data_to_fuse = pd.concat(data_to_fuse).sort_values(by=['timestamp'])
        if fuse:
            return EyeClassifier.fuse(data_to_fuse, ts, dt), data_to_fuse
        else:
            return data_to_fuse

    @staticmethod
    def get_fixations_from_labels(labels, gaze_data=None, min_fix_dur=100, max_fix_dur=1000):
        """
        Convert a sequence of labels into detected fixations.

        Arguments:
        labels -- pandas-style dataframe with columns 'timestamp', 'label', as in supplied by EyeClassifier.fuse
        gaze_data -- Pandas-style dataframe with columns 'timestamp', 'x', 'y', or None. Fills out fixation 'x', 'y' if provided
        min_fix_dur -- minimum fixation duration to filter out (in ms), or None if no filtering is to be done
        max_fix_dur -- maximum fixation duration to divide into; fixations longer than this will be split into multiple fixations

        Returns:
        pandas dataframe of all detected fixations with columns 'start_timestamp', 'duration' (in ms). If gaze_data is provided, also
        includes columns 'x', 'y', which are the mean of the values of gaze_data.x and gaze_data.y for the duration of the fixation
        """

        # Fixations are periods of either "fixation" or "noise" that start and end with a fixation label
        # possibly there should be a limit to the amount of noise allowed within a fixation?
#         is_fix = np.logical_or(labels.label.values == EyeClassifier.LABEL_FIX,
#                                 labels.label.values == EyeClassifier.LABEL_NOISE).astype(np.int8)
        if len(labels) < 2:
            return pd.DataFrame([], columns=['start_timestamp', 'duration']), []

        is_fix = (labels.label.values == EyeClassifier.LABEL_FIX).astype(np.int8)
        fix_change = is_fix[1:] - is_fix[:-1]

        fix_start = np.flatnonzero(fix_change == 1) + 1
        fix_end = np.flatnonzero(fix_change == -1)
        if is_fix[0]:
            if is_fix[1]:
                # if there's a length-2 to start, make sure to mark it
                fix_start = np.concatenate( ([0], fix_start) )
            else:
                # if it's just length 1, remove it
                fix_end = fix_end[1:]
        if is_fix[-1]:
            if is_fix[-2]:
                fix_end = np.concatenate( (fix_end, [is_fix.size-1]))
            else:
                fix_start = fix_start[:-1]

        # Shrink fixation start and end periods to reject noise at the edges
#         def get_offset_idx(st,nd):
#             nse_idx = np.flatnonzero( labels.label.values[st:nd] != EyeClassifier.LABEL_NOISE )
#             if nse_idx.size > 0:
#                 return nse_idx[ [0,-1] ]
#             else:
#                 return [ nd-st, nd-st ]
#         noise_offsets = np.array([ get_offset_idx(st,nd) for st,nd in zip(fix_start, fix_end) ])
#         fix_end -= fix_end - fix_start - noise_offsets[:,1]
#         fix_start += noise_offsets[:,0]
        # now make sure we didn't overshoot (possible only if a "fixation" is entirely noise"
        ok_idx = fix_start < fix_end
        fix_start = fix_start[ok_idx]
        fix_end = fix_end[ok_idx]

        fix = pd.DataFrame( np.column_stack((labels.timestamp.values[fix_start],
                            (labels.timestamp.values[fix_end] - labels.timestamp.values[fix_start])* 1000.)),
                           columns=['start_timestamp', 'duration'])

        #Filter out too-short fixations
        if max_fix_dur is not None:
            fix_adj = []
            for f in fix.itertuples(index=False):
                while f.duration > max_fix_dur:
                    fix_adj.append(f._replace(duration=max_fix_dur))
                    f = f._replace(start_timestamp=f.start_timestamp+max_fix_dur*1e-3, duration=f.duration-max_fix_dur)
                fix_adj.append(f)
            fix = pd.DataFrame(fix_adj, columns=fix.columns)
        if min_fix_dur is not None:
            fix = fix.loc[fix.duration >= min_fix_dur, :]
            fix.index = np.arange(len(fix))

        if gaze_data is not None:
            gaze_raw = [gaze_data.loc[np.logical_and(gaze_data.timestamp.values >= r.start_timestamp,
                                                                       gaze_data.timestamp.values <= r.start_timestamp + .001*r.duration), ['timestamp', 'confidence', 'x','y']]
                        for r in fix.itertuples()]
            m_x = [ np.mean( raw.x ) for raw in gaze_raw ]
            m_y = [ np.mean( raw.y ) for raw in gaze_raw ]
            fix = fix.assign(x=m_x, y=m_y)
        else:
            gaze_raw = [pd.DataFrame()] * len(fix)
        fix.index.name = 'id'
        return fix, gaze_raw

    def get_fixations(self, eyes=None, world=None, ts=None, dt=None, gaze_data=None, min_fix_dur=100, max_fix_dur=1000):
        if ts is None and dt is None and gaze_data is not None:
            ts = gaze_data.timestamp.values
        labels, _ = self.predict(eyes=eyes, world=world, ts=ts, dt=dt)
        return EyeClassifier.get_fixations_from_labels(labels, gaze_data, min_fix_dur, max_fix_dur)