-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathideal_observer_stats.m
More file actions
323 lines (276 loc) · 13.6 KB
/
ideal_observer_stats.m
File metadata and controls
323 lines (276 loc) · 13.6 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
function [acc, dprime, counts, thresh_info] = ideal_observer_stats(c1_values, c2_values, opts)
% Find maximum accuracy for decoding any 2 classes based on 1-dimensional values.
% If values are matrices, operates along the 2nd dimension (independently for each row).
% Data can be passed in 2 different ways:
% - As a single matrix, with the boolean row vector or matrix is_class1 giving the class of each
%   column (if a matrix, different rows can have different classes);
% - As 2 matrices c1_values and c2_values with the same number of rows.
% If weighted is true, weight to correct for bias in number of class 1 vs class 2 values.
% If weights is provided, it should be the same size as values (or [c1_values, c2_values]).
% This overrides "weighted" in giving the weight for each sample and is not
% further corrected for any nans in the data, except weights of nan values are set to 0 when
% computing total weights. (Appropriate weights taking nans into account can be generated using
% concat_and_weight_data.)
% If directed is true, assumes that the values are greater for class 1 than class 2;
% otherwise the direction is determined from the data.
%
% Thresholds directly on (rather than between) the values are also considered, with an expected
% success rate of 0.5 * the number of tied samples with that value.
%
% When multiple thresholds have the best accuracy, the difference between the class 1 and class 2
% accuracy is used as a tiebreaker (to minimize bias towards one class or the other). The same is
% true when considering positive vs. negative thresholds. If there is still a tie, the threshold is
% chosen at random among the candidates.
%
% counts contains the following additional info:
%   n_c1, n_c2: number of non-nan values in each class for each row
%   n_correct_c1, n_correct_c2: number of correctly-classified values in each class for each row
% If weighted is true, acc = ((n_correct_c1 / n_c1) + (n_correct_c2 / n_c2)) / 2.
% Otherwise, acc = (n_correct_c1 + n_correct_c2) / (n_c1 + n_c2).
%
% thresh_info contains the following additional info:
%   thresh: best threshold value for each row (can be -inf or inf)
%   b_invert: boolean indicating whether the best accuracy is obtained by classifying values
%             > the threshold as c2 (all false if directed is true).
%
% NOTE(review): dprime uses norminv, which requires the Statistics and Machine
% Learning Toolbox - confirm it is available in the target environment.
arguments
    c1_values (:,:) double
    c2_values (:,:) double = [];
    opts.is_class1 (:,:) logical = logical.empty(0,0)
    opts.weighted (1,1) logical = false
    opts.directed (1,1) logical = false
    opts.weights double = [] % manual weights matrix, overrides opts.weighted
end
nrow = size(c1_values, 1);
% Normalize the two input conventions into a single values matrix plus a
% ground-truth class-1 mask (gt_c1) of the same size.
if all(size(opts.is_class1) == 0) % c2_values provided (or whole matrix is empty)
    assert(size(c2_values, 1) == nrow, 'Number of rows must match between class 1 and 2');
    values = [c1_values, c2_values];
    gt_c1 = [true(size(c1_values)), false(size(c2_values))];
else
    assert(all(size(c2_values) == 0), 'Cannot pass both c2_values and is_class1');
    values = c1_values;
    if ~isequal(size(values), size(opts.is_class1))
        if isvector(opts.is_class1) && length(opts.is_class1) == size(values, 2)
            % vector mask applies to all rows - expand it to a full matrix
            gt_c1 = repmat(opts.is_class1(:)', nrow, 1);
        else
            error('Size of is_class1 must match values, or be a vector with the same # of columns');
        end
    else
        gt_c1 = opts.is_class1;
    end
end
maxobs = size(values, 2); % total columns per row, including NaN entries
% number of actual data points to consider (non-NaN)
n1 = sum(~isnan(values) & gt_c1, 2);
n2 = sum(~isnan(values) & ~gt_c1, 2);
n = n1 + n2;
counts = struct;
counts.n_c1 = n1;
counts.n_c2 = n2;
% Degenerate case: no rows at all - return correctly-shaped empty outputs.
if nrow == 0
    acc = zeros(0, 1);
    dprime = zeros(0, 1);
    counts.n_correct_c1 = zeros(0, 1);
    counts.n_correct_c2 = zeros(0, 1);
    thresh_info = struct('thresh', zeros(0, 1), 'b_invert', logical.empty(0, 1));
    return;
end
% make weights for each sample
if size(opts.weights, 1) > 0
    assert(isequal(size(opts.weights), size(values)), 'weights must have same size as values');
    weights = opts.weights;
else
    if opts.weighted
        % make weights matrix that weights classes inversely to their prevalence (for each row)
        weights = zeros(nrow, maxobs);
        [row_ind_c1, ~] = find(gt_c1);
        weights(gt_c1) = n2(row_ind_c1); % instead of 1 ./ n1 - avoid small floating point errors
        [row_ind_c2, ~] = find(~gt_c1);
        weights(~gt_c1) = n1(row_ind_c2);
    else
        weights = ones(nrow, maxobs);
    end
end
weights(isnan(values)) = 0; % NaN samples contribute nothing to totals
% obtain a boolean matrix of whether each observation is in class 1,
% sorted by observation value for each row independently
% NaNs go at the end and won't be considered (masked by b_valid)
[sorted_values, sortorder] = sort(values, 2, MissingPlacement="last");
% convert the per-row sort order into linear indices so gt_c1 and weights
% can be permuted into the same sorted order as sorted_values
inds = sub2ind(size(gt_c1), repmat((1:nrow)', 1, maxobs), sortorder);
gt_c1 = gt_c1(inds);
b_valid = (1:maxobs) <= n; % matrix same size as gt_c1
% sort the weights as well
weights = weights(inds);
% TODO fix the rest of this by accumulating weighted n wrong
% scalar best values for each row
min_w_wrong = inf(nrow, 1);  % best (lowest) weighted error seen so far, per row
min_acc_diff = ones(nrow, 1); % tiebreaker: |c1 error rate - c2 error rate| of current best
all_best = struct(...
    ... 1xn arrays for each best threshold
    'switch_inds', repmat({zeros(1,0)}, nrow, 1), ...
    'thresholds', repmat({zeros(1,0)}, nrow, 1), ...
    'n_wrong_c1', repmat({zeros(1,0)}, nrow, 1), ...
    'n_wrong_c2', repmat({zeros(1,0)}, nrow, 1), ...
    'b_invert', repmat({logical.empty(1,0)}, nrow, 1));
    function update_improved_rows(row_inds, n_wrong_c1, n_wrong_c2, w_wrong, switch_inds, thresholds, b_invert)
        % test whether the rows at row_inds are improved given n_wrong values
        % and update min_w_wrong, min_acc_diff, and all_best for improved and tied rows.
        % Nested function: mutates min_w_wrong, min_acc_diff, and all_best in the
        % parent workspace. A strictly lower w_wrong replaces a row's candidate list;
        % an exact tie on w_wrong AND on the acc_diff tiebreaker appends to it.
        row_inds = reshape(row_inds, 1, []);
        these_w_wrong = w_wrong(row_inds, 1);
        % tiebreaker metric: absolute difference between per-class error rates
        acc_diff = abs(n_wrong_c1(row_inds, 1) ./ n1(row_inds, 1) - n_wrong_c2(row_inds, 1) ./ n2(row_inds, 1));
        b_improve = false(length(row_inds), 1);
        b_tie = false(length(row_inds), 1);
        b_worse_w = these_w_wrong > min_w_wrong(row_inds, 1);
        if all(b_worse_w)
            return % nothing to update - every candidate row is strictly worse
        end
        b_tie_w = these_w_wrong == min_w_wrong(row_inds, 1);
        if any(b_tie_w)
            % equal weighted error: resolve with the class-balance tiebreaker
            acc_diff_tie = acc_diff(b_tie_w);
            b_tie(b_tie_w) = acc_diff_tie == min_acc_diff(row_inds(b_tie_w), 1);
            b_improve(b_tie_w) = acc_diff_tie < min_acc_diff(row_inds(b_tie_w), 1);
        end
        b_improve(these_w_wrong < min_w_wrong(row_inds, 1)) = true;
        % update minima
        min_w_wrong(row_inds(b_improve)) = these_w_wrong(b_improve);
        min_acc_diff(row_inds(b_improve)) = acc_diff(b_improve);
        % update all_best for improved and tied rows
        if isscalar(switch_inds)
            % broadcast a scalar switch index (same kT for every row) to all rows
            switch_inds = repmat(switch_inds, nrow, 1);
        end
        for kR = row_inds(b_improve)
            % strict improvement: restart this row's candidate list
            all_best(kR).switch_inds = switch_inds(kR);
            all_best(kR).thresholds = thresholds(kR);
            all_best(kR).n_wrong_c1 = n_wrong_c1(kR);
            all_best(kR).n_wrong_c2 = n_wrong_c2(kR);
            all_best(kR).b_invert = b_invert;
        end
        for kR = row_inds(b_tie)
            % full tie: append to the candidate list for later random selection
            all_best(kR).switch_inds(1, end+1) = switch_inds(kR);
            all_best(kR).thresholds(1, end+1) = thresholds(kR);
            all_best(kR).n_wrong_c1(1, end+1) = n_wrong_c1(kR);
            all_best(kR).n_wrong_c2(1, end+1) = n_wrong_c2(kR);
            all_best(kR).b_invert(1, end+1) = b_invert;
        end
    end
% start by categorizing all as class 1
% slightly hacky method, keep track of best case for positive and negative threshold
% simultaneously and resolve for each row at the end
% w = "weighted number"
n_wrong_c1_pos = zeros(nrow, 1);
n_wrong_c2_pos = n2;
w_wrong_pos = sum(weights .* ~gt_c1, 2);
% same but if we put the threshold on the value
% (resets to the between-value threshold value when not in the middle of a tie)
n_wrong_c1_pos_onval = n_wrong_c1_pos;
n_wrong_c2_pos_onval = n_wrong_c2_pos;
w_wrong_pos_onval = w_wrong_pos;
kT_onval = zeros(nrow, 1);
% as a special case, if sum of weights is 0, set threshold to nan rather than -inf
start_thresh = nan(nrow, 1);
start_thresh(sum(weights, 2) > 0) = -inf;
update_improved_rows(1:nrow, n_wrong_c1_pos, n_wrong_c2_pos, w_wrong_pos, ...
    zeros(nrow, 1), start_thresh, false);
if ~opts.directed
    % if we categorize them all as class 2 (negative threshold)
    n_wrong_c1_neg = n1;
    n_wrong_c2_neg = zeros(nrow, 1);
    w_wrong_neg = sum(weights .* gt_c1, 2);
    n_wrong_c1_neg_onval = n_wrong_c1_neg;
    n_wrong_c2_neg_onval = n_wrong_c2_neg;
    w_wrong_neg_onval = w_wrong_neg;
    update_improved_rows(1:nrow, n_wrong_c1_neg, n_wrong_c2_neg, w_wrong_neg, ...
        zeros(nrow, 1), start_thresh, true);
end
% Sweep the threshold left-to-right across the sorted values, updating the
% wrong counts incrementally (O(1) per step per row).
for kT = 1:maxobs
    % if we have a tie with the next value, still update n_wrong but don't consider updating
    % all_best until all identical values have been considered
    if kT == maxobs
        istie = false(nrow, 1);
    else
        istie = kT < n & sorted_values(:, kT) == sorted_values(:, kT + 1);
    end
    b_update = ~istie & b_valid(:, kT);
    update_inds = reshape(find(b_update), [], 1); % handle empty array correctly
    % onval switch index advances by half-steps: a threshold on a value sits
    % "between" the integer switch indices on either side of it
    kT_onval = kT_onval + 0.5;
    % compute past-value thresholds
    thresholds = inf(nrow, 1);
    if any(kT < n) % needed to guard against out-of-bounds indexing
        % midpoint between this value and the next (per row still in range)
        thresholds(kT < n) = mean(sorted_values(kT < n, [kT, kT+1]), 2);
    end
    % what changes by categorizing this one as class 2
    was_c1 = b_valid(:, kT) & gt_c1(:, kT);
    was_c2 = b_valid(:, kT) & ~gt_c1(:, kT);
    n_wrong_c1_pos(was_c1) = n_wrong_c1_pos(was_c1) + 1;
    w_wrong_pos(was_c1) = w_wrong_pos(was_c1) + weights(was_c1, kT);
    n_wrong_c2_pos(was_c2) = n_wrong_c2_pos(was_c2) - 1;
    w_wrong_pos(was_c2) = w_wrong_pos(was_c2) - weights(was_c2, kT);
    % also consider putting the threshold directly on this value
    % (tied samples at the threshold count as half right, half wrong)
    n_wrong_c1_pos_onval(was_c1) = n_wrong_c1_pos_onval(was_c1) + 0.5;
    w_wrong_pos_onval(was_c1) = w_wrong_pos_onval(was_c1) + 0.5 .* weights(was_c1, kT);
    n_wrong_c2_pos_onval(was_c2) = n_wrong_c2_pos_onval(was_c2) - 0.5;
    w_wrong_pos_onval(was_c2) = w_wrong_pos_onval(was_c2) - 0.5 .* weights(was_c2, kT);
    % update all_best
    if any(b_update)
        update_improved_rows(update_inds, n_wrong_c1_pos, n_wrong_c2_pos, w_wrong_pos, kT, thresholds, false);
        update_improved_rows(update_inds, n_wrong_c1_pos_onval, n_wrong_c2_pos_onval, w_wrong_pos_onval, ...
            kT_onval, sorted_values(:, kT), false);
    end
    if ~opts.directed
        % try negative classifier
        % what changes by categorizing this one as class 1
        n_wrong_c2_neg(was_c2) = n_wrong_c2_neg(was_c2) + 1;
        w_wrong_neg(was_c2) = w_wrong_neg(was_c2) + weights(was_c2, kT);
        n_wrong_c1_neg(was_c1) = n_wrong_c1_neg(was_c1) - 1;
        w_wrong_neg(was_c1) = w_wrong_neg(was_c1) - weights(was_c1, kT);
        % consider putting the threshold directly on value
        n_wrong_c2_neg_onval(was_c2) = n_wrong_c2_neg_onval(was_c2) + 0.5;
        w_wrong_neg_onval(was_c2) = w_wrong_neg_onval(was_c2) + 0.5 .* weights(was_c2, kT);
        n_wrong_c1_neg_onval(was_c1) = n_wrong_c1_neg_onval(was_c1) - 0.5;
        w_wrong_neg_onval(was_c1) = w_wrong_neg_onval(was_c1) - 0.5 .* weights(was_c1, kT);
        if any(b_update)
            update_improved_rows(update_inds, n_wrong_c1_neg, n_wrong_c2_neg, w_wrong_neg, kT, thresholds, true);
            update_improved_rows(update_inds, n_wrong_c1_neg_onval, n_wrong_c2_neg_onval, w_wrong_neg_onval, ...
                kT_onval, sorted_values(:, kT), true);
        end
    end
    % reset onval counts for valid values that are not ties
    kT_onval(~istie) = kT;
    n_wrong_c1_pos_onval(~istie) = n_wrong_c1_pos(~istie);
    n_wrong_c2_pos_onval(~istie) = n_wrong_c2_pos(~istie);
    w_wrong_pos_onval(~istie) = w_wrong_pos(~istie);
    if ~opts.directed
        n_wrong_c1_neg_onval(~istie) = n_wrong_c1_neg(~istie);
        n_wrong_c2_neg_onval(~istie) = n_wrong_c2_neg(~istie);
        w_wrong_neg_onval(~istie) = w_wrong_neg(~istie);
    end
end
% select results - if there are ties, randomly select among them.
% (rand is on the open interval (0,1), so ceil(rand * n_found) is in 1..n_found)
n_found = arrayfun(@(s_best) numel(s_best.thresholds), all_best);
ind_to_take = ceil(rand(nrow, 1) .* n_found);
best_switch = arrayfun(@(s_best, ind) s_best.switch_inds(ind), all_best, ind_to_take);
best_thresh = arrayfun(@(s_best, ind) s_best.thresholds(ind), all_best, ind_to_take);
best_n_wrong_c1 = arrayfun(@(s_best, ind) s_best.n_wrong_c1(ind), all_best, ind_to_take);
best_n_wrong_c2 = arrayfun(@(s_best, ind) s_best.n_wrong_c2(ind), all_best, ind_to_take);
b_invert = arrayfun(@(s_best, ind) s_best.b_invert(ind), all_best, ind_to_take);
acc = 1 - min_w_wrong ./ sum(weights, 2);
counts.n_correct_c1 = counts.n_c1 - best_n_wrong_c1;
counts.n_correct_c2 = counts.n_c2 - best_n_wrong_c2;
% compute sensitivity as well, using RMS SD (conservative estimate)
% With b_invert, class 1 lies below the switch index; otherwise above it.
best_n1 = zeros(nrow, 1);
n_hits = zeros(nrow, 1);
best_n1(b_invert) = best_switch(b_invert);
best_n1(~b_invert) = n(~b_invert) - best_switch(~b_invert);
n_hits(b_invert) = sum(gt_c1(b_invert, :) & b_valid(b_invert, :) & (1:maxobs) <= best_switch(b_invert, :), 2);
n_hits(~b_invert) = sum(gt_c1(~b_invert, :) & b_valid(~b_invert, :) & (1:maxobs) > best_switch(~b_invert, :), 2);
n_fa = best_n1 - n_hits; % false alarms = samples called class 1 that were not hits
hit_rate = n_hits ./ n1;
fa_rate = n_fa ./ n2;
% norminv (Statistics Toolbox) maps rates to z-scores; a rate of exactly 0 or 1
% yields -inf/inf and thus a non-finite dprime for that row
z_hit = norminv(hit_rate);
z_fa = norminv(fa_rate);
sd_c1 = arrayfun(@(kR) std(values(kR, gt_c1(kR, :)), "omitmissing"), (1:nrow)');
sd_c2 = arrayfun(@(kR) std(values(kR, ~gt_c1(kR, :)), "omitmissing"), (1:nrow)');
% unequal-variance d': scale each z by its own class SD, normalize by RMS SD
mean_diff = sd_c1 .* z_hit - sd_c2 .* z_fa;
rms_sd = sqrt((sd_c1.^2 + sd_c2.^2) ./ 2);
dprime = mean_diff ./ rms_sd;
thresh_info = struct('thresh', best_thresh, 'b_invert', b_invert);
end