-
Notifications
You must be signed in to change notification settings - Fork 2
Expand file tree
/
Copy pathepsilonGreedySelection.ts
More file actions
61 lines (49 loc) · 2.01 KB
/
epsilonGreedySelection.ts
File metadata and controls
61 lines (49 loc) · 2.01 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
import type { Test, Variant } from '../../shared/types';
import { putMetric } from '../utils/cloudwatch';
import { logError } from '../utils/logging';
import type { BanditData } from './banditData';
import { filterValidVariants, selectRandomVariant } from './helpers';
/**
* In general we select the best known variant, except with probability 'epsilon' when we select at random.
* https://en.wikipedia.org/wiki/Multi-armed_bandit#Semi-uniform_strategies
*/
export function selectVariantWithHighestMean<V extends Variant, T extends Test<V>>(
testBanditData: BanditData,
test: T,
): V | undefined {
const sortedVariants = filterValidVariants(testBanditData.sortedVariants, test);
// variants array is sorted by mean, use just the best variants
const bestMean = sortedVariants[0].mean;
const bestVariants = sortedVariants.findIndex((variant) => variant.mean < bestMean);
if (bestVariants === -1) {
// all variants are tied
return selectRandomVariant(test);
}
const variant =
bestVariants < 2
? sortedVariants[0]
: sortedVariants[Math.floor(Math.random() * bestVariants)]; // more than 1
return test.variants.find((v) => v.name === variant.variantName);
}
export function selectVariantUsingEpsilonGreedy<V extends Variant, T extends Test<V>>(
test: T,
epsilon: number,
testBanditData?: BanditData,
): V | undefined {
if (!testBanditData) {
// We don't yet have bandit data for this test, select a random variant
return selectRandomVariant(test);
}
// Choose at random with probability epsilon
const random = Math.random();
if (epsilon > random) {
return selectRandomVariant(test);
}
const highestMeanVariantData = selectVariantWithHighestMean<V, T>(testBanditData, test);
if (!highestMeanVariantData) {
logError(`Failed to select best variant for bandit test: ${test.name}`);
putMetric('bandit-selection-error');
return;
}
return highestMeanVariantData;
}