Refactored regret example

roycoding · roycoding · commit 7e2d36b1b673 · 2016-08-13T19:09:34.000-05:00
diff --git a/README.md b/README.md
@@ -72,36 +72,34 @@ import slots
 # Test multiple strategies for the same bandit probabilities
 probs = [0.4, 0.9, 0.8]
 
-ba = slots.MAB(probs=probs)
-bb = slots.MAB(probs=probs)
-bc = slots.MAB(probs=probs)
-bd = slots.MAB(probs=probs)
+strategies = [{'strategy': 'eps_greedy', 'regret': [],
+               'label': r'$\epsilon$-greedy ($\epsilon$=0.1)'},
+              {'strategy': 'softmax', 'regret': [],
+               'label': 'Softmax ($T$=0.1)'},
+              {'strategy': 'ucb', 'regret': [],
+               'label': 'UCB1'},
+              {'strategy': 'bayesian', 'regret': [],
+               'label': 'Bayesian bandit'},
+              ]
+
+for s in strategies:
+    s['mab'] = slots.MAB(probs=probs)
 
 # Run trials and calculate the regret after each trial
-rega = []
-regb = []
-regc = []
-regd = []
 for t in range(10000):
-    ba._run('eps_greedy')
-    rega.append(ba.regret())
-    bb._run('softmax')
-    regb.append(bb.regret())
-    bc._run('ucb')
-    regc.append(bc.regret())
-    bd._run('bayesian')
-    regd.append(bd.regret())
-
+    for s in strategies:
+        s['mab']._run(s['strategy'])
+        s['regret'].append(s['mab'].regret())
 
 # Pretty plotting
 sns.set_style('whitegrid')
 sns.set_context('poster')
 
 plt.figure(figsize=(15,4))
-plt.plot(rega, label='$\epsilon$-greedy ($\epsilon$=0.1)')
-plt.plot(regb, label='Softmax ($T$=0.1)')
-plt.plot(regc, label='UCB')
-plt.plot(regd, label='Bayesian Bandit')
+
+for s in strategies:
+    plt.plot(s['regret'], label=s['label'])
+
 plt.legend()
 plt.xlabel('Trials')
 plt.ylabel('Regret')
diff --git a/misc/regret_plot.png b/misc/regret_plot.png
diff --git a/setup.py b/setup.py
@@ -16,7 +16,7 @@
 setup(
     name='slots',
 
-    version='0.1.0',
+    version='0.2.0',
 
     description='A multi-armed bandit library for Python',
     long_description=long_description,