rename Bernoulli UCB to Bounded UCB (rlberry-py#345)

lgtm
BorisHamadej · Jul 24, 2023 · ab39abd · ab39abd
1 parent 8b6b98f
commit ab39abd
Showing 1 changed file with 7 additions and 3 deletions.
diff --git a/examples/demo_bandits/plot_TS_bandit.py b/examples/demo_bandits/plot_TS_bandit.py
@@ -4,6 +4,10 @@
 =========================================================================
 
 This script shows how to use Thompson sampling on two examples: Bernoulli and Gaussian bandits.
+
+In the Bernoulli case, we use Thompson sampling with a Beta prior. We compare it to a UCB for
+bounded rewards with support in [0,1].
+For the Gaussian case, we use a Gaussian prior and compare it to a sub-Gaussian UCB.
 """
 
 import numpy as np
@@ -36,10 +40,10 @@ def __init__(self, env, **kwargs):
         self.env = WriterWrapper(self.env, self.writer, write_scalar="action")
 
 
-class BernoulliUCBAgent(IndexAgent):
+class BoundedUCBAgent(IndexAgent):
     """UCB agent for bounded bandits"""
 
-    name = "Bernoulli UCB Agent"
+    name = "Bounded UCB Agent"
 
     def __init__(self, env, **kwargs):
         index, _ = makeBoundedUCBIndex(0, 1)
@@ -65,7 +69,7 @@ def __init__(self, env, **kwargs):
         fit_budget=T,
         n_fit=M,
     )
-    for Agent in [BernoulliUCBAgent, BernoulliTSAgent]
+    for Agent in [BoundedUCBAgent, BernoulliTSAgent]
 ]
 
 # Agent training