Remove non-negativity restriction from beta

emdgroup · Feb 18, 2025 · 6d1e22b · 6d1e22b
1 parent 949b897
commit 6d1e22b
Show file tree

Hide file tree

Showing 3 changed files with 13 additions and 16 deletions.
diff --git a/CHANGELOG.md b/CHANGELOG.md
@@ -20,6 +20,7 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
 ## [0.12.2] - 2025-01-31
 ### Changed
 - More robust settings for the GP fitting
+- The `beta` parameter of `UCB` and `qUCB` can now also take negative values
 
 ## [0.12.1] - 2025-01-29
 ### Changed

diff --git a/baybe/acquisition/acqfs.py b/baybe/acquisition/acqfs.py
@@ -14,10 +14,8 @@
 from baybe.acquisition.base import AcquisitionFunction
 from baybe.searchspace import SearchSpace
 from baybe.utils.basic import classproperty
-from baybe.utils.sampling_algorithms import (
-    DiscreteSamplingMethod,
-    sample_numerical_df,
-)
+from baybe.utils.sampling_algorithms import DiscreteSamplingMethod, sample_numerical_df
+from baybe.utils.validation import finite_float
 
 
 ########################################################################################
@@ -267,9 +265,12 @@ class UpperConfidenceBound(AcquisitionFunction):
-    beta: float = field(converter=float, validator=ge(0.0), default=0.2)
+    beta: float = field(converter=float, validator=finite_float, default=0.2)
     """Trade-off parameter for mean and variance.
 
-    A value of zero makes the acquisition mechanism consider the posterior predictive
-    mean only, resulting in pure exploitation. Higher values shift the focus more and
-    more toward exploration.
+    * A value of zero makes the acquisition mechanism consider the posterior predictive
+      mean only, resulting in risk-neutral behavior.
+    * Values larger than zero induce risk-seeking behavior, shifting the focus
+      more and more toward exploration.
+    * Values smaller than zero lead to favoring risk-averse decisions (a.k.a. "safe
+      bets"), with purely exploitative behavior in the limit.
     """
 
 
@@ -279,13 +280,8 @@ class qUpperConfidenceBound(AcquisitionFunction):
 
     abbreviation: ClassVar[str] = "qUCB"
 
-    beta: float = field(converter=float, validator=ge(0.0), default=0.2)
-    """Trade-off parameter for mean and variance.
-
-    A value of zero makes the acquisition mechanism consider the posterior predictive
-    mean only, resulting in pure exploitation. Higher values shift the focus more and
-    more toward exploration.
-    """
+    beta: float = field(converter=float, validator=finite_float, default=0.2)
+    """See :paramref:`UpperConfidenceBound.beta`."""
 
 
 @define(frozen=True)

diff --git a/tests/hypothesis_strategies/acquisition.py b/tests/hypothesis_strategies/acquisition.py
@@ -49,14 +49,14 @@ def _qNIPV_strategy(draw: st.DrawFn):
 acquisition_functions = st.one_of(
     st.builds(ExpectedImprovement),
     st.builds(ProbabilityOfImprovement),
-    st.builds(UpperConfidenceBound, beta=finite_floats(min_value=0.0)),
+    st.builds(UpperConfidenceBound, beta=finite_floats()),
     st.builds(PosteriorMean),
     st.builds(PosteriorStandardDeviation, maximize=st.sampled_from([True, False])),
     st.builds(qPosteriorStandardDeviation),
     st.builds(LogExpectedImprovement),
     st.builds(qExpectedImprovement),
     st.builds(qProbabilityOfImprovement),
-    st.builds(qUpperConfidenceBound, beta=finite_floats(min_value=0.0)),
+    st.builds(qUpperConfidenceBound, beta=finite_floats()),
     st.builds(qSimpleRegret),
     st.builds(qLogExpectedImprovement),
     st.builds(