Source code for moe.tests.bandit.ucb.ucb1_tuned_test

# -*- coding: utf-8 -*-
"""Test UCB1-tuned bandit implementation.

Test default values with one, two, and three arms.
Test different cases including unsampled arms and multiple winners.

"""
from moe.bandit.ucb.ucb1_tuned import UCB1Tuned
from moe.tests.bandit.ucb.ucb_test_case import UCBTestCase


[docs]class TestUCB1Tuned(UCBTestCase):

    """Verify that different historical infos return correct results."""

    bandit_class = UCB1Tuned

[docs]    def test_init_default(self):
        """Verify that default values do not throw and error. This is purely an integration test."""
        self._test_init_default()

[docs]    def test_one_arm(self):
        """Check that the one-arm case always returns the given arm as the winning arm and the allocation is 1.0."""
        bandit = self.bandit_class(self.one_arm_test_case)
        self._test_one_arm(bandit)

[docs]    def test_two_unsampled_arms(self):
        """Check that the two-unsampled-arms case always allocate each arm equally (the allocation is 0.5 for both arms). This tests num_unsampled_arms == num_arms > 1."""
        self._test_two_unsampled_arms()

[docs]    def test_three_arms_one_unsampled_arm(self):
        """Check that the three-arms cases with integer and float payoffs return the expected arm allocations. When arm3 is the only unsampled arm, we expect all allocation is given to arm3."""
        self._test_three_arms_one_unsampled_arm()

[docs]    def test_three_arms_two_winners(self):
        """Check that the three-arms cases with two winners return the expected arm allocations. This tests num_arms > num_winning_arms > 1."""
        self._test_three_arms_two_winners()

[docs]    def test_three_arms_diferent_variance(self):
        """Check that the three-arms cases with different variance (same average payoff) return the expected arm allocations. The highest variance wins."""
        bandit = self.bandit_class(self.three_arms_with_variance_no_unsampled_arm_test_case)
        assert bandit.allocate_arms() == {"arm1": 1.0, "arm2": 0.0, "arm3": 0.0}