# k-armed-bandit: test_random.py (recovered from the generated listing test__random_8py_source.html)

from bandit import RandomWalk

import numpy

import unittest


class TestRandomWalkBandit(unittest.TestCase):
    """
    Unit tests for the random-walk variant of the bandit.

    Per the original author's note, RandomWalk inherits from Normal (that
    relationship is not visible in this file), so the only behaviour checked
    here is the part that differs: the arm means reported by trueValues()
    should drift as select() is called.
    """

    def test_mean_change(self):
        """
        Check that the reported means move at least once across many pulls.

        A 100-armed RandomWalk bandit is built and arm 0 is selected 100
        times. After every pull the means returned by trueValues() are
        compared with a snapshot taken just before that pull. The walk is
        random, so no particular value is expected; the test passes as soon
        as any one comparison shows a difference.
        """
        arm_count = 100
        walker = RandomWalk(arm_count)

        # Snapshot a copy so the comparison cannot be defeated if the bandit
        # hands back the same array object on every call.
        current, _ = walker.trueValues()
        snapshot = numpy.copy(current)

        drift_seen = False
        for _pull in range(100):
            # The reward itself is irrelevant; only the call matters here.
            walker.select(0)
            current, _ = walker.trueValues()

            if not numpy.array_equal(snapshot, current):
                drift_seen = True

            # Always compare against the immediately preceding state.
            snapshot = numpy.copy(current)

        self.assertTrue(drift_seen)


# Cross-references from the generated documentation:
#
# bandit.random_walk.RandomWalk
#     A random walk bandit.
#     Definition: random_walk.py:5
#
# bandit.tests.test_random.TestRandomWalkBandit
#     Tests the implementation of a bandit with random walk on the distributions.
#     Definition: test_random.py:6
#
# bandit.tests.test_random.TestRandomWalkBandit.test_mean_change
#     test_mean_change(self)
#     Test that means change over time.
#     Definition: test_random.py:14