k-armed-bandit/random__walk_8py_source.html

import numpy

from bandit import Normal


class RandomWalk(Normal):
    """
    A non-stationary k-armed bandit whose arm means perform a random walk.

    Rewards for each of the k arms are drawn from normal distributions. The
    means are initially drawn from the uniform range [-1, 1). After every
    call to ``select`` the mean of every arm is perturbed by an independent
    sample from a normal distribution with mean 0 and standard deviation
    0.01, so the best arm can change over time.
    """

    def __init__(self, k: int) -> None:
        """
        Construct the bandit.

        All set-up is delegated to the parent class.

        :param k: The number of arms this bandit has.
        """
        super().__init__(k)

    def select(self, index):
        """
        Select one or several arms to obtain a reward from.

        The reward is produced by the parent class using the current means;
        only afterwards are the means of all arms (not just the selected
        ones) advanced by one random-walk step.

        :param index: The arm or arms to pull; passed through unchanged to
            the parent class' ``select``.
        :return: Whatever the parent class' ``select`` returns for ``index``.
        """
        outcome = super().select(index)

        # One independent N(0, 0.01) increment per arm. The update is done
        # in place so the existing means container keeps its identity.
        drift = numpy.random.normal(0.0, 0.01, self.k)
        self._mean += drift

        return outcome


bandit.base_bandit.BaseBandit.k
int k(self)
Return the number of arms this bandit has.
Definition base_bandit.py:26

bandit.normal.Normal
This bandit draws a reward from a set normal distribution each time an arm is chosen.
Definition normal.py:5

bandit.normal.Normal._mean
_mean
Definition normal.py:28

bandit.random_walk.RandomWalk
A random walk bandit.
Definition random_walk.py:5

bandit.random_walk.RandomWalk.__init__
None __init__(self, int k)
Construct the class.
Definition random_walk.py:17

bandit.random_walk.RandomWalk.select
select(self, index)
Select one or several arms to obtain a reward from.
Definition random_walk.py:20