|
k-Armed Bandit 1.0.0
A collection of k-armed bandits and assoicated agents for reinforcement learning
|
Variables | |
| int | K = 10 |
| int | N = 2000 |
| int | M = 1000 |
| list | bandits = [] |
| single_bandit = bandit.Normal(k=K) | |
| list | agents |
| list | agent_names |
| rewards = numpy.zeros(shape=(len(agents), N, M), dtype=numpy.float) | |
| _table | |
| a | |
| float | cumulative_mean_reward = 0.0 |
| action = test_agent.act() | |
| list | reward = bandits[n].select(index=action) |
| mean_rewards = numpy.mean(a=rewards, axis=1) | |
|
protected |
Definition at line 45 of file analysis.py.
| analysis.a |
Definition at line 45 of file analysis.py.
| analysis.action = test_agent.act() |
Definition at line 49 of file analysis.py.
| list analysis.agent_names |
Definition at line 33 of file analysis.py.
| list analysis.agents |
Definition at line 28 of file analysis.py.
| list analysis.bandits = [] |
Definition at line 24 of file analysis.py.
| float analysis.cumulative_mean_reward = 0.0 |
Definition at line 46 of file analysis.py.
| int analysis.K = 10 |
Definition at line 17 of file analysis.py.
| int analysis.M = 1000 |
Definition at line 21 of file analysis.py.
Definition at line 58 of file analysis.py.
| int analysis.N = 2000 |
Definition at line 19 of file analysis.py.
Definition at line 50 of file analysis.py.
Definition at line 39 of file analysis.py.
| analysis.single_bandit = bandit.Normal(k=K) |
Definition at line 26 of file analysis.py.