We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 0c88fd1 commit 57a325e Copy full SHA for 57a325e
notebooks/Chapter02_Ten_Armed_Testbed.jl
@@ -98,16 +98,14 @@ function bandit_testbed(
98
env = MultiArmBanditsEnv(;true_reward=true_reward)
99
agent = Agent(
100
policy=QBasedPolicy(
101
- learner = TDLearner(
+ learner = MonteCarloLearner(
102
approximator = TabularQApproximator(
103
n_state=length(state_space(env)),
104
n_action=length(action_space(env)),
105
init=init,
106
opt = opt
107
),
108
- γ = 1.0,
109
- method=:SARSA,
110
- n = 0,
+ γ = 1.0
111
112
explorer = explorer
113
0 commit comments