diff --git a/examples/ale/train_dqn_ale.py b/examples/ale/train_dqn_ale.py index 37b9f68b1..a992ec2e3 100644 --- a/examples/ale/train_dqn_ale.py +++ b/examples/ale/train_dqn_ale.py @@ -179,6 +179,11 @@ def make_env(test): links.to_factorized_noisy(q_func) # Turn off explorer explorer = explorers.Greedy() + else: + explorer = explorers.LinearDecayEpsilonGreedy( + 1.0, args.final_epsilon, + args.final_exploration_frames, + lambda: np.random.randint(n_actions)) # Draw the computational graph and save it in the output directory. chainerrl.misc.draw_computational_graph( @@ -202,11 +207,6 @@ def make_env(test): else: rbuf = replay_buffer.ReplayBuffer(10 ** 6, args.num_step_return) - explorer = explorers.LinearDecayEpsilonGreedy( - 1.0, args.final_epsilon, - args.final_exploration_frames, - lambda: np.random.randint(n_actions)) - def phi(x): # Feature extractor return np.asarray(x, dtype=np.float32) / 255