Commit d0cb0ede authored by Yuxin Wu

[DQN] better dqn params

parent b7f10ccf
......@@ -38,7 +38,7 @@ METHOD = None
def get_player(viz=False, train=False):
env = AtariPlayer(ROM_FILE, frame_skip=ACTION_REPEAT, viz=viz,
-live_lost_as_eoe=train, max_num_frames=30000)
+live_lost_as_eoe=train, max_num_frames=60000)
env = FireResetEnv(env)
env = MapState(env, lambda im: cv2.resize(im, IMAGE_SIZE))
if not train:
......
......@@ -21,7 +21,7 @@ def play_one_episode(env, func, render=False):
Map from observation to action, with 0.001 greedy.
"""
act = func(s[None, :, :, :])[0][0].argmax()
-if random.random() < 0.001:
+if random.random() < 0.01:
spc = env.action_space
act = spc.sample()
return act
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment