Use player stats for the episode score in DQN instead of summing rewards

208de18c · Yuxin Wu · 5fd47e6d · 208de18c
Commit 208de18c authored May 29, 2016 by Yuxin Wu
Show whitespace changes
Inline Side-by-side

Showing 1 changed file with 3 additions and 3 deletions

examples/Atari2600/DQN.py examples/Atari2600/DQN.py +3 -3

No files found.
--- a/examples/Atari2600/DQN.py
+++ b/examples/Atari2600/DQN.py
@@ -136,7 +136,6 @@ def current_predictor(state):
    return pred[0]

 def play_one_episode(player, func, verbose=False):
-    tot_reward = 0
    while True:
        s = player.current_state()
        outputs = func([[s]])
@@ -149,9 +148,10 @@ def play_one_episode(player, func, verbose=False):
        if verbose:
            print(act)
        reward, isOver = player.action(act)
-        tot_reward += reward
        if isOver:
-            return tot_reward
+            sc = player.stats['score'][0]
+            player.reset_stat()
+            return sc

 def play_model(model_path):
    player = PreventStuckPlayer(HistoryFramePlayer(get_player(0.01), FRAME_HISTORY), 30, 1)