Commit f6ede612 authored by Yuxin Wu

Better BatchNorm (with ema_update option decoupled from training)

parent 4a46b93d
@@ -169,8 +169,8 @@ class SeparateGANTrainer(TowerTrainer):
         # Build the graph
         self.tower_func = TowerFuncWrapper(model.build_graph, model.get_input_signature())
         with TowerContext('', is_training=True), \
-                argscope(BatchNorm, internal_update=True):
-            # should not hook the updates to both train_op, it will hurt training speed.
+                argscope(BatchNorm, ema_update='internal'):
+            # should not hook the EMA updates to both train_op, it will hurt training speed.
             self.tower_func(*input.get_input_tensors())
         update_ops = tf.get_collection(tf.GraphKeys.UPDATE_OPS)
         if len(update_ops):
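For context, a minimal sketch of how the renamed option is meant to be used, assuming tensorpack's post-commit API where BatchNorm takes an ema_update argument (reportedly one of 'default', 'collection', 'internal', 'skip') instead of the old internal_update=True/False flag. The build_discriminator function, the Conv2D layer, and the variable names are illustrative, not part of this commit:

    # Sketch only: assumes the ema_update option introduced by this commit.
    from tensorpack.models import BatchNorm, Conv2D
    from tensorpack.tfutils import argscope
    from tensorpack.tfutils.tower import TowerContext

    def build_discriminator(image):
        # 'internal' applies the EMA update ops inside the layer's forward pass,
        # so nothing is added to tf.GraphKeys.UPDATE_OPS and the EMA updates are
        # not hooked onto every train_op (the situation the diff above avoids).
        with TowerContext('', is_training=True), \
                argscope(BatchNorm, ema_update='internal'):
            x = Conv2D('conv0', image, 64, 3)
            x = BatchNorm('bn0', x)
            return x

The point of the commit message is that the EMA update policy is now chosen explicitly per layer (or via argscope) rather than being implied by the training flag.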