Commit 07783edb authored by Yuxin Wu

Sync BatchNorm statistics with nccl or horovod

parent bffcfc1b
@@ -36,7 +36,6 @@ def get_bn_variables(n_out, use_scale, use_bias, gamma_init):
 def update_bn_ema(xn, batch_mean, batch_var,
                   moving_mean, moving_var, decay, internal_update):
-    # TODO is there a way to use zero_debias in multi-GPU?
     update_op1 = moving_averages.assign_moving_average(
         moving_mean, batch_mean, decay, zero_debias=False,
         name='mean_ema_op')
@@ -147,7 +146,6 @@ def BatchNorm(inputs, training=None, momentum=0.9, epsilon=1e-5,
                 mean=moving_mean, variance=moving_var, epsilon=epsilon,
                 data_format=data_format, is_training=False)
         else:
-            # avoid the reshape if possible (when channel is the last dimension)
             xn = tf.nn.batch_normalization(
                 inputs, moving_mean, moving_var, beta, gamma, epsilon)
...
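For context on what "sync statistics" means in this commit: each GPU computes the mean and variance of its own sub-batch, those moments are all-reduced (averaged) across workers, and every GPU then normalizes with the same global statistics. The sketch below illustrates this idea with Horovod; it is not the code added by this commit, and the helper name synced_batch_stats and the NHWC reduction axes are assumptions made for the example.

# Minimal sketch (illustration only, not this commit's implementation):
# average per-GPU batch moments across Horovod workers before normalizing.
import tensorflow as tf
import horovod.tensorflow as hvd


def synced_batch_stats(inputs, axes=(0, 1, 2)):
    # Local first and second moments of an NHWC input, one value per channel.
    local_mean = tf.reduce_mean(inputs, axis=axes)
    local_sq_mean = tf.reduce_mean(tf.square(inputs), axis=axes)

    # hvd.allreduce averages a tensor over all workers by default, so every
    # GPU ends up with the same global moments.
    global_mean = hvd.allreduce(local_mean)
    global_sq_mean = hvd.allreduce(local_sq_mean)

    # Var[x] = E[x^2] - (E[x])^2, computed from the globally averaged moments.
    global_var = global_sq_mean - tf.square(global_mean)
    return global_mean, global_var

The resulting global moments can then be passed to tf.nn.batch_normalization in place of per-GPU statistics, and used to update the moving averages as in update_bn_ema above.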