fix colocation problems

c5e05d7a · Yuxin Wu · 5d529d03 · c5e05d7a · c5e05d7a · c5e05d7a
Commit c5e05d7a authored Sep 16, 2017 by Yuxin Wu
Showing with 6 additions and 4 deletions

tensorpack/models/regularize.py +3 -1

tensorpack/tfutils/gradproc.py +1 -2

tensorpack/tfutils/summary.py +2 -1

No files found.
--- a/tensorpack/models/regularize.py
+++ b/tensorpack/models/regularize.py
@@ -47,12 +47,14 @@ def regularize_cost(regex, func, name='regularize_cost'):
    # If vars are replicated, only regularize those in the current tower
    params = ctx.filter_vars_by_vs_name(params)
+    G = tf.get_default_graph()
    with tf.name_scope('regularize_cost'):
        costs = []
        for p in params:
            para_name = p.name
            if re.search(regex, para_name):
-                costs.append(func(p))
+                with G.colocate_with(p):
+                    costs.append(func(p))
                _log_regularizer(para_name)
        if not costs:
            return tf.constant(0, dtype=tf.float32, name='empty_' + name)

--- a/tensorpack/tfutils/gradproc.py
+++ b/tensorpack/tfutils/gradproc.py
@@ -128,8 +128,7 @@ class MapGradient(GradientProcessor):
        for grad, var in grads:
            if re.match(self.regex, var.op.name):
                matched = True
-                with tf.device(grad.device):
+                grad = self.func(grad, var)
-                    grad = self.func(grad, var)
                if grad is not None:
                    ret.append((grad, var))
            else:

--- a/tensorpack/tfutils/summary.py
+++ b/tensorpack/tfutils/summary.py
@@ -241,8 +241,9 @@ def add_moving_summary(*args, **kwargs):
                ema_op = moving_averages.assign_moving_average(
                    ema_var, c, decay,
                    zero_debias=True, name=name + '_EMA_apply')
-            tf.summary.scalar(name + '-summary', ema_op)    # write the EMA value as a summary
            ema_ops.append(ema_op)
+        # cannot add it into colocate group -- will force everything to cpus
+        tf.summary.scalar(name + '-summary', ema_op)    # write the EMA value as a summary
    if coll is not None:
        for op in ema_ops:
            # TODO a new collection to summary every step?