Commit 6efe0deb authored by Yuxin Wu's avatar Yuxin Wu

update docs

parent c2cec01e
...@@ -23,7 +23,7 @@ class DistributedReplicatedBuilder(DataParallelBuilder): ...@@ -23,7 +23,7 @@ class DistributedReplicatedBuilder(DataParallelBuilder):
and get synchronously applied to the global copy of variables located on PS. and get synchronously applied to the global copy of variables located on PS.
Then each worker copies the latest variables from PS back to local. Then each worker copies the latest variables from PS back to local.
It is an equivalent of `--variable_update=distributed_replicated` in It is an equivalent of ``--variable_update=distributed_replicated`` in
`tensorflow/benchmarks <https://github.com/tensorflow/benchmarks>`_. `tensorflow/benchmarks <https://github.com/tensorflow/benchmarks>`_.
Note: Note:
......
...@@ -106,7 +106,7 @@ class SyncMultiGPUParameterServerBuilder(DataParallelBuilder): ...@@ -106,7 +106,7 @@ class SyncMultiGPUParameterServerBuilder(DataParallelBuilder):
shared variable scope. It synchronizes the gradients computed shared variable scope. It synchronizes the gradients computed
from each tower, averages them and applies to the shared variables. from each tower, averages them and applies to the shared variables.
It is an equivalent of `--variable_update=parameter_server` in It is an equivalent of ``--variable_update=parameter_server`` in
`tensorflow/benchmarks <https://github.com/tensorflow/benchmarks>`_. `tensorflow/benchmarks <https://github.com/tensorflow/benchmarks>`_.
""" """
def __init__(self, towers, ps_device=None): def __init__(self, towers, ps_device=None):
...@@ -165,7 +165,7 @@ class SyncMultiGPUReplicatedBuilder(DataParallelBuilder): ...@@ -165,7 +165,7 @@ class SyncMultiGPUReplicatedBuilder(DataParallelBuilder):
It will build one tower on each GPU under its own variable scope. It will build one tower on each GPU under its own variable scope.
Each gradient update is averaged across all GPUs through NCCL. Each gradient update is averaged across all GPUs through NCCL.
It is an equivalent of `--variable_update=replicated` in It is an equivalent of ``--variable_update=replicated`` in
`tensorflow/benchmarks <https://github.com/tensorflow/benchmarks>`_. `tensorflow/benchmarks <https://github.com/tensorflow/benchmarks>`_.
""" """
......
...@@ -71,13 +71,16 @@ class SyncMultiGPUTrainerParameterServer(SingleCostTrainer): ...@@ -71,13 +71,16 @@ class SyncMultiGPUTrainerParameterServer(SingleCostTrainer):
""" """
@map_arg(gpus=_int_to_range) @map_arg(gpus=_int_to_range)
def __init__(self, gpus, ps_device='gpu'): def __init__(self, gpus, ps_device=None):
""" """
Args: Args:
gpus ([int]): list of GPU ids. gpus ([int]): list of GPU ids.
ps_device: either 'gpu' or 'cpu', where variables are stored. Setting to 'cpu' might help when #gpu>=4 ps_device: either 'gpu' or 'cpu', where variables are stored.
The default value is subject to change.
""" """
self.devices = gpus self.devices = gpus
if ps_device is None:
ps_device = 'gpu' if len(gpus) <= 2 else 'cpu'
self._builder = SyncMultiGPUParameterServerBuilder(gpus, ps_device) self._builder = SyncMultiGPUParameterServerBuilder(gpus, ps_device)
super(SyncMultiGPUTrainerParameterServer, self).__init__() super(SyncMultiGPUTrainerParameterServer, self).__init__()
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment