Commit d2048681 authored by Yuxin Wu

minor update.

parent fe41b5f0
...@@ -113,6 +113,7 @@ def get_config(): ...@@ -113,6 +113,7 @@ def get_config():
nr_tower = max(get_nr_gpu(), 1) nr_tower = max(get_nr_gpu(), 1)
batch = args.batch batch = args.batch
total_batch = batch * nr_tower total_batch = batch * nr_tower
assert total_batch >= 256 # otherwise the learning rate warmup is wrong.
BASE_LR = 0.01 * (total_batch / 256.) BASE_LR = 0.01 * (total_batch / 256.)
logger.info("Running on {} towers. Batch size per tower: {}".format(nr_tower, batch)) logger.info("Running on {} towers. Batch size per tower: {}".format(nr_tower, batch))
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment