Skip to content
Projects
Groups
Snippets
Help
Loading...
Help
Support
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
S
seminar-breakout
Project overview
Project overview
Details
Activity
Releases
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Issues
0
Issues
0
List
Boards
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Analytics
Analytics
CI / CD
Repository
Value Stream
Wiki
Wiki
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
Shashank Suhas
seminar-breakout
Commits
5b18f8be
Commit
5b18f8be
authored
Jun 03, 2017
by
Yuxin Wu
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
bugfix in replicated training varscope
parent
3ab6d2b0
Changes
3
Hide whitespace changes
Inline
Side-by-side
Showing
3 changed files
with
4 additions
and
1 deletion
+4
-1
tensorpack/callbacks/saver.py
tensorpack/callbacks/saver.py
+1
-0
tensorpack/tfutils/tower.py
tensorpack/tfutils/tower.py
+2
-0
tensorpack/train/multigpu.py
tensorpack/train/multigpu.py
+1
-1
No files found.
tensorpack/callbacks/saver.py
View file @
5b18f8be
...
@@ -43,6 +43,7 @@ class ModelSaver(Callback):
...
@@ -43,6 +43,7 @@ class ModelSaver(Callback):
vars
=
[]
vars
=
[]
for
key
in
self
.
var_collections
:
for
key
in
self
.
var_collections
:
vars
.
extend
(
tf
.
get_collection
(
key
))
vars
.
extend
(
tf
.
get_collection
(
key
))
vars
=
list
(
set
(
vars
))
self
.
path
=
os
.
path
.
join
(
self
.
checkpoint_dir
,
'model'
)
self
.
path
=
os
.
path
.
join
(
self
.
checkpoint_dir
,
'model'
)
if
get_tf_version_number
()
<=
1.1
:
if
get_tf_version_number
()
<=
1.1
:
self
.
saver
=
tf
.
train
.
Saver
(
self
.
saver
=
tf
.
train
.
Saver
(
...
...
tensorpack/tfutils/tower.py
View file @
5b18f8be
...
@@ -43,6 +43,8 @@ class TowerContext(object):
...
@@ -43,6 +43,8 @@ class TowerContext(object):
assert
self
.
_name
assert
self
.
_name
if
vs_name
is
None
:
if
vs_name
is
None
:
self
.
_vs_name
=
self
.
_name
self
.
_vs_name
=
self
.
_name
else
:
self
.
_vs_name
=
vs_name
else
:
else
:
assert
vs_name
is
None
,
"vs_name is only valid in 'replicated' mode!"
assert
vs_name
is
None
,
"vs_name is only valid in 'replicated' mode!"
self
.
_vs_name
=
''
self
.
_vs_name
=
''
...
...
tensorpack/train/multigpu.py
View file @
5b18f8be
...
@@ -259,7 +259,7 @@ class SyncMultiGPUTrainerReplicated(MultiGPUTrainerBase, SingleCostFeedfreeTrain
...
@@ -259,7 +259,7 @@ class SyncMultiGPUTrainerReplicated(MultiGPUTrainerBase, SingleCostFeedfreeTrain
lambda
:
self
.
_get_cost_and_grad
()[
1
],
lambda
:
self
.
_get_cost_and_grad
()[
1
],
var_strategy
=
'replicated'
,
var_strategy
=
'replicated'
,
# use no variable scope for the first tower
# use no variable scope for the first tower
vs_names
=
[
''
]
+
[
None
]
*
self
.
config
.
nr_tower
-
1
)
vs_names
=
[
''
]
+
[
None
]
*
(
self
.
config
.
nr_tower
-
1
)
)
grads
=
self
.
_allreduce_grads
(
grad_list
)
grads
=
self
.
_allreduce_grads
(
grad_list
)
train_ops
=
[]
train_ops
=
[]
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment