Skip to content

Commit

Permalink
only global rank 0 can log tensorboard data; avoid multi gpu/node race for the log directory (#296)
Browse files Browse the repository at this point in the history
  • Loading branch information
arashashari authored Jul 21, 2020
1 parent 376818e commit 1f97242
Showing 1 changed file with 3 additions and 3 deletions.
6 changes: 3 additions & 3 deletions deepspeed/pt/deepspeed_light.py
Original file line number Diff line number Diff line change
Expand Up @@ -144,12 +144,12 @@ def __init__(self,
         self._configure_with_arguments(args, mpu)
         self._do_sanity_check()

+        self._init_distributed(dist_init_required)
+
         self.sample_count = 0
-        if self.tensorboard_enabled():
+        if self.tensorboard_enabled() and self.global_rank == 0:
             self.summary_writer = self.get_summary_writer()

-        self._init_distributed(dist_init_required)
-
         # Configure distributed model
         self._configure_distributed_model(model)

Expand Down

0 comments on commit 1f97242

Please sign in to comment.