Merge pull request #895 from NLGithubWP/update-distributed-benchmarks-dev
Add a comment explaining the device synchronization in the distributed training benchmark
diff --git a/examples/cifar_distributed_cnn/benchmark.py b/examples/cifar_distributed_cnn/benchmark.py
index 6f9ef52..9156927 100644
--- a/examples/cifar_distributed_cnn/benchmark.py
+++ b/examples/cifar_distributed_cnn/benchmark.py
@@ -80,6 +80,7 @@
for _ in t:
model(tx, ty, dist_option='fp32', spars=None)
+ # Synchronize the device before reading the end time so the measurement is more accurate during distributed training
dev.Sync()
end = time.time()
titer = (end - start) / float(niters)