Merge pull request #895 from NLGithubWP/update-distributed-benchmarks-dev

Add a comment explaining the device synchronization used for timing in the distributed training benchmark
diff --git a/examples/cifar_distributed_cnn/benchmark.py b/examples/cifar_distributed_cnn/benchmark.py
index 6f9ef52..9156927 100644
--- a/examples/cifar_distributed_cnn/benchmark.py
+++ b/examples/cifar_distributed_cnn/benchmark.py
@@ -80,6 +80,7 @@
         for _ in t:
             model(tx, ty, dist_option='fp32', spars=None)
 
+    # Synchronize the device before reading the end time so the measured per-iteration time is accurate during distributed training
     dev.Sync()
     end = time.time()
     titer = (end - start) / float(niters)