This is an automated email from the ASF dual-hosted git repository.
jxie pushed a commit to branch master
in repository https://gitbox.apache.org/repos/asf/incubator-mxnet.git
The following commit(s) were added to refs/heads/master by this push:
new 02b69db Limit the test_nccl.py to run on 8 GPUs (#9441)
02b69db is described below
commit 02b69db318a714ee0d327f62780986740f972fd1
Author: Amol Lele <[email protected]>
AuthorDate: Mon Jan 15 15:08:13 2018 -0800
Limit the test_nccl.py to run on 8 GPUs (#9441)
---
tests/python/gpu/test_nccl.py | 10 +++++++++-
1 file changed, 9 insertions(+), 1 deletion(-)
diff --git a/tests/python/gpu/test_nccl.py b/tests/python/gpu/test_nccl.py
index fd27c0b..8e00ba0 100644
--- a/tests/python/gpu/test_nccl.py
+++ b/tests/python/gpu/test_nccl.py
@@ -21,7 +21,15 @@ import unittest
shapes = [(10), (100), (1000), (10000), (100000), (2,2), (2,3,4,5,6,7,8)]
keys = [1,2,3,4,5,6,7]
-gpus = range(1,1+len(mx.test_utils.list_gpus()))
+num_gpus = len(mx.test_utils.list_gpus())
+
+
+if num_gpus > 8 :
+ print("The machine has {} gpus. We will run the test on 8 gpus.".format(num_gpus))
+ print("There is a limit for all PCI-E hardware on creating number of P2P peers. The limit is 8.")
+ num_gpus = 8;
+
+gpus = range(1,1+num_gpus)
@unittest.skip("Test requires NCCL library installed and enabled during build")
def test_nccl_pushpull():
--
To stop receiving notification emails like this one, please contact
['"[email protected]" <[email protected]>'].