marcoabreu closed pull request #9684: Enable dp4a for the CI

This is a PR merged from a forked repository.
diff --git a/tests/ci_build/ b/tests/ci_build/
index 794a4c55ee..768a2ed302 100755
--- a/tests/ci_build/
+++ b/tests/ci_build/
@@ -168,6 +168,10 @@ echo "Running '${COMMAND[@]}' inside ${DOCKER_IMG_NAME}..."
 # ${WORKDIR} is the working directory we start the container in.  By default 
 # is /workspace, but for example when running cmake it is sometimes 
+# Currently compiling for sm52 (g3s) and sm61(p3s).  sm61 is required to test DP4A support on p3
+# instances.  In the long term we should enable sm70 for p3 instances, but this will require
+# CUDA 9(.1) support with our base AMI drivers.
 ${DOCKER_BINARY} run --rm --pid=host \
     -v ${WORKSPACE}:/workspace \
     -w ${WORKDIR} \
@@ -176,7 +180,7 @@ ${DOCKER_BINARY} run --rm --pid=host \
     -e "CI_BUILD_UID=$(id -u)" \
     -e "CI_BUILD_GROUP=$(id -g -n)" \
     -e "CI_BUILD_GID=$(id -g)" \
-    -e "CUDA_ARCH=-gencode arch=compute_52,code=[sm_52,compute_52] --fatbin-options -compress-all" \
+    -e "CUDA_ARCH=-gencode arch=compute_52,code=[sm_52,compute_52] -gencode arch=compute_61,code=sm_61 --fatbin-options -compress-all" \


