/************************************************************************* * Copyright (c) 2015-2016, NVIDIA CORPORATION. All rights reserved. * * Redistribution and use in source and binary forms, with or without * modification, are permitted provided that the following conditions * are met: * * Redistributions of source code must retain the above copyright * notice, this list of conditions and the following disclaimer. * * Redistributions in binary form must reproduce the above copyright * notice, this list of conditions and the following disclaimer in the * documentation and/or other materials provided with the distribution. * * Neither the name of NVIDIA CORPORATION nor the names of its * contributors may be used to endorse or promote products derived * from this software without specific prior written permission. * * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS ``AS IS'' AND ANY * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, * EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR * PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY * OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. ************************************************************************/ #include #include #include #include "nccl.h" #include "mpi.h" #include "test_utilities.h" #define SIZE 128 #define NITERS 1 int main(int argc, char *argv[]) { ncclUniqueId commId; int size, rank; ncclResult_t ret; MPI_Init(&argc, &argv); MPI_Comm_size(MPI_COMM_WORLD, &size); MPI_Comm_rank(MPI_COMM_WORLD, &rank); if (argc < size) { if (rank == 0) printf("Usage : %s \n", argv[0]); exit(1); } int gpu = atoi(argv[rank+1]); // We have to set our device before NCCL init CUDACHECK(cudaSetDevice(gpu)); MPI_Barrier(MPI_COMM_WORLD); // NCCL Communicator creation ncclComm_t comm; NCCLCHECK(ncclGetUniqueId(&commId)); MPI_Bcast(&commId, NCCL_UNIQUE_ID_BYTES, MPI_CHAR, 0, MPI_COMM_WORLD); ret = ncclCommInitRank(&comm, size, commId, rank); if (ret != ncclSuccess) { printf("NCCL Init failed (%d) '%s'\n", ret, ncclGetErrorString(ret)); exit(1); } // CUDA stream creation cudaStream_t stream; cudaStreamCreateWithFlags(&stream, cudaStreamNonBlocking); // Initialize input values int *dptr; CUDACHECK(cudaMalloc(&dptr, SIZE*2*sizeof(int))); int *val = (int*) malloc(SIZE*sizeof(int)); for (int v=0; v