diff --git a/Makefile b/Makefile index 05cebf9..7822d29 100644 --- a/Makefile +++ b/Makefile @@ -22,7 +22,7 @@ NVCC_GENCODE ?= -gencode=arch=compute_35,code=sm_35 \ CXXFLAGS := -I$(CUDA_INC) -fPIC -fvisibility=hidden NVCUFLAGS := -ccbin $(CXX) $(NVCC_GENCODE) -lineinfo -std=c++11 -maxrregcount 96 # Use addprefix so that we can specify more than one path -LDFLAGS := $(addprefix -L,${CUDA_LIB}) -lcudart +LDFLAGS := $(addprefix -L,${CUDA_LIB}) -lcudart -lrt ifeq ($(DEBUG), 0) NVCUFLAGS += -O3 diff --git a/src/core.cu b/src/core.cu index b5733cd..2eca735 100644 --- a/src/core.cu +++ b/src/core.cu @@ -728,7 +728,7 @@ ncclResult_t ncclCommInitRank(ncclComm_t* newcomm, int ndev, ncclUniqueId commId } extern "C" DSOGLOBAL -ncclResult_t ncclCommInitAll(ncclComm_t* comms, int ndev, int* devlist) { +ncclResult_t ncclCommInitAll(ncclComm_t* comms, int ndev, const int* devlist) { initDebug(); showVersion(); diff --git a/src/nccl.h b/src/nccl.h index 2ca6608..7e24031 100644 --- a/src/nccl.h +++ b/src/nccl.h @@ -63,7 +63,7 @@ ncclResult_t ncclCommInitRank(ncclComm_t* comm, int ndev, ncclUniqueId commId, i * comm should be pre-allocated with size at least ndev*sizeof(ncclComm_t). * If devlist is NULL, the first ndev CUDA devices are used. * Order of devlist defines user-order of processors within the communicator. */ -ncclResult_t ncclCommInitAll(ncclComm_t* comm, int ndev, int* devlist); +ncclResult_t ncclCommInitAll(ncclComm_t* comm, int ndev, const int* devlist); /* Frees resources associated with communicator object. */ void ncclCommDestroy(ncclComm_t comm);