Add network communication through another GPU connected with NVLink (PXN). Add aggregation of messages coming from different local GPUs through PXN and going to the same destination. Add new v5 plugin API with grouped receives and tags. Add compat for v4 plugins. Add naming of NCCL threads to help debugging. Fix NVLink detection and avoid data corruption when some NVLinks are down. Add support for Relaxed Ordering for IB. Add profiling and timing infrastructure.
29 lines
1.4 KiB
C++
29 lines
1.4 KiB
C++
/*************************************************************************
 * Copyright (c) 2022, NVIDIA CORPORATION. All rights reserved.
 *
 * See LICENSE.txt for license information
 ************************************************************************/

/* Define weak symbols used to allow libnccl_static.a to work with older libcudart_static.a */

/*
 * Local stand-in for the CUDA runtime error enum. Only the single value
 * returned by the stubs below is declared here.
 * NOTE(review): 34 is presumably the value the CUDA runtime headers assign
 * to cudaErrorStubLibrary -- confirm against driver_types.h when bumping
 * the supported CUDA version.
 */
enum cudaError_t { cudaErrorStubLibrary = 34 };

/*
 * Fallback definitions of CUDA runtime entry points.
 *
 * Every function below is:
 *   - weak:   a non-weak definition of the same symbol supplied at link
 *             time takes precedence over the stub;
 *   - hidden: the stub is not exported from the final linked object;
 *   - variadic with no named parameters: all arguments are ignored, so the
 *             stub does not depend on the real prototype.
 *
 * When a stub is the definition that ends up being called, it does nothing
 * and returns cudaErrorStubLibrary.
 *
 * The attributes are placed on a separate declaration ahead of each
 * definition because GCC does not accept attribute specifiers written after
 * the declarator of a function definition.
 */
extern "C" {

cudaError_t cudaStreamGetCaptureInfo_v2(...) __attribute__((visibility("hidden"))) __attribute__((weak));
cudaError_t cudaStreamGetCaptureInfo_v2(...) { return cudaErrorStubLibrary; }

cudaError_t cudaUserObjectCreate(...) __attribute__((visibility("hidden"))) __attribute__((weak));
cudaError_t cudaUserObjectCreate(...) { return cudaErrorStubLibrary; }

cudaError_t cudaGraphRetainUserObject(...) __attribute__((visibility("hidden"))) __attribute__((weak));
cudaError_t cudaGraphRetainUserObject(...) { return cudaErrorStubLibrary; }

cudaError_t cudaStreamUpdateCaptureDependencies(...) __attribute__((visibility("hidden"))) __attribute__((weak));
cudaError_t cudaStreamUpdateCaptureDependencies(...) { return cudaErrorStubLibrary; }

cudaError_t cudaGetDriverEntryPoint(...) __attribute__((visibility("hidden"))) __attribute__((weak));
cudaError_t cudaGetDriverEntryPoint(...) { return cudaErrorStubLibrary; }

}
|