Fix arguments to error messages (pass the hostname), remove tabs and trailing spaces
Этот коммит содержится в:
родитель
773b509407
Коммит
1f32fa21ae
@ -1994,8 +1994,8 @@ int mca_common_cuda_get_address_range(void *pbase, size_t *psize, void *base)
|
|||||||
CUresult result;
|
CUresult result;
|
||||||
result = cuFunc.cuMemGetAddressRange((CUdeviceptr *)pbase, psize, (CUdeviceptr)base);
|
result = cuFunc.cuMemGetAddressRange((CUdeviceptr *)pbase, psize, (CUdeviceptr)base);
|
||||||
if (OPAL_UNLIKELY(CUDA_SUCCESS != result)) {
|
if (OPAL_UNLIKELY(CUDA_SUCCESS != result)) {
|
||||||
opal_show_help("help-mpi-common-cuda.txt", "cuMemGetAddressRange failed",
|
opal_show_help("help-mpi-common-cuda.txt", "cuMemGetAddressRange failed 2",
|
||||||
true, result, base);
|
true, OPAL_PROC_MY_HOSTNAME, result, base);
|
||||||
return OPAL_ERROR;
|
return OPAL_ERROR;
|
||||||
} else {
|
} else {
|
||||||
opal_output_verbose(50, mca_common_cuda_output,
|
opal_output_verbose(50, mca_common_cuda_output,
|
||||||
@ -2054,7 +2054,8 @@ void mca_common_cuda_get_buffer_id(mca_mpool_base_registration_t *reg)
|
|||||||
res = cuFunc.cuPointerGetAttribute(&bufID, CU_POINTER_ATTRIBUTE_BUFFER_ID,
|
res = cuFunc.cuPointerGetAttribute(&bufID, CU_POINTER_ATTRIBUTE_BUFFER_ID,
|
||||||
(CUdeviceptr)dbuf);
|
(CUdeviceptr)dbuf);
|
||||||
if (OPAL_UNLIKELY(res != CUDA_SUCCESS)) {
|
if (OPAL_UNLIKELY(res != CUDA_SUCCESS)) {
|
||||||
opal_show_help("help-mpi-common-cuda.txt", "bufferID failed", true, res);
|
opal_show_help("help-mpi-common-cuda.txt", "bufferID failed",
|
||||||
|
true, OPAL_PROC_MY_HOSTNAME, res);
|
||||||
}
|
}
|
||||||
reg->gpu_bufID = bufID;
|
reg->gpu_bufID = bufID;
|
||||||
|
|
||||||
|
@ -65,6 +65,14 @@ cannot be used.
|
|||||||
Check the cuda.h file for what the return value means. Perhaps a reboot
|
Check the cuda.h file for what the return value means. Perhaps a reboot
|
||||||
of the node will clear the problem.
|
of the node will clear the problem.
|
||||||
#
|
#
|
||||||
|
[cuMemGetAddressRange failed 2]
|
||||||
|
The call to cuMemGetAddressRange failed during the GPU RDMA protocol.
|
||||||
|
Host: %s
|
||||||
|
cuMemGetAddressRange return value: %d
|
||||||
|
address: %p
|
||||||
|
Check the cuda.h file for what the return value means. This is highly
|
||||||
|
unusual and should not happen. The program will probably abort.
|
||||||
|
#
|
||||||
[Out of cuEvent handles]
|
[Out of cuEvent handles]
|
||||||
The library has exceeded its number of outstanding event handles.
|
The library has exceeded its number of outstanding event handles.
|
||||||
For better performance, this number should be increased.
|
For better performance, this number should be increased.
|
||||||
|
Загрузка…
x
Ссылка в новой задаче
Block a user