1
1

Fix arguments to error message, remove tabs and trailing spaces

Этот коммит содержится в:
Rolf vandeVaart 2015-07-23 10:02:45 -04:00
родитель 773b509407
Коммит 1f32fa21ae
2 изменённых файла: 16 добавлений и 7 удалений

Просмотреть файл

@@ -1750,8 +1750,8 @@ static int mca_common_cuda_is_gpu_buffer(const void *pUserBuf, opal_convertor_t
res = cuFunc.cuPointerGetAttributes(3, attributes, attrdata, dbuf); res = cuFunc.cuPointerGetAttributes(3, attributes, attrdata, dbuf);
OPAL_OUTPUT_VERBOSE((101, mca_common_cuda_output, OPAL_OUTPUT_VERBOSE((101, mca_common_cuda_output,
"dbuf=%p, memType=%d, ctx=%p, isManaged=%d, res=%d", "dbuf=%p, memType=%d, ctx=%p, isManaged=%d, res=%d",
(void *)dbuf, (int)memType, (void *)ctx, isManaged, res)); (void *)dbuf, (int)memType, (void *)ctx, isManaged, res));
/* Mark unified memory buffers with a flag. This will allow all unified /* Mark unified memory buffers with a flag. This will allow all unified
* memory to be forced through host buffers. Note that this memory can * memory to be forced through host buffers. Note that this memory can
@@ -1994,8 +1994,8 @@ int mca_common_cuda_get_address_range(void *pbase, size_t *psize, void *base)
CUresult result; CUresult result;
result = cuFunc.cuMemGetAddressRange((CUdeviceptr *)pbase, psize, (CUdeviceptr)base); result = cuFunc.cuMemGetAddressRange((CUdeviceptr *)pbase, psize, (CUdeviceptr)base);
if (OPAL_UNLIKELY(CUDA_SUCCESS != result)) { if (OPAL_UNLIKELY(CUDA_SUCCESS != result)) {
opal_show_help("help-mpi-common-cuda.txt", "cuMemGetAddressRange failed", opal_show_help("help-mpi-common-cuda.txt", "cuMemGetAddressRange failed 2",
true, result, base); true, OPAL_PROC_MY_HOSTNAME, result, base);
return OPAL_ERROR; return OPAL_ERROR;
} else { } else {
opal_output_verbose(50, mca_common_cuda_output, opal_output_verbose(50, mca_common_cuda_output,
@@ -2054,7 +2054,8 @@ void mca_common_cuda_get_buffer_id(mca_mpool_base_registration_t *reg)
res = cuFunc.cuPointerGetAttribute(&bufID, CU_POINTER_ATTRIBUTE_BUFFER_ID, res = cuFunc.cuPointerGetAttribute(&bufID, CU_POINTER_ATTRIBUTE_BUFFER_ID,
(CUdeviceptr)dbuf); (CUdeviceptr)dbuf);
if (OPAL_UNLIKELY(res != CUDA_SUCCESS)) { if (OPAL_UNLIKELY(res != CUDA_SUCCESS)) {
opal_show_help("help-mpi-common-cuda.txt", "bufferID failed", true, res); opal_show_help("help-mpi-common-cuda.txt", "bufferID failed",
true, OPAL_PROC_MY_HOSTNAME, res);
} }
reg->gpu_bufID = bufID; reg->gpu_bufID = bufID;

Просмотреть файл

@@ -65,6 +65,14 @@ cannot be used.
Check the cuda.h file for what the return value means. Perhaps a reboot Check the cuda.h file for what the return value means. Perhaps a reboot
of the node will clear the problem. of the node will clear the problem.
# #
[cuMemGetAddressRange failed 2]
The call to cuMemGetAddressRange failed during the GPU RDMA protocol.
Host: %s
cuMemGetAddressRange return value: %d
address: %p
Check the cuda.h file for what the return value means. This is highly
unusual and should not happen. The program will probably abort.
#
[Out of cuEvent handles] [Out of cuEvent handles]
The library has exceeded its number of outstanding event handles. The library has exceeded its number of outstanding event handles.
For better performance, this number should be increased. For better performance, this number should be increased.