/*
 * cudaConfigureCall -- interposed replacement that forwards to the real
 * implementation through the real_cudaConfigureCall function pointer.
 *
 * When tracing is active (mpitrace_on is set and Extrae_get_trace_CUDA()
 * returns non-zero) the forwarded call is bracketed by
 * Extrae_cudaConfigureCall_Enter / Extrae_cudaConfigureCall_Exit; otherwise
 * the call is forwarded without instrumentation.
 *
 * Parameters p1..p4 are passed to the real function untouched.
 * NOTE(review): they presumably map to gridDim, blockDim, sharedMem and
 * stream of the CUDA runtime API -- confirm against the CUDA headers in use.
 *
 * Returns whatever the real cudaConfigureCall returns. If the real symbol
 * was never resolved (pointer is NULL) the process is terminated with a
 * failure exit status.
 */
cudaError_t cudaConfigureCall (dim3 p1, dim3 p2, size_t p3, cudaStream_t p4)
{
	cudaError_t res;

#if defined(DEBUG)
	fprintf (stderr, PACKAGE_NAME": THREAD %d cudaConfigureCall is at %p\n", THREADID, real_cudaConfigureCall);
	/* p3 is a size_t and p4 a stream handle: print them with matching
	   conversions instead of %d, which is undefined for these types. */
	fprintf (stderr, PACKAGE_NAME": THREAD %d cudaConfigureCall params p3 p4 %lu %p\n", THREADID, (unsigned long) p3, (void *) p4);
#endif

	/* Without the real symbol there is nothing to forward to. */
	if (real_cudaConfigureCall == NULL)
	{
		fprintf (stderr, "Unable to find cudaConfigureCall in DSOs!! Dying...\n");
		/* Fatal condition: report failure to the parent, not success. */
		exit (EXIT_FAILURE);
	}

	if (mpitrace_on && Extrae_get_trace_CUDA())
	{
		/* Tracing enabled: emit enter/exit probes around the real call. */
		Extrae_cudaConfigureCall_Enter (p1, p2, p3, p4);
		res = real_cudaConfigureCall (p1, p2, p3, p4);
		Extrae_cudaConfigureCall_Exit ();
	}
	else
	{
		/* Tracing disabled: plain pass-through. */
		res = real_cudaConfigureCall (p1, p2, p3, p4);
	}

	return res;
}
/*
 * cudaConfigureCall -- interposed replacement for the runtime entry point.
 *
 * Passes the addresses of the grid and block dimensions to
 * configure_get_worksizes() before forwarding the (possibly updated) launch
 * configuration to real_cudaConfigureCall, and resets temp_argument_cnt to
 * zero in between.
 *
 * NOTE(review): configure_get_worksizes() receives pointers, so it
 * presumably rewrites gridDim/blockDim in place -- confirm against its
 * definition.
 * NOTE(review): temp_argument_cnt looks like a counter of kernel arguments
 * collected for the upcoming launch -- confirm against its other users.
 *
 * Returns the status reported by real_cudaConfigureCall unchanged. (A
 * variant that unconditionally returned cudaSuccess exists only as
 * commented-out code in the original and is not active.)
 */
cudaError_t cudaConfigureCall (dim3 gridDim, dim3 blockDim, size_t sharedMem, cudaStream_t stream)
{
	/* Hand the launch dimensions over by address so they can be adjusted. */
	configure_get_worksizes(&gridDim, &blockDim);

	/* Start the next launch with an empty argument count. */
	temp_argument_cnt = 0;

	/* Forward to the real implementation and propagate its result as-is. */
	return real_cudaConfigureCall(gridDim, blockDim, sharedMem, stream);
}