// Registration callback for the variable ::KernelLaunches::queueCounts.
//
// NOTE(review): this looks like nvcc-generated host stub code -- confirm before
// hand-editing; a regenerated build would overwrite it.
// NOTE(review): a second definition with the same name and signature appears
// later in this text; presumably the two come from separate generated stubs --
// confirm they are never compiled into one translation unit.
//
// handle: opaque pointer that is forwarded unchanged to every call below.
static void __nv_cudaEntityRegisterCallback(void **handle)
{
    __nv_dummy_param_ref(handle);
    __nv_save_fatbinhandle_for_managed_rt(handle);

    // The __shadow_var(...) argument is reproduced verbatim (no added spaces):
    // presumably the registration helpers are macros that stringify or paste
    // these tokens, so reformatting them could change the registered name.
    // The trailing arguments are passed through as-is; presumably they are
    // (ext, size, constant, global) per CUDA's host runtime header -- confirm.
    __cudaRegisterVariable(
        handle,
        __shadow_var(_ZN14KernelLaunches11queueCountsE,::KernelLaunches::queueCounts),
        0, 4096, 0, 0);
}
static void __nv_cudaEntityRegisterCallback( void **__T20) {  __nv_dummy_param_ref(__T20); __nv_save_fatbinhandle_for_managed_rt(__T20); __cudaRegisterEntry(__T20, ((void ( *)(float *, float *, int, int))columnwiseMaxIndex), _Z18columnwiseMaxIndexPfS_ii, (-1)); __cudaRegisterEntry(__T20, ((void ( *)(float *, float *, int, int))columnwiseMax), _Z13columnwiseMaxPfS_ii, (-1)); __cudaRegisterEntry(__T20, ((void ( *)(float *, float *, float, float *, float, int, int))matrixHadamard), _Z14matrixHadamardPfS_fS_fii, (-1)); __cudaRegisterEntry(__T20, ((void ( *)(float *, float *, float *, float *, float *, int))DqnStanfordEvaluation), _Z21DqnStanfordEvaluationPfS_S_S_S_i, (-1)); __cudaRegisterEntry(__T20, ((void ( *)(float *, float *, float *, float *, float *, float *, float, float *, int, int))matrixBellmanErrorAndDeriv), _Z26matrixBellmanErrorAndDerivPfS_S_S_S_S_fS_ii, (-1)); __cudaRegisterEntry(__T20, ((void ( *)(float *, float *, float *, int, int))matrixCrossEntropyError), _Z23matrixCrossEntropyErrorPfS_S_ii, (-1)); __cudaRegisterEntry(__T20, ((void ( *)(float *, float *, float *, int, int))matrixIncorporateSigmoidDeriv), _Z29matrixIncorporateSigmoidDerivPfS_S_ii, (-1)); __cudaRegisterEntry(__T20, ((void ( *)(float *, float *, int, int))matrixSigmoid), _Z13matrixSigmoidPfS_ii, (-1)); __cudaRegisterEntry(__T20, ((void ( *)(float *, float *, float *, int, int))matrixIncorporateReLuDeriv), _Z26matrixIncorporateReLuDerivPfS_S_ii, (-1)); __cudaRegisterEntry(__T20, ((void ( *)(float *, float *, int, int))matrixReLu), _Z10matrixReLuPfS_ii, (-1)); __cudaRegisterEntry(__T20, ((void ( *)(float *, float *, float *, int, int))matrixIncorporateTanhDeriv), _Z26matrixIncorporateTanhDerivPfS_S_ii, (-1)); __cudaRegisterEntry(__T20, ((void ( *)(float *, float *, int, int))matrixTanh), _Z10matrixTanhPfS_ii, (-1)); __cudaRegisterEntry(__T20, ((void ( *)(float *, float *, float *, int, int))matrixPlusVector), _Z16matrixPlusVectorPfS_S_ii, (-1)); }