From 05c0f12c735ebd749a36e88b0b0d9fadf0e6515d Mon Sep 17 00:00:00 2001
From: raver119
Date: Mon, 11 May 2020 16:55:23 +0300
Subject: [PATCH] bump up shared memory (#449)

Signed-off-by: raver119@gmail.com
---
Reviewer note: this patch was recovered from a copy in which all line breaks
and every HTML-like "<...>" token had been stripped. The kernel execution
configuration (<<<blocks, threads, shmem, *stream>>>) is rebuilt from the
launcher's own parameters. The template parameter list and the matching
template arguments (storeSum, isNP2) are a reconstruction - TODO confirm
against the upstream file. Indentation inside the hunk and one trailing
context line (presumably blank) could not be recovered, so the hunk may need
`git apply --ignore-whitespace` or manual application.

The added line clamps the dynamic shared-memory size requested for the
prescan kernel to a minimum of 16384 bytes.

 libnd4j/include/loops/cuda/type_conversions.cu | 1 +
 1 file changed, 1 insertion(+)

diff --git a/libnd4j/include/loops/cuda/type_conversions.cu b/libnd4j/include/loops/cuda/type_conversions.cu
index 08bdb8e61..d0dee4f0d 100644
--- a/libnd4j/include/loops/cuda/type_conversions.cu
+++ b/libnd4j/include/loops/cuda/type_conversions.cu
@@ -516,6 +516,7 @@ BUILD_SINGLE_TEMPLATE(template void ND4J_EXPORT cudaDecodeBitmapGeneric, (dim3 &
 template <bool storeSum, bool isNP2>
 __host__ void prescanLauncher(dim3 &blocks, dim3 &threads, int shmem, cudaStream_t *stream, int *g_odata, const int *g_idata, int *g_blockSums, int n, int blockIndex, int baseIndex) {
     //printf("Prescan grid: <%i/%i/%i>; threads: <%i/%i/%i>; shareMemSize: %i\n", blocks.x, blocks.y, blocks.z, threads.x, threads.y, threads.z, shmem);
+    shmem = sd::math::nd4j_max(shmem, 16384);
     prescan<storeSum, isNP2><<<blocks, threads, shmem, *stream>>>(g_odata, g_idata, g_blockSums, n, blockIndex, baseIndex);
 };