48 err = cudaOccupancyMaxPotentialBlockSize(&min_grid_size, &block_size,
49 kernel, dynamic_smem_size, 0);
51 if (err != cudaSuccess)
53 fprintf(stderr,
"ERROR: cudaOccupancyMaxPotentialBlockSize failed (%d)\n", err);
58 grid_size = (elements + block_size - 1) / block_size;
60 return make_int2(grid_size, block_size);
int2 launch_parameters(T kernel, size_t elements, int dynamic_smem_size=0)