Edmond Yoo
2018-10-11 6ef5acd9c612140cbf698c5ca1295bdba0293801
src/im2col_kernels.cu
@@ -54,7 +54,7 @@
    int width_col = (width + 2 * pad - ksize) / stride + 1;
    int num_kernels = channels * height_col * width_col;
    im2col_gpu_kernel<<<(num_kernels+BLOCK-1)/BLOCK,
        BLOCK>>>(
        BLOCK, 0, get_cuda_stream()>>>(
                num_kernels, im, height, width, ksize, pad,
                stride, height_col,
                width_col, data_col);