__kernel void col2im(__global float *data_col, int batch, int channels, int height, int width, int ksize, int stride, int pad, __global float *data_im) { int height_col = (height - ksize) / stride + 1; int width_col = (width - ksize) / stride + 1; if (pad){ height_col = 1 + (height-1) / stride; width_col = 1 + (width-1) / stride; pad = ksize/2; } int id = get_global_id(0); int index = id; int w = id%width + pad; id /= width; int h = id%height + pad; id /= height; int c = id%channels; id /= channels; int b = id%batch; int w_start = (w