From 2b2441313b73c460a60c013c3b7bf9e19c994b6b Mon Sep 17 00:00:00 2001
From: Joseph Redmon <pjreddie@gmail.com>
Date: Thu, 30 Oct 2014 18:28:37 +0000
Subject: [PATCH] col2im maybe a little faster

---
 src/convolutional_layer.c |    2 +-
 1 files changed, 1 insertions(+), 1 deletions(-)

diff --git a/src/convolutional_layer.c b/src/convolutional_layer.c
index 42f4f21..fee559b 100644
--- a/src/convolutional_layer.c
+++ b/src/convolutional_layer.c
@@ -336,7 +336,7 @@
     cl.error = clSetKernelArg(kernel, i++, sizeof(layer.output_cl), (void*) &layer.output_cl);
     check_error(cl);
 
-    const size_t global_size[] = {layer.batch, layer.n*size};
+    const size_t global_size[] = {layer.n*size, layer.batch};
 
     clEnqueueNDRangeKernel(queue, kernel, 2, 0, global_size, 0, 0, 0, 0);
     check_error(cl);

--
Gitblit v1.10.0