From 2b2441313b73c460a60c013c3b7bf9e19c994b6b Mon Sep 17 00:00:00 2001
From: Joseph Redmon <pjreddie@gmail.com>
Date: Thu, 30 Oct 2014 18:28:37 +0000
Subject: [PATCH] col2im maybe a little faster
---
src/convolutional_layer.c | 2 +-
1 files changed, 1 insertions(+), 1 deletions(-)
diff --git a/src/convolutional_layer.c b/src/convolutional_layer.c
index 42f4f21..fee559b 100644
--- a/src/convolutional_layer.c
+++ b/src/convolutional_layer.c
@@ -336,7 +336,7 @@
cl.error = clSetKernelArg(kernel, i++, sizeof(layer.output_cl), (void*) &layer.output_cl);
check_error(cl);
- const size_t global_size[] = {layer.batch, layer.n*size};
+ const size_t global_size[] = {layer.n*size, layer.batch};
clEnqueueNDRangeKernel(queue, kernel, 2, 0, global_size, 0, 0, 0, 0);
check_error(cl);
--
Gitblit v1.10.0