From 1b2c70f82a9ec88c60bb277f9f5f0073c96691e7 Mon Sep 17 00:00:00 2001
From: AlexeyAB <alexeyab84@gmail.com>
Date: Tue, 03 Apr 2018 13:42:00 +0000
Subject: [PATCH] Detection is accelerated by 7 percent (fused conv and batch_norm layers)

---
 src/cuda.c |    1 +
 1 files changed, 1 insertions(+), 0 deletions(-)

diff --git a/src/cuda.c b/src/cuda.c
index f168e4e..d8db851 100644
--- a/src/cuda.c
+++ b/src/cuda.c
@@ -96,6 +96,7 @@
     int i = cuda_get_device();
     if(!init[i]) {
         cublasCreate(&handle[i]);
+		cublasStatus_t status = cublasSetStream(handle[i], get_cuda_stream());
         init[i] = 1;
     }
     return handle[i];

--
Gitblit v1.10.0