From 9d23aad8696268e8ce3a94fee9490fd1db000dc8 Mon Sep 17 00:00:00 2001
From: AlexeyAB <alexeyab84@gmail.com>
Date: Sun, 31 Dec 2017 17:10:32 +0000
Subject: [PATCH] Added CUDA-streams to Darknet-Yolo forward inference
---
src/gemm.c | 1 +
1 file changed, 1 insertion(+), 0 deletions(-)
diff --git a/src/gemm.c b/src/gemm.c
index a4db8a4..c3154ec 100644
--- a/src/gemm.c
+++ b/src/gemm.c
@@ -177,6 +177,7 @@
float *C_gpu, int ldc)
{
cublasHandle_t handle = blas_handle();
+ cudaError_t stream_status = cublasSetStream(handle, get_cuda_stream());
cudaError_t status = cublasSgemm(handle, (TB ? CUBLAS_OP_T : CUBLAS_OP_N),
(TA ? CUBLAS_OP_T : CUBLAS_OP_N), N, M, K, &ALPHA, B_gpu, ldb, A_gpu, lda, &BETA, C_gpu, ldc);
check_error(status);
--
Gitblit v1.10.0