From 51477ab274bbb40be259844bdaab9685f693b028 Mon Sep 17 00:00:00 2001
From: AlexeyAB <alexeyab84@gmail.com>
Date: Mon, 24 Jul 2017 23:40:23 +0000
Subject: [PATCH] Increased 2.3 times performance of Yolo on CPU by using OpenMP in both darknet_no_gpu and yolo_cpp_dll_no_gpu
---
src/network_kernels.cu | 3 ++-
1 file changed, 2 insertions(+), 1 deletion(-)
diff --git a/src/network_kernels.cu b/src/network_kernels.cu
index a7510e8..313cd6d 100644
--- a/src/network_kernels.cu
+++ b/src/network_kernels.cu
@@ -78,6 +78,7 @@
void update_network_gpu(network net)
{
+ cuda_set_device(net.gpu_index);
int i;
int update_batch = net.batch*net.subdivisions;
float rate = get_current_rate(net);
@@ -377,7 +378,7 @@
float *get_network_output_layer_gpu(network net, int i)
{
layer l = net.layers[i];
- cuda_pull_array(l.output_gpu, l.output, l.outputs*l.batch);
+ if(l.type != REGION) cuda_pull_array(l.output_gpu, l.output, l.outputs*l.batch);
return l.output;
}
--
Gitblit v1.10.0