From 1b2c70f82a9ec88c60bb277f9f5f0073c96691e7 Mon Sep 17 00:00:00 2001
From: AlexeyAB <alexeyab84@gmail.com>
Date: Tue, 03 Apr 2018 13:42:00 +0000
Subject: [PATCH] Detection is accelerated by 7 percent (fused conv and batch_norm layers)

---
 src/network.c |   35 +++++++++++++++++++++++++++++++++++
 1 files changed, 35 insertions(+), 0 deletions(-)

diff --git a/src/network.c b/src/network.c
index 175c102..bfade3c 100644
--- a/src/network.c
+++ b/src/network.c
@@ -748,3 +748,38 @@
 	free(net.workspace);
 #endif
 }
+
+
+/* Fold the inference-time batch normalization of every convolutional layer
+ * into that layer's weights and biases, then clear its batch_normalize flag.
+ * The layers reachable through net.layers are modified in place. */
+void fuse_conv_batchnorm(network net)
+{
+	int j;
+	for (j = 0; j < net.n; ++j) {
+		layer *l = &net.layers[j];
+		if (l->type != CONVOLUTIONAL) {
+			printf(" Skip layer: %d \n", l->type);
+			continue;
+		}
+		printf(" Fuse Convolutional layer \t\t l->size = %d  \n", l->size);
+		if (!l->batch_normalize) continue;
+		/* size_t indices: no signed/unsigned compare, no narrowing to int. */
+		const size_t filter_size = (size_t)l->size * l->size * l->c;
+		int f;
+		for (f = 0; f < l->n; ++f) {
+			/* Same divisor for bias and weights; computed once per filter. */
+			const float stddev = sqrtf(l->rolling_variance[f]) + .000001f;
+			const size_t base = (size_t)f * filter_size;
+			size_t i;
+			l->biases[f] -= l->scales[f] * l->rolling_mean[f] / stddev;
+			for (i = 0; i < filter_size; ++i) {
+				l->weights[base + i] = l->weights[base + i] * l->scales[f] / stddev;
+			}
+		}
+		l->batch_normalize = 0;
+#ifdef GPU	/* NOTE(review): push_* looks GPU-only in this project - confirm */
+		push_convolutional_layer(*l);
+#endif
+	}
+}

--
Gitblit v1.10.0