From 9bae70b22549b68f5cdeece8b6c3b3de00c22714 Mon Sep 17 00:00:00 2001
From: AlexeyAB <alexeyab84@gmail.com>
Date: Mon, 16 Apr 2018 23:51:11 +0000
Subject: [PATCH] Accelerated by another 5% using FP16/32 Batch-norm for Tensor Cores.

---
 src/avgpool_layer_kernels.cu |    4 ++++
 1 files changed, 4 insertions(+), 0 deletions(-)

diff --git a/src/avgpool_layer_kernels.cu b/src/avgpool_layer_kernels.cu
index 1bd2a2a..b7e2770 100644
--- a/src/avgpool_layer_kernels.cu
+++ b/src/avgpool_layer_kernels.cu
@@ -1,3 +1,7 @@
+#include "cuda_runtime.h"
+#include "curand.h"
+#include "cublas_v2.h"
+
 extern "C" {
 #include "avgpool_layer.h"
 #include "cuda.h"

--
Gitblit v1.10.0