From 9bae70b22549b68f5cdeece8b6c3b3de00c22714 Mon Sep 17 00:00:00 2001
From: AlexeyAB <alexeyab84@gmail.com>
Date: Mon, 16 Apr 2018 23:51:11 +0000
Subject: [PATCH] Accelerated by another 5% using FP16/32 Batch-norm for Tensor Cores.
---
src/gemm.h | 5 +++++
1 file changed, 5 insertions(+), 0 deletions(-)
diff --git a/src/gemm.h b/src/gemm.h
index 602919f..f0231bf 100644
--- a/src/gemm.h
+++ b/src/gemm.h
@@ -1,6 +1,11 @@
#ifndef GEMM_H
#define GEMM_H
+void gemm_bin(int M, int N, int K, float ALPHA, /* takes no TA/TB flags, unlike gemm(); NOTE(review): presumably a GEMM variant -- confirm against the definition */
+ char *A, int lda, /* A is char *, whereas gemm() takes float *A; lda presumably its leading dimension -- TODO confirm */
+ float *B, int ldb, /* B is a float buffer; ldb presumably its leading dimension -- TODO confirm */
+ float *C, int ldc); /* C is a non-const float buffer, presumably the output -- TODO confirm */
+
void gemm(int TA, int TB, int M, int N, int K, float ALPHA,
float *A, int lda,
float *B, int ldb,
--
Gitblit v1.10.0