From cad4d1618fee74471d335314cb77070fee951a42 Mon Sep 17 00:00:00 2001 From: AlexeyAB <alexeyab84@gmail.com> Date: Sun, 25 Feb 2018 13:29:44 +0000 Subject: [PATCH] Added support for Tensor Cores CC >= 7.0 (V100). For FP16/FP32 (mixed precision), the CUDNN_HALF define should be used. --- src/layer.c | 2 ++ 1 files changed, 2 insertions(+), 0 deletions(-) diff --git a/src/layer.c b/src/layer.c index b88c941..582cbb3 100644 --- a/src/layer.c +++ b/src/layer.c @@ -83,6 +83,8 @@ if (l.x_norm_gpu) cuda_free(l.x_norm_gpu); if (l.weights_gpu) cuda_free(l.weights_gpu); if (l.weight_updates_gpu) cuda_free(l.weight_updates_gpu); + if (l.weights_gpu16) cuda_free(l.weights_gpu16); + if (l.weight_updates_gpu16) cuda_free(l.weight_updates_gpu16); if (l.biases_gpu) cuda_free(l.biases_gpu); if (l.bias_updates_gpu) cuda_free(l.bias_updates_gpu); if (l.scales_gpu) cuda_free(l.scales_gpu); -- Gitblit v1.10.0