From a284a7da8d1facbf984a22302665a2a50295a687 Mon Sep 17 00:00:00 2001 From: AlexeyAB <alexeyab84@gmail.com> Date: Wed, 08 Aug 2018 16:08:58 +0000 Subject: [PATCH] Try to use avx_hs() - slow and requires alignment 4096 bits < (l.size*l.size*l.c) May be faster only from 8192 bits and more. --- src/convolutional_layer.h | 3 +++ 1 files changed, 3 insertions(+), 0 deletions(-) diff --git a/src/convolutional_layer.h b/src/convolutional_layer.h index da98dce..dd79c48 100644 --- a/src/convolutional_layer.h +++ b/src/convolutional_layer.h @@ -21,6 +21,7 @@ void backward_bias_gpu(float *bias_updates, float *delta, int batch, int n, int size); #ifdef CUDNN void cudnn_convolutional_setup(layer *l, int cudnn_preference); +void cuda_convert_f32_to_f16(float* input_f32, size_t size, float *output_f16); #endif #endif @@ -34,6 +35,8 @@ void swap_binary(convolutional_layer *l); void binarize_weights2(float *weights, int n, int size, char *binary, float *scales); +void binary_transpose_align_weights(convolutional_layer *l, size_t ldb_align); + void backward_convolutional_layer(convolutional_layer layer, network_state state); void add_bias(float *output, float *biases, int batch, int n, int size); -- Gitblit v1.10.0