src/convolutional_kernels.cu
@@ -2,6 +2,10 @@ #include "curand.h" #include "cublas_v2.h" #ifdef CUDNN #pragma comment(lib, "cudnn.lib") #endif extern "C" { #include "convolutional_layer.h" #include "batchnorm_layer.h" @@ -133,6 +137,9 @@ if(l.batch_normalize){ backward_batchnorm_layer_gpu(l, state); //axpy_ongpu(l.outputs*l.batch, -state.net.decay, l.x_gpu, 1, l.delta_gpu, 1); } else { //axpy_ongpu(l.outputs*l.batch, -state.net.decay, l.output_gpu, 1, l.delta_gpu, 1); } float *original_input = state.input;