~speedprog/mtg/mtg_card_detector.git

			@@ -57,13 +57,13 @@
			l.stride = stride;
			l.size = size;

			l.filters = calloc(c*n*size*size, sizeof(float));
			l.filter_updates = calloc(c*n*size*size, sizeof(float));
			l.weights = calloc(c*n*size*size, sizeof(float));
			l.weight_updates = calloc(c*n*size*size, sizeof(float));

			l.biases = calloc(n, sizeof(float));
			l.bias_updates = calloc(n, sizeof(float));
			float scale = 1./sqrt(size*size*c);
			for(i = 0; i < c*n*size*size; ++i) l.filters[i] = scale*rand_normal();
			for(i = 0; i < c*n*size*size; ++i) l.weights[i] = scale*rand_normal();
			for(i = 0; i < n; ++i){
			l.biases[i] = scale;
			}
			@@ -81,8 +81,8 @@
			l.delta = calloc(l.batch*out_h * out_w * n, sizeof(float));

			#ifdef GPU
			l.filters_gpu = cuda_make_array(l.filters, c*n*size*size);
			l.filter_updates_gpu = cuda_make_array(l.filter_updates, c*n*size*size);
			l.weights_gpu = cuda_make_array(l.weights, c*n*size*size);
			l.weight_updates_gpu = cuda_make_array(l.weight_updates, c*n*size*size);

			l.biases_gpu = cuda_make_array(l.biases, n);
			l.bias_updates_gpu = cuda_make_array(l.bias_updates, n);
			@@ -137,7 +137,7 @@
			fill_cpu(l.outputs*l.batch, 0, l.output, 1);

			for(i = 0; i < l.batch; ++i){
			float *a = l.filters;
			float *a = l.weights;
			float *b = state.input + i*l.c*l.h*l.w;
			float *c = l.col_image;

			@@ -167,7 +167,7 @@

			float *a = state.input + i*m*n;
			float *b = l.col_image;
			float *c = l.filter_updates;
			float *c = l.weight_updates;

			im2col_cpu(l.delta + i*l.n*size, l.n, out_h, out_w,
			l.size, l.stride, 0, b);
			@@ -178,7 +178,7 @@
			int n = l.h*l.w;
			int k = l.size*l.size*l.n;

			float *a = l.filters;
			float *a = l.weights;
			float *b = l.col_image;
			float *c = state.delta + i*n*m;

			@@ -193,9 +193,9 @@
			axpy_cpu(l.n, learning_rate, l.bias_updates, 1, l.biases, 1);
			scal_cpu(l.n, momentum, l.bias_updates, 1);

			axpy_cpu(size, -decay, l.filters, 1, l.filter_updates, 1);
			axpy_cpu(size, learning_rate, l.filter_updates, 1, l.filters, 1);
			scal_cpu(size, momentum, l.filter_updates, 1);
			axpy_cpu(size, -decay, l.weights, 1, l.weight_updates, 1);
			axpy_cpu(size, learning_rate, l.weight_updates, 1, l.weights, 1);
			scal_cpu(size, momentum, l.weight_updates, 1);
			}