| | |
| | | return layer; |
| | | } |
| | | |
| | | void resize_maxpool_layer(maxpool_layer *layer, int h, int w, int c) |
| | | void resize_maxpool_layer(maxpool_layer *layer, int h, int w) |
| | | { |
| | | layer->h = h; |
| | | layer->w = w; |
| | | layer->c = c; |
| | | layer->output = realloc(layer->output, ((h-1)/layer->stride+1) * ((w-1)/layer->stride+1) * c * layer->batch* sizeof(float)); |
| | | layer->delta = realloc(layer->delta, ((h-1)/layer->stride+1) * ((w-1)/layer->stride+1) * c * layer->batch*sizeof(float)); |
| | | int output_size = ((h-1)/layer->stride+1) * ((w-1)/layer->stride+1) * layer->c * layer->batch; |
| | | layer->output = realloc(layer->output, output_size * sizeof(float)); |
| | | layer->delta = realloc(layer->delta, output_size * sizeof(float)); |
| | | |
| | | #ifdef GPU |
| | | cuda_free((float *)layer->indexes_gpu); |
| | | cuda_free(layer->output_gpu); |
| | | cuda_free(layer->delta_gpu); |
| | | layer->indexes_gpu = cuda_make_int_array(output_size); |
| | | layer->output_gpu = cuda_make_array(layer->output, output_size); |
| | | layer->delta_gpu = cuda_make_array(layer->delta, output_size); |
| | | #endif |
| | | } |
| | | |
| | | void forward_maxpool_layer(const maxpool_layer layer, float *input) |
| | | void forward_maxpool_layer(const maxpool_layer layer, network_state state) |
| | | { |
| | | int b,i,j,k,l,m; |
| | | int w_offset = (-layer.size-1)/2 + 1; |
| | |
| | | int index = cur_w + layer.w*(cur_h + layer.h*(k + b*layer.c)); |
| | | int valid = (cur_h >= 0 && cur_h < layer.h && |
| | | cur_w >= 0 && cur_w < layer.w); |
| | | float val = (valid != 0) ? input[index] : -FLT_MAX; |
| | | float val = (valid != 0) ? state.input[index] : -FLT_MAX; |
| | | max_i = (val > max) ? index : max_i; |
| | | max = (val > max) ? val : max; |
| | | } |
| | |
| | | } |
| | | } |
| | | |
| | | void backward_maxpool_layer(const maxpool_layer layer, float *delta) |
| | | void backward_maxpool_layer(const maxpool_layer layer, network_state state) |
| | | { |
| | | int i; |
| | | int h = (layer.h-1)/layer.stride + 1; |
| | | int w = (layer.w-1)/layer.stride + 1; |
| | | int c = layer.c; |
| | | memset(delta, 0, layer.batch*layer.h*layer.w*layer.c*sizeof(float)); |
| | | memset(state.delta, 0, layer.batch*layer.h*layer.w*layer.c*sizeof(float)); |
| | | for(i = 0; i < h*w*c*layer.batch; ++i){ |
| | | int index = layer.indexes[i]; |
| | | delta[index] += layer.delta[i]; |
| | | state.delta[index] += layer.delta[i]; |
| | | } |
| | | } |
| | | |