| | |
| | | #ifndef BLAS_H |
| | | #define BLAS_H |
/*
 * General-purpose helpers. Their definitions are not part of this header, so
 * the notes below are inferred from names and signatures only -- TODO confirm
 * each one against the implementation.
 *
 *   reorg              - presumably rearranges the buffer x in place; `forward`
 *                        looks like a direction flag.
 *   pm                 - presumably "print matrix", with A viewed as M x N.
 *   random_matrix      - returns a float buffer, presumably rows * cols
 *                        elements. NOTE(review): ownership of the returned
 *                        pointer (who frees it) is not stated here.
 *   time_random_matrix - presumably times a matrix product on random inputs;
 *                        TA/TB look like transpose flags and m/k/n like the
 *                        product dimensions.
 */
| | | void reorg(float *x, int size, int layers, int batch, int forward); |
| | | void pm(int M, int N, float *A); |
| | | float *random_matrix(int rows, int cols); |
| | | void time_random_matrix(int TA, int TB, int m, int k, int n); |
| | |
| | | |
/*
 * CPU loss helpers and an element-wise blend. Semantics are inferred from the
 * names and parameter lists only -- TODO confirm against the definitions.
 *
 *   smooth_l1_cpu / l2_cpu - share one signature: a count n, then pred, truth,
 *                            delta and error buffers. delta and error look
 *                            like outputs (presumably per-element gradient and
 *                            loss); none of the pointers is const-qualified,
 *                            so the header does not say which are read-only.
 *   weighted_sum_cpu       - presumably combines a and b using the weights in
 *                            s over num elements and writes the result to c.
 */
| | | void smooth_l1_cpu(int n, float *pred, float *truth, float *delta, float *error); |
| | | void l2_cpu(int n, float *pred, float *truth, float *delta, float *error); |
| | | void weighted_sum_cpu(float *a, float *b, float *s, int num, float *c); |
| | | |
| | | #ifdef GPU |
/*
 * Declared only when GPU is defined (this prototype sits inside #ifdef GPU).
 * The name follows the BLAS "axpy" convention, so this presumably computes
 * Y += ALPHA * X over N elements with strides INCX / INCY -- TODO confirm.
 * NOTE(review): X and Y are presumably device pointers; verify with callers.
 */
| | | void axpy_ongpu(int N, float ALPHA, float * X, int INCX, float * Y, int INCY); |
| | |
/*
 * Vector helpers declared only when GPU is defined (inside #ifdef GPU).
 * Behaviour is inferred from BLAS-style names and signatures -- TODO confirm
 * each against its definition. Pointers are presumably device buffers.
 *
 *   copy_ongpu        - presumably copies N elements from X to Y using strides
 *                       INCX / INCY.
 *   copy_ongpu_offset - same parameter list plus OFFX / OFFY, which look like
 *                       starting offsets into X and Y.
 *   scal_ongpu        - presumably scales X by ALPHA (BLAS "scal").
 *   supp_ongpu        - NOTE(review): "supp" is not a BLAS name; possibly
 *                       suppresses small values relative to ALPHA -- verify.
 *   mask_ongpu        - presumably alters X wherever mask matches mask_num;
 *                       the exact rule is not visible here.
 *   const_ongpu       - presumably fills X with the constant ALPHA.
 *   pow_ongpu         - presumably writes X raised to the power ALPHA into Y.
 */
| | | void copy_ongpu(int N, float * X, int INCX, float * Y, int INCY); |
| | | void copy_ongpu_offset(int N, float * X, int OFFX, int INCX, float * Y, int OFFY, int INCY); |
| | | void scal_ongpu(int N, float ALPHA, float * X, int INCX); |
| | | void supp_ongpu(int N, float ALPHA, float * X, int INCX); |
| | | void mask_ongpu(int N, float * X, float mask_num, float * mask); |
| | | void const_ongpu(int N, float ALPHA, float *X, int INCX); |
| | | void pow_ongpu(int N, float ALPHA, float *X, int INCX, float *Y, int INCY); |
| | |
/*
 * Element-wise helpers declared only when GPU is defined (inside #ifdef GPU).
 *
 *   weighted_sum_gpu  - has the same parameter list as weighted_sum_cpu, so it
 *                       is presumably the GPU counterpart -- TODO confirm.
 *   mult_add_into_gpu - presumably accumulates the element-wise product of a
 *                       and b into c over num elements; verify against the
 *                       definition. Note that the count comes first here but
 *                       fourth in weighted_sum_gpu.
 */
| | | void weighted_sum_gpu(float *a, float *b, float *s, int num, float *c); |
| | | void mult_add_into_gpu(int num, float *a, float *b, float *c); |
| | | |
/*
 * Declared only when GPU is defined (inside #ifdef GPU).
 * Unlike the CPU reorg prototype in this header (x, size, layers, batch,
 * forward), this one takes explicit w / h / c dimensions, a stride and a
 * separate out buffer, so it is not a drop-in counterpart.
 * Presumably reorders x into out by `stride`, with `forward` selecting the
 * direction -- TODO confirm against the definition.
 */
| | | void reorg_ongpu(float *x, int w, int h, int c, int batch, int stride, int forward, float *out); |
| | | |
| | | #endif |
| | | #endif |