1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
| #include <stdlib.h>
| #include <stdio.h>
| #include <math.h>
| #include <time.h>
| #include <string.h>
| #include "mini_blas.h"
|
| void pm(int M, int N, float *A)
| {
| int i,j;
| for(i =0 ; i < M; ++i){
| for(j = 0; j < N; ++j){
| printf("%10.6f, ", A[i*N+j]);
| }
| printf("\n");
| }
| printf("\n");
| }
|
| float *random_matrix(int rows, int cols)
| {
| int i;
| float *m = calloc(rows*cols, sizeof(float));
| for(i = 0; i < rows*cols; ++i){
| m[i] = (float)rand()/RAND_MAX;
| }
| return m;
| }
|
| void time_random_matrix(int TA, int TB, int m, int k, int n)
| {
| float *a;
| if(!TA) a = random_matrix(m,k);
| else a = random_matrix(k,m);
| int lda = (!TA)?k:m;
| float *b;
| if(!TB) b = random_matrix(k,n);
| else b = random_matrix(n,k);
| int ldb = (!TB)?n:k;
|
| float *c = random_matrix(m,n);
| int i;
| clock_t start = clock(), end;
| for(i = 0; i<1000; ++i){
| gemm_cpu(TA,TB,m,n,k,1,a,lda,b,ldb,1,c,n);
| }
| end = clock();
| printf("Matrix Multiplication %dx%d * %dx%d, TA=%d, TB=%d: %lf ms\n",m,k,k,n, TA, TB, (float)(end-start)/CLOCKS_PER_SEC);
| free(a);
| free(b);
| free(c);
| }
|
| void test_blas()
| {
| time_random_matrix(0,0,100,100,100);
| time_random_matrix(1,0,100,100,100);
| time_random_matrix(0,1,100,100,100);
| time_random_matrix(1,1,100,100,100);
|
| time_random_matrix(0,0,1000,100,100);
| time_random_matrix(1,0,1000,100,100);
| time_random_matrix(0,1,1000,100,100);
| time_random_matrix(1,1,1000,100,100);
| }
|
|