6 void __attribute__((noinline
)) matmul(const int coreid
, const int ncores
, const int lda
, const data_t A
[], const data_t B
[], data_t C
[] )
8 int i
, j
, k
, n
, m
, c1
, c2
;
9 for ( j
= coreid
; j
< lda
; j
+= 2*ncores
) {
10 for ( i
= 0; i
< lda
; i
+= 1 ){
11 c1
= 0; //global vars c1, c2
13 for ( k
= 0; k
< lda
; k
+= 1 ) {
14 c1
+= A
[j
* lda
+ k
] * B
[k
*lda
+ i
];
15 c2
+= A
[(j
+ncores
) * lda
+ k
] * B
[k
*lda
+ i
];
19 C
[i
+ (j
+ncores
) * lda
] = c2
;