c38914d4d972b4c10b644d14d6e011eb4e8baea5
//--------------------------------------------------------------------------
// single-thread, naive version
7 void __attribute__((noinline
)) matmul(const int coreid
, const int ncores
, const int lda
, const data_t A
[], const data_t B
[], data_t C
[] )
11 for ( i
= 0; i
< lda
; i
++ )
13 for ( j
= 0; j
< lda
; j
++ )
15 for ( k
= coreid
; k
< lda
; k
+=ncores
)
17 C
[i
+ j
*lda
] += A
[j
*lda
+ k
] * B
[k
*lda
+ i
];