// blob: eb76ffad9c533a9c5ae32452253a32e5193d3e7c [file] [log] [blame]
#include "stdlib.h"
#include "util.h"
#include "dataset.h"
/*
 * Multi-core matrix multiply: accumulates A * B into C.
 *
 * A, B and C are indexed as square lda x lda matrices stored row-major in
 * flat arrays (element (row, col) is at index row*lda + col). The product is
 * ADDED to whatever C already holds; C is not cleared here.
 *
 * Work split: the lda rows of C are divided into ncores contiguous bands.
 * When lda is not a multiple of ncores, the first (lda % ncores) cores take
 * one extra row each so that every row is computed by exactly one core.
 *
 * coreid  index of the calling core; expected to be in [0, ncores), otherwise
 *         the computed band lies outside the matrix.
 * ncores  number of cores taking part; must be > 0 (the call is a no-op
 *         otherwise).
 * lda     matrix dimension; the call is a no-op when lda <= 0.
 * A, B    input matrices, only read.
 * C       output matrix; only this core's band of rows is written.
 *
 * Synchronisation: one barrier(ncores) call is made after the band is done.
 * barrier() is defined outside this file; it is assumed to block until
 * ncores callers have arrived, so every core must call matmul -- TODO confirm
 * against util.h.
 */
void __attribute__((noinline)) matmul(const int coreid, const int ncores, const int lda, const data_t A[], const data_t B[], data_t C[] )
{
    // ***************************** //
    // **** ADD YOUR CODE HERE ***** //

    // Guard the division below and avoid touching the arrays for empty input.
    if (ncores <= 0 || lda <= 0) {
        return;
    }

    // Band of rows owned by this core: base rows each, plus one of the
    // leftover rows for the lowest-numbered cores.
    const int base = lda / ncores;
    const int extra = lda % ncores;
    const int first = coreid * base + (coreid < extra ? coreid : extra);
    const int last = first + base + (coreid < extra ? 1 : 0);

    for (int j = first; j < last; j++) {
        const data_t *a_row = &A[(size_t)j * (size_t)lda];
        data_t *c_row = &C[(size_t)j * (size_t)lda];

        // k is the middle loop so the innermost loop walks a row of B and a
        // row of C with unit stride.
        for (int k = 0; k < lda; k++) {
            // Keep the A element in data_t so non-int element types are not
            // truncated before the multiply.
            const data_t a_jk = a_row[k];
            const data_t *b_row = &B[(size_t)k * (size_t)lda];

            for (int i = 0; i < lda; i++) {
                c_row[i] += a_jk * b_row[i];
            }
        }
    }

    // Bands are disjoint and A/B are read-only, so no cross-core ordering is
    // needed while computing. A single barrier at the end keeps the number
    // of barrier calls identical on every core even when band sizes differ.
    barrier(ncores);

    // ***************************** //
    //
    // feel free to make a separate function for MI and MSI versions.
}