#include "stdlib.h" #include "util.h" #include "dataset.h" void __attribute__((noinline)) matmul(const int coreid, const int ncores, const int lda, const data_t A[], const data_t B[], data_t C[] ) { // ***************************** // // **** ADD YOUR CODE HERE ***** // // ***************************** // // // feel free to make a separate function for MI and MSI versions. int i, j, k, ii, jj, kk; int block = lda / ncores; int leftover = lda % ncores; int start = block * coreid; for ( j = start; j < (start+block); j++ ) for ( k = 0; k < lda; k++ ) { for ( i = 0; i < lda; i++ ) { C[i + j*lda] += A[j*lda + k] * B[k*lda + i]; } } }