#include "stdlib.h" #include "util.h" #include "dataset.h" void __attribute__((noinline)) matmul(const int coreid, const int ncores, const int lda, const data_t A[], const data_t B[], data_t C[] ) { int i,j,k,a,b,b1,a1,a2,a3,c,c1,c2,c3,b2,b3; for (j=coreid*4; j