blob: ef376cbd286c2d05e930db22bcba34c770567afb (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
|
#include "stdlib.h"
#include "util.h"
#include "dataset.h"
/*
 * matmul - this core's share of the product C += A * B.
 *
 * A, B and C are indexed as lda x lda row-major matrices: element (row, col)
 * lives at [row*lda + col].  The rows of C are split into contiguous bands,
 * one band per core.  When lda is not a multiple of ncores, the first
 * (lda % ncores) cores each take one extra row so that every row of C is
 * covered exactly once across all cores.
 *
 * Results are accumulated with "+=", so C is not cleared here.
 * NOTE(review): presumably the caller supplies a zeroed C -- confirm.
 *
 *   coreid - index of the calling core, expected in [0, ncores)
 *   ncores - number of cores sharing the work, expected > 0
 *   lda    - dimension of the square matrices
 *   A, B   - input matrices (read only)
 *   C      - output matrix; assumed not to overlap A or B
 *
 * The call does nothing if ncores <= 0, lda <= 0, or coreid is out of range.
 */
void __attribute__((noinline)) matmul(const int coreid, const int ncores, const int lda, const data_t A[], const data_t B[], data_t C[] )
{
  // ***************************** //
  // **** ADD YOUR CODE HERE ***** //
  // ***************************** //
  //
  // feel free to make a separate function for MI and MSI versions.

  // Reject arguments that would divide by zero or index outside the matrices.
  if (ncores <= 0 || lda <= 0 || coreid < 0 || coreid >= ncores) {
    return;
  }

  const int block = lda / ncores;     // rows every core handles
  const int leftover = lda % ncores;  // rows that do not divide evenly

  // Cores [0, leftover) take block+1 rows, the rest take block rows.
  // With leftover == 0 this reduces to start = block * coreid.
  const int extra_before = (coreid < leftover) ? coreid : leftover;
  const int start = block * coreid + extra_before;
  const int end = start + block + ((coreid < leftover) ? 1 : 0);

  for (int j = start; j < end; j++) {
    for (int k = 0; k < lda; k++) {
      // Invariant across the inner loop; relies on C not overlapping A.
      const data_t a_jk = A[j*lda + k];

      // Inner loop walks a row of B and a row of C with unit stride.
      for (int i = 0; i < lda; i++) {
        C[i + j*lda] += a_jk * B[k*lda + i];
      }
    }
  }
}
|