blob: f2fb3e0b4e4c7c81db97557dcac62aa0235d11a6 (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
|
#include "stdlib.h"
#include "util.h"
#include "dataset.h"
/*
 * matmul - accumulate the product of two square matrices: C += A * B.
 *
 * A, B and C are lda x lda matrices stored row-major (element (row, col) is
 * at index row*lda + col). Products are added to whatever C already holds,
 * so the caller must zero C beforehand if a plain product is wanted.
 *
 * The work is split by output column. One call handles the columns
 *     coreid,          coreid + 2*ncores, coreid + 4*ncores, ...
 * and, paired with each of those, the column ncores further to the right
 *     coreid + ncores, coreid + 3*ncores, ...
 * Calls with coreid = 0 .. ncores-1 therefore cover every column exactly
 * once and never write the same element of C.
 * NOTE(review): presumably each hardware thread calls this once with its own
 * coreid -- confirm against the caller.
 *
 * coreid  index of the calling core, expected in [0, ncores)
 * ncores  number of cooperating cores, must be > 0
 * lda     dimension of the matrices (rows == columns)
 * A, B    input matrices, read only
 * C       output matrix, updated in place; must not overlap A or B
 *
 * Invalid arguments (coreid < 0 or ncores <= 0) make the call a no-op rather
 * than indexing before the arrays or looping forever on a zero stride.
 */
void __attribute__((noinline)) matmul(const int coreid, const int ncores, const int lda, const data_t A[], const data_t B[], data_t C[] )
{
  if (coreid < 0 || ncores <= 0)
  {
    return;
  }

  for (int i = coreid; i < lda; i += ncores * 2)
  {
    /* Second column of the pair. It only exists when it is still inside the
     * matrix; when lda is not a multiple of 2*ncores the last pair is
     * incomplete and touching it would run past the end of the row. */
    const int i2 = i + ncores;
    const int has_second = (i2 < lda);

    for (int j = 0; j < lda; j++)
    {
      const data_t *a_row = &A[j * lda];

      /* Accumulate in locals seeded from C so the additions happen in the
       * same order as updating C directly, without a load/store of C on
       * every k iteration. */
      data_t acc1 = C[j * lda + i];
      data_t acc2 = has_second ? C[j * lda + i2] : 0;

      for (int k = 0; k < lda; k++)
      {
        /* One load of A feeds both output columns. */
        const data_t a = a_row[k];

        acc1 += a * B[k * lda + i];
        if (has_second)
        {
          acc2 += a * B[k * lda + i2];
        }
      }

      C[j * lda + i] = acc1;
      if (has_second)
      {
        C[j * lda + i2] = acc2;
      }
    }
  }
}
|