blob: 7c579cb64c1f09e45c2061262a25a3b68c19a11c (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
|
/* { dg-do compile } */
/* { dg-options "-O2 -ffast-math -mavx512fp16 -mavx512vl -mprefer-vector-width=512" } */
/* { dg-final { scan-assembler-times "vfmaddcph\[ \\t\]" 1 } } */
/* { dg-final { scan-assembler-not "vfmadd\[123]*ph\[ \\t\]"} } */
/* { dg-final { scan-assembler-not "vfmadd\[123]*sh\[ \\t\]"} } */
/* { dg-final { scan-assembler-times "vfcmaddcph\[ \\t\]" 1 } } */
/* { dg-final { scan-assembler-times "vfmulcph\[ \\t\]" 1 } } */
/* { dg-final { scan-assembler-times "vfcmulcph\[ \\t\]" 1 } } */
#include<complex.h>
#define TYPE _Float16
#define N 16
/* Complex multiply-accumulate: for each i in [0, N), c[i] += a[i] * b[i].
   Only c is restrict-qualified here; a and b are plain pointers, unlike the
   array-style restrict parameters used by the other functions in this file.
   NOTE(review): presumably this is the loop the "vfmaddcph" scan-assembler
   directive is aimed at -- confirm against the generated assembly.  */
void fma0 (_Complex TYPE *a, _Complex TYPE *b,
_Complex TYPE * __restrict c)
{
for (int i = 0; i < N; i++)
c[i] += a[i] * b[i];
}
/* Conjugate multiply-accumulate: for each i in [0, N),
   c[i] += a[i] * conj (b[i]).
   All three parameters are declared as restrict-qualified arrays of N
   elements.
   NOTE(review): presumably this is the loop the "vfcmaddcph" scan-assembler
   directive is aimed at -- confirm against the generated assembly.  */
void fmaconj (_Complex TYPE a[restrict N], _Complex TYPE b[restrict N],
_Complex TYPE c[restrict N])
{
for (int i = 0; i < N; i++)
/* '~' on a complex operand is the GNU C complex-conjugate operator.  */
c[i] += a[i] * ~b[i];
}
/* Complex multiply: for each i in [0, N), c[i] = a[i] * b[i].
   The previous contents of c are overwritten, not accumulated into.
   All three parameters are declared as restrict-qualified arrays of N
   elements.
   NOTE(review): presumably this is the loop the "vfmulcph" scan-assembler
   directive is aimed at -- confirm against the generated assembly.  */
void fmul (_Complex TYPE a[restrict N], _Complex TYPE b[restrict N],
_Complex TYPE c[restrict N])
{
for (int i = 0; i < N; i++)
c[i] = a[i] * b[i];
}
/* Conjugate multiply: for each i in [0, N), c[i] = a[i] * conj (b[i]).
   The previous contents of c are overwritten, not accumulated into.
   All three parameters are declared as restrict-qualified arrays of N
   elements.
   NOTE(review): presumably this is the loop the "vfcmulcph" scan-assembler
   directive is aimed at -- confirm against the generated assembly.  */
void fmulconj (_Complex TYPE a[restrict N], _Complex TYPE b[restrict N],
_Complex TYPE c[restrict N])
{
for (int i = 0; i < N; i++)
/* '~' on a complex operand is the GNU C complex-conjugate operator.  */
c[i] = a[i] * ~b[i];
}
|