1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
|
/* Local declaration of abort (), which the checks below call on failure.
   When this file is compiled by a C++ compiler the preprocessor inserts
   the "C" linkage specifier, turning the declaration into
   `extern "C" void abort (void);'.  */
extern
#ifdef __cplusplus
"C"
#endif
void abort (void);
/* Fill the first Z elements of X and Y with deterministic patterns.

   For every index k in [0, Z):
     X[k] receives the low five bits of k   (k & 31, i.e. 0 .. 31);
     Y[k] receives the low six bits of k, shifted down by 30
	  ((k & 63) - 30, i.e. -30 .. 33).

   Nothing is written when Z is zero or negative.  Elements at index Z
   and beyond are left untouched.  */
void
fn1 (double *x, double *y, int z)
{
  for (int idx = 0; idx < z; ++idx)
    {
      const int low5 = idx & 31;
      const int low6 = idx & 63;

      x[idx] = low5;
      y[idx] = low6 - 30;
    }
}
/* Explicit-mapping variant.

   Four variable-length arrays of 3 * X doubles are created.  fn1 fills
   the first X elements of FAC0 and FAC1, and a second fn1 call fills
   the first X elements of EXTRA and elements [X, 2 * X) of TERM.

   The loop runs under `omp target' + `omp parallel for' with a `+'
   reduction on TOTAL.  The map clause names two whole VLAs (FAC0,
   EXTRA) and two array sections (FAC1[:X], TERM[X:X]); EXTRA is mapped
   but never read inside the loop.  Each iteration also adds
   sizeof (FAC0) and subtracts sizeof (FAC1); both arrays are declared
   with the same length, so the two sizes are equal.

   Returns the accumulated sum.  */
double
fn2 (int x)
{
  double fac0[3 * x], fac1[3 * x], term[3 * x], extra[3 * x];
  double total = 0;
  int k;

  fn1 (fac0, fac1, x);
  fn1 (extra, term + x, x);

  #pragma omp target map(to: fac0, fac1[:x], term[x:x], extra) map(tofrom: total)
  #pragma omp parallel for reduction(+:total)
  for (k = 0; k < x; ++k)
    total += fac0[k] * fac1[k] + term[x + k] + sizeof (fac0) - sizeof (fac1);

  return total;
}
/* Implicit-mapping variant.

   Four variable-length arrays of 3 * X doubles are created.  fn1 fills
   the first X elements of FAC0 and FAC1, and a second fn1 call fills
   the first X elements of EXTRA and TERM (TERM is written from index 0
   here, not from index X).

   The loop runs under `omp target' + `omp parallel for' with a `+'
   reduction on TOTAL.  Only TOTAL appears in a map clause; FAC0, FAC1
   and TERM are referenced inside the region without being listed in
   any clause.  EXTRA is filled but never read afterwards.

   Returns the sum of FAC0[k] * FAC1[k] + TERM[k] for k in [0, X).  */
double
fn3 (int x)
{
  double fac0[3 * x], fac1[3 * x], term[3 * x], extra[3 * x];
  double total = 0;
  int k;

  fn1 (fac0, fac1, x);
  fn1 (extra, term, x);

  #pragma omp target map(tofrom: total)
  #pragma omp parallel for reduction(+:total)
  for (k = 0; k < x; ++k)
    total += fac0[k] * fac1[k] + term[k];

  return total;
}
/* `target data' / `target update' variant with write-back check.

   Four variable-length arrays of 3 * X doubles are created.  fn1 fills
   the first X elements of FAC0 and FAC1, and a second fn1 call fills
   the first X elements of EXTRA and elements [X, 2 * X) of TERM.

   Inside a `target data' region that lists the arrays with
   `map(from: ...)', the same list is first pushed with
   `target update to(...)'.  A nested `target' + `parallel for' loop
   then accumulates into TOTAL (with a `+' reduction) and overwrites
   FAC0[k], FAC1[k] and TERM[X + k] with k + 0.5, 0.5 - k and 0.5 * k.
   The nested target construct names only FAC1[:X], TERM[X:X] and TOTAL
   in its map clause; FAC0 is used there without being listed.

   After the data region closes, the host-side arrays are compared with
   the values stored by the loop, and abort () is called on the first
   mismatch.

   Returns the accumulated sum.  */
double
fn4 (int x)
{
  double fac0[3 * x], fac1[3 * x], term[3 * x], extra[3 * x];
  double total = 0;
  int k;

  fn1 (fac0, fac1, x);
  fn1 (extra, term + x, x);

  #pragma omp target data map(from: fac0, fac1[:x], term[x:x], extra)
  {
    #pragma omp target update to(fac0, fac1[:x], term[x:x], extra)
    #pragma omp target map(fac1[:x], term[x:x], total)
    #pragma omp parallel for reduction(+:total)
    for (k = 0; k < x; ++k)
      {
	/* Read the old values before they are overwritten below.  */
	total += fac0[k] * fac1[k] + term[x + k] + sizeof (fac0) - sizeof (fac1);
	fac0[k] = k + 0.5;
	fac1[k] = 0.5 - k;
	term[x + k] = 0.5 * k;
      }
  }

  /* Every element written inside the region must now be visible here.  */
  for (k = 0; k < x; ++k)
    {
      if (!(fac0[k] == k + 0.5
	    && fac1[k] == 0.5 - k
	    && term[x + k] == 0.5 * k))
	abort ();
    }

  return total;
}
/* Test driver.

   Runs fn2 and fn3 with 128 elements and fn4 with 256 elements, calling
   abort () as soon as a result is wrong:
     - fn2 (128) must be exactly 14080.0;
     - fn3 (128) must equal the fn2 result;
     - fn4 (256) must be exactly 28160.0.
   Returns 0 when all three checks pass.  */
int
main ()
{
  double explicit_sum = fn2 (128);
  if (!(explicit_sum == 14080.0))
    abort ();

  double implicit_sum = fn3 (128);
  if (!(explicit_sum == implicit_sum))
    abort ();

  double update_sum = fn4 (256);
  if (!(update_sum == 28160.0))
    abort ();

  return 0;
}
|