blob: d6ff44df5a1107b8ded158b2f98db08f7ab23810 (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
|
#include <stdlib.h>
#include <stdio.h>
#define M 8
#define N 32
/* OpenACC routine declared at the vector level.
   Subtracts each of the first N elements of A from itself, leaving
   every one of them equal to zero.  A must point to at least N ints.  */
#pragma acc routine vector
void
vector (int *a)
{
#pragma acc loop vector
  for (int idx = 0; idx < N; ++idx)
    {
      /* Read-modify-write on purpose: the element is both loaded and
         stored, exactly as a compound `-=` would do.  */
      a[idx] = a[idx] - a[idx];
    }
}
/* OpenACC routine declared at the worker level.
   Treats B as N consecutive rows of M ints and doubles every element
   in place.  The outer (row) loop is annotated as a worker loop and the
   inner (column) loop as a vector loop.  B must point to at least
   N * M ints.  */
#pragma acc routine worker
void
worker (int *b)
{
#pragma acc loop worker
  for (int row = 0; row < N; ++row)
    {
      /* Offset of the first element of this row.  */
      const int base = row * M;

#pragma acc loop vector
      for (int col = 0; col < M; ++col)
        b[base + col] = b[base + col] + b[base + col];
    }
}
/* OpenACC routine declared at the gang level.
   Subtracts the element's own index from each of the first N elements
   of A (a[k] becomes a[k] - k).  The loop is annotated with the gang,
   worker and vector clauses.  A must point to at least N ints.  */
#pragma acc routine gang
void
gang (int *a)
{
#pragma acc loop gang worker vector
  for (int idx = 0; idx < N; ++idx)
    a[idx] = a[idx] - idx;
}
/* OpenACC routine declared as sequential.
   Increments each of the first N elements of A by one using a plain
   (un-annotated) loop.  A must point to at least N ints.  */
#pragma acc routine seq
void
seq (int *a)
{
  for (int idx = 0; idx < N; ++idx)
    a[idx] = a[idx] + 1;
}
/* Test driver.  Runs each of the four routines (seq, gang, worker,
   vector) from inside an `acc parallel` region and then checks the
   resulting array contents on the host.  Any mismatch calls abort ();
   returns 0 when every check passes.  */
int
main(int argc, char **argv)
{
  int i;
  int a[N];
  int b[M * N];

  /* Command-line arguments are not used by this test.  */
  (void) argc;
  (void) argv;

  /* --- seq routine: N calls, each adding 1 to every element.  --- */
  for (i = 0; i < N; i++)
    a[i] = 0;

#pragma acc parallel copy (a[0:N])
  {
#pragma acc loop seq
    for (i = 0; i < N; i++)
      seq (&a[0]);
  }

  for (i = 0; i < N; i++)
    {
      if (a[i] != N)
        abort ();
    }

  /* --- gang routine: N calls, each subtracting the index i from a[i].
     Starting from a[i] == N this must leave N - N * i.  --- */
#pragma acc parallel copy (a[0:N])
  {
#pragma acc loop seq
    for (i = 0; i < N; i++)
      gang (&a[0]);
  }

  for (i = 0; i < N; i++)
    {
      if (a[i] != N + (N * (-1 * i)))
        abort ();
    }

  /* --- worker routine: a single call that doubles every element of b.
     b must hold defined values before it is copied in and read by the
     routine, and it is b (not a) that has to be verified afterwards.  --- */
  for (i = 0; i < M * N; i++)
    b[i] = i;

#pragma acc parallel copy (b[0:M*N])
  {
    worker (&b[0]);
  }

  for (i = 0; i < M * N; i++)
    {
      if (b[i] != 2 * i)
        abort ();
    }

  /* --- vector routine: every call zeroes the whole array, so any
     number of calls must leave all elements equal to 0.  --- */
  for (i = 0; i < N; i++)
    a[i] = i;

#pragma acc parallel copy (a[0:N])
  {
#pragma acc loop
    for (i = 0; i < N; i++)
      vector (&a[0]);
  }

  for (i = 0; i < N; i++)
    {
      if (a[i] != 0)
        abort ();
    }

  return 0;
}
|