1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
|
/* { dg-do run { target { powerpc*-*-linux* && { lp64 && p9vector_hw } } } } */
/* { dg-require-effective-target powerpc_p9vector_ok } */
/* { dg-options "-O2 -mpower9-vector -mpower9-misc" } */
#include <amo.h>
#include <stdint.h>
#include <stdlib.h>
/* Test whether the ISA 3.0 amo (atomic memory operations) functions perform as
expected. */
/* 32-bit fixtures.  Every table uses the same slot order:
   0 = add, 1 = xor, 2 = ior, 3 = and.  */

/* Words that main passes to the amo_lwat_* calls.  */
static uint32_t u32_ld[4] = {
  [0] = 9,      /* add */
  [1] = 7,      /* xor */
  [2] = 6,      /* ior */
  [3] = 7,      /* and */
};

/* Words that main passes to the amo_stwat_* calls; same starting values as
   u32_ld.  */
static uint32_t u32_st[4] = {
  [0] = 9,      /* add */
  [1] = 7,      /* xor */
  [2] = 6,      /* ior */
  [3] = 7,      /* and */
};

/* Receives the value returned by each amo_lwat_* call.  */
static uint32_t u32_result[4];

/* Contents main expects in both u32_ld and u32_st once each slot has been
   combined with the operand 1.  */
static uint32_t u32_update[4] = {
  [0] = 9 + 1,  /* add */
  [1] = 7 ^ 1,  /* xor */
  [2] = 6 | 1,  /* ior */
  [3] = 7 & 1,  /* and */
};

/* Values main expects the amo_lwat_* calls to return: the starting contents
   of u32_ld.  */
static uint32_t u32_prev[4] = {
  [0] = 9,      /* add */
  [1] = 7,      /* xor */
  [2] = 6,      /* ior */
  [3] = 7,      /* and */
};
/* 64-bit fixtures.  Every table uses the same slot order:
   0 = add, 1 = xor, 2 = ior, 3 = and.  */

/* Doublewords that main passes to the amo_ldat_* calls.  */
static uint64_t u64_ld[4] = {
  [0] = 9,      /* add */
  [1] = 7,      /* xor */
  [2] = 6,      /* ior */
  [3] = 7,      /* and */
};

/* Doublewords that main passes to the amo_stdat_* calls; same starting
   values as u64_ld.  */
static uint64_t u64_st[4] = {
  [0] = 9,      /* add */
  [1] = 7,      /* xor */
  [2] = 6,      /* ior */
  [3] = 7,      /* and */
};

/* Receives the value returned by each amo_ldat_* call.  */
static uint64_t u64_result[4];

/* Contents main expects in both u64_ld and u64_st once each slot has been
   combined with the operand 1.  */
static uint64_t u64_update[4] = {
  [0] = 9 + 1,  /* add */
  [1] = 7 ^ 1,  /* xor */
  [2] = 6 | 1,  /* ior */
  [3] = 7 & 1,  /* and */
};

/* Values main expects the amo_ldat_* calls to return: the starting contents
   of u64_ld.  */
static uint64_t u64_prev[4] = {
  [0] = 9,      /* add */
  [1] = 7,      /* xor */
  [2] = 6,      /* ior */
  [3] = 7,      /* and */
};
int
main (void)
{
  size_t slot;

  /* Value-returning 32-bit operations: each call's return value is stored in
     u32_result and the addressed u32_ld word is the memory operand.  */
  u32_result[0] = amo_lwat_add (&u32_ld[0], 1);
  u32_result[1] = amo_lwat_xor (&u32_ld[1], 1);
  u32_result[2] = amo_lwat_ior (&u32_ld[2], 1);
  u32_result[3] = amo_lwat_and (&u32_ld[3], 1);

  /* Value-returning 64-bit operations, same pattern on u64_ld.  */
  u64_result[0] = amo_ldat_add (&u64_ld[0], 1);
  u64_result[1] = amo_ldat_xor (&u64_ld[1], 1);
  u64_result[2] = amo_ldat_ior (&u64_ld[2], 1);
  u64_result[3] = amo_ldat_and (&u64_ld[3], 1);

  /* 32-bit operations whose result is not used; they act on u32_st.  */
  amo_stwat_add (&u32_st[0], 1);
  amo_stwat_xor (&u32_st[1], 1);
  amo_stwat_ior (&u32_st[2], 1);
  amo_stwat_and (&u32_st[3], 1);

  /* 64-bit operations whose result is not used; they act on u64_st.  */
  amo_stdat_add (&u64_st[0], 1);
  amo_stdat_xor (&u64_st[1], 1);
  amo_stdat_ior (&u64_st[2], 1);
  amo_stdat_and (&u64_st[3], 1);

  /* For every slot, the returned value must match the *_prev table and both
     memory words must match the *_update table; any mismatch aborts.  */
  for (slot = 0; slot < 4; slot++)
    {
      if (u32_result[slot] != u32_prev[slot]
          || u32_ld[slot] != u32_update[slot]
          || u32_st[slot] != u32_update[slot])
        abort ();

      if (u64_result[slot] != u64_prev[slot]
          || u64_ld[slot] != u64_update[slot]
          || u64_st[slot] != u64_update[slot])
        abort ();
    }

  return 0;
}
|