; Regression test: llc for PowerPC (pwr8) must not emit the instructions listed in the negative FileCheck patterns of the function below.
; The two llc invocations below compile this file for -mcpu=pwr8, once with
; the powerpc64le triple and once with the powerpc64 triple, and pipe the
; assembly into FileCheck using this same file as the pattern source.
; -verify-machineinstrs enables the machine-code verifier, and
; -ppc-asm-full-reg-names makes the output use prefixed register names such
; as r4 and f0, which the patterns in this file are written against.
; RUN: llc -verify-machineinstrs -ppc-asm-full-reg-names -ppc-vsr-nums-as-vr \
; RUN: -mcpu=pwr8 -mtriple=powerpc64le < %s | FileCheck %s
; RUN: llc -verify-machineinstrs -ppc-asm-full-reg-names -ppc-vsr-nums-as-vr \
; RUN: -mcpu=pwr8 -mtriple=powerpc64 < %s | FileCheck %s
; %struct.d wraps a single array of 131072 i32 values (524288 bytes), the
; same size passed to the lifetime intrinsics in the function below.
%struct.d = type { [131072 x i32] }
; @a is a zero-initialized global array of 4096 i32 values that the function
; below fills with stores.
@a = dso_local local_unnamed_addr global [4096 x i32] zeroinitializer, align 4
; Function Attrs: nounwind (attribute group #0, defined near the bottom of this file)
; @_Z1g1dILi17EE (Itanium mangling of g(d<17>)) receives a %struct.d by value
; in %0, which the body never references. It allocates a second, local
; %struct.d (%c), writes a[i] = i for every element of @a, calls
; @_ZN1dILi17EE1eEv on %c, writes a[i] = i for every element of @a again,
; then passes %c by value to @_Z1h1dILi17EE and returns.
; Note that the basic blocks are not listed in execution order: the second
; loop (vector.body40 / vector.body40.1) appears textually before for.body,
; which is the block that branches into it.
define dso_local void @_Z1g1dILi17EE(ptr nocapture noundef readnone byval(%struct.d) align 8 %0) local_unnamed_addr #0 {
; CHECK-LABEL: _Z1g1dILi17EE:
; The negative patterns below apply to all llc output that follows the
; function label: none of the listed instructions may appear there.
; mtfprd / mffprd move a doubleword between a GPR and an FPR; stdx / ldx are
; the indexed doubleword store / load, here addressed as r1 + r4.
; Only four distinct patterns are listed; each is repeated several times.
; NOTE(review): presumably this is the save/restore sequence through f0 that
; the original bug emitted while addressing this function's large stack
; frame - confirm against the originating bug report.
; CHECK-NOT: mtfprd f0, r4
; CHECK-NOT: stdx r3, r1, r4
; CHECK-NOT: mffprd r4, f0
; CHECK-NOT: mtfprd f0, r4
; CHECK-NOT: ldx r3, r1, r4
; CHECK-NOT: mffprd r4, f0
; CHECK-NOT: mtfprd f0, r4
; CHECK-NOT: stdx r3, r1, r4
; CHECK-NOT: mffprd r4, f0
; CHECK-NOT: mtfprd f0, r4
; CHECK-NOT: ldx r3, r1, r4
; CHECK-NOT: mffprd r4, f0
; entry: reserve the 524288-byte local %c, mark the start of its lifetime and
; enter the first fill loop.
entry:
%c = alloca %struct.d, align 8
call void @llvm.lifetime.start.p0(i64 524288, ptr nonnull %c) #3
br label %vector.body
; vector.body: first half of the first fill loop. %index is the element
; offset into @a and %vec.ind holds <index, index+1, index+2, index+3>; both
; advance by 96 per full iteration. Twelve <4 x i32> stores write elements
; index .. index+47.
vector.body: ; preds = %vector.body.1, %entry
%index = phi i64 [ 0, %entry ], [ %index.next.1, %vector.body.1 ]
%vec.ind = phi <4 x i32> [ <i32 0, i32 1, i32 2, i32 3>, %entry ], [ %vec.ind.next.1, %vector.body.1 ]
%step.add = add <4 x i32> %vec.ind, <i32 4, i32 4, i32 4, i32 4>
%step.add24 = add <4 x i32> %vec.ind, <i32 8, i32 8, i32 8, i32 8>
%step.add25 = add <4 x i32> %vec.ind, <i32 12, i32 12, i32 12, i32 12>
%step.add26 = add <4 x i32> %vec.ind, <i32 16, i32 16, i32 16, i32 16>
%step.add27 = add <4 x i32> %vec.ind, <i32 20, i32 20, i32 20, i32 20>
%step.add28 = add <4 x i32> %vec.ind, <i32 24, i32 24, i32 24, i32 24>
%step.add29 = add <4 x i32> %vec.ind, <i32 28, i32 28, i32 28, i32 28>
%step.add30 = add <4 x i32> %vec.ind, <i32 32, i32 32, i32 32, i32 32>
%step.add31 = add <4 x i32> %vec.ind, <i32 36, i32 36, i32 36, i32 36>
%step.add32 = add <4 x i32> %vec.ind, <i32 40, i32 40, i32 40, i32 40>
%step.add33 = add <4 x i32> %vec.ind, <i32 44, i32 44, i32 44, i32 44>
%1 = getelementptr inbounds [4096 x i32], ptr @a, i64 0, i64 %index
store <4 x i32> %vec.ind, ptr %1, align 4
%2 = getelementptr inbounds i32, ptr %1, i64 4
store <4 x i32> %step.add, ptr %2, align 4
%3 = getelementptr inbounds i32, ptr %1, i64 8
store <4 x i32> %step.add24, ptr %3, align 4
%4 = getelementptr inbounds i32, ptr %1, i64 12
store <4 x i32> %step.add25, ptr %4, align 4
%5 = getelementptr inbounds i32, ptr %1, i64 16
store <4 x i32> %step.add26, ptr %5, align 4
%6 = getelementptr inbounds i32, ptr %1, i64 20
store <4 x i32> %step.add27, ptr %6, align 4
%7 = getelementptr inbounds i32, ptr %1, i64 24
store <4 x i32> %step.add28, ptr %7, align 4
%8 = getelementptr inbounds i32, ptr %1, i64 28
store <4 x i32> %step.add29, ptr %8, align 4
%9 = getelementptr inbounds i32, ptr %1, i64 32
store <4 x i32> %step.add30, ptr %9, align 4
%10 = getelementptr inbounds i32, ptr %1, i64 36
store <4 x i32> %step.add31, ptr %10, align 4
%11 = getelementptr inbounds i32, ptr %1, i64 40
store <4 x i32> %step.add32, ptr %11, align 4
%12 = getelementptr inbounds i32, ptr %1, i64 44
store <4 x i32> %step.add33, ptr %12, align 4
; The loop exits from this first half once elements 0 .. 4079 are written
; (index + 48 == 4080); the remaining 16 elements are stored in for.body.
%index.next = add nuw nsw i64 %index, 48
%13 = icmp eq i64 %index.next, 4080
br i1 %13, label %for.body, label %vector.body.1
; vector.body.1: second half of the first fill loop. Twelve more stores write
; elements index+48 .. index+95; all values are derived from %vec.ind
; with offsets 48 .. 92.
vector.body.1: ; preds = %vector.body
%vec.ind.next = add <4 x i32> %vec.ind, <i32 48, i32 48, i32 48, i32 48>
%step.add.1 = add <4 x i32> %vec.ind, <i32 52, i32 52, i32 52, i32 52>
%step.add24.1 = add <4 x i32> %vec.ind, <i32 56, i32 56, i32 56, i32 56>
%step.add25.1 = add <4 x i32> %vec.ind, <i32 60, i32 60, i32 60, i32 60>
%step.add26.1 = add <4 x i32> %vec.ind, <i32 64, i32 64, i32 64, i32 64>
%step.add27.1 = add <4 x i32> %vec.ind, <i32 68, i32 68, i32 68, i32 68>
%step.add28.1 = add <4 x i32> %vec.ind, <i32 72, i32 72, i32 72, i32 72>
%step.add29.1 = add <4 x i32> %vec.ind, <i32 76, i32 76, i32 76, i32 76>
%step.add30.1 = add <4 x i32> %vec.ind, <i32 80, i32 80, i32 80, i32 80>
%step.add31.1 = add <4 x i32> %vec.ind, <i32 84, i32 84, i32 84, i32 84>
%step.add32.1 = add <4 x i32> %vec.ind, <i32 88, i32 88, i32 88, i32 88>
%step.add33.1 = add <4 x i32> %vec.ind, <i32 92, i32 92, i32 92, i32 92>
%14 = getelementptr inbounds [4096 x i32], ptr @a, i64 0, i64 %index.next
store <4 x i32> %vec.ind.next, ptr %14, align 4
%15 = getelementptr inbounds i32, ptr %14, i64 4
store <4 x i32> %step.add.1, ptr %15, align 4
%16 = getelementptr inbounds i32, ptr %14, i64 8
store <4 x i32> %step.add24.1, ptr %16, align 4
%17 = getelementptr inbounds i32, ptr %14, i64 12
store <4 x i32> %step.add25.1, ptr %17, align 4
%18 = getelementptr inbounds i32, ptr %14, i64 16
store <4 x i32> %step.add26.1, ptr %18, align 4
%19 = getelementptr inbounds i32, ptr %14, i64 20
store <4 x i32> %step.add27.1, ptr %19, align 4
%20 = getelementptr inbounds i32, ptr %14, i64 24
store <4 x i32> %step.add28.1, ptr %20, align 4
%21 = getelementptr inbounds i32, ptr %14, i64 28
store <4 x i32> %step.add29.1, ptr %21, align 4
%22 = getelementptr inbounds i32, ptr %14, i64 32
store <4 x i32> %step.add30.1, ptr %22, align 4
%23 = getelementptr inbounds i32, ptr %14, i64 36
store <4 x i32> %step.add31.1, ptr %23, align 4
%24 = getelementptr inbounds i32, ptr %14, i64 40
store <4 x i32> %step.add32.1, ptr %24, align 4
%25 = getelementptr inbounds i32, ptr %14, i64 44
store <4 x i32> %step.add33.1, ptr %25, align 4
; Advance both induction values by the full 96-element stride and loop back.
%index.next.1 = add nuw nsw i64 %index, 96
%vec.ind.next.1 = add <4 x i32> %vec.ind, <i32 96, i32 96, i32 96, i32 96>
br label %vector.body
; vector.body40: first half of the second fill loop, entered from for.body.
; It has the same structure as vector.body, with its own induction values
; %index41 / %vec.ind42, and writes elements index41 .. index41+47 of @a.
vector.body40: ; preds = %vector.body40.1, %for.body
%index41 = phi i64 [ 0, %for.body ], [ %index.next56.1, %vector.body40.1 ]
%vec.ind42 = phi <4 x i32> [ <i32 0, i32 1, i32 2, i32 3>, %for.body ], [ %vec.ind.next55.1, %vector.body40.1 ]
%step.add43 = add <4 x i32> %vec.ind42, <i32 4, i32 4, i32 4, i32 4>
%step.add44 = add <4 x i32> %vec.ind42, <i32 8, i32 8, i32 8, i32 8>
%step.add45 = add <4 x i32> %vec.ind42, <i32 12, i32 12, i32 12, i32 12>
%step.add46 = add <4 x i32> %vec.ind42, <i32 16, i32 16, i32 16, i32 16>
%step.add47 = add <4 x i32> %vec.ind42, <i32 20, i32 20, i32 20, i32 20>
%step.add48 = add <4 x i32> %vec.ind42, <i32 24, i32 24, i32 24, i32 24>
%step.add49 = add <4 x i32> %vec.ind42, <i32 28, i32 28, i32 28, i32 28>
%step.add50 = add <4 x i32> %vec.ind42, <i32 32, i32 32, i32 32, i32 32>
%step.add51 = add <4 x i32> %vec.ind42, <i32 36, i32 36, i32 36, i32 36>
%step.add52 = add <4 x i32> %vec.ind42, <i32 40, i32 40, i32 40, i32 40>
%step.add53 = add <4 x i32> %vec.ind42, <i32 44, i32 44, i32 44, i32 44>
%26 = getelementptr inbounds [4096 x i32], ptr @a, i64 0, i64 %index41
store <4 x i32> %vec.ind42, ptr %26, align 4
%27 = getelementptr inbounds i32, ptr %26, i64 4
store <4 x i32> %step.add43, ptr %27, align 4
%28 = getelementptr inbounds i32, ptr %26, i64 8
store <4 x i32> %step.add44, ptr %28, align 4
%29 = getelementptr inbounds i32, ptr %26, i64 12
store <4 x i32> %step.add45, ptr %29, align 4
%30 = getelementptr inbounds i32, ptr %26, i64 16
store <4 x i32> %step.add46, ptr %30, align 4
%31 = getelementptr inbounds i32, ptr %26, i64 20
store <4 x i32> %step.add47, ptr %31, align 4
%32 = getelementptr inbounds i32, ptr %26, i64 24
store <4 x i32> %step.add48, ptr %32, align 4
%33 = getelementptr inbounds i32, ptr %26, i64 28
store <4 x i32> %step.add49, ptr %33, align 4
%34 = getelementptr inbounds i32, ptr %26, i64 32
store <4 x i32> %step.add50, ptr %34, align 4
%35 = getelementptr inbounds i32, ptr %26, i64 36
store <4 x i32> %step.add51, ptr %35, align 4
%36 = getelementptr inbounds i32, ptr %26, i64 40
store <4 x i32> %step.add52, ptr %36, align 4
%37 = getelementptr inbounds i32, ptr %26, i64 44
store <4 x i32> %step.add53, ptr %37, align 4
; Same exit condition as the first loop: leave for the scalar tail in
; for.body5 once elements 0 .. 4079 are written.
%index.next56 = add nuw nsw i64 %index41, 48
%38 = icmp eq i64 %index.next56, 4080
br i1 %38, label %for.body5, label %vector.body40.1
; vector.body40.1: second half of the second fill loop; writes elements
; index41+48 .. index41+95 and advances the induction values by 96.
vector.body40.1: ; preds = %vector.body40
%vec.ind.next55 = add <4 x i32> %vec.ind42, <i32 48, i32 48, i32 48, i32 48>
%step.add43.1 = add <4 x i32> %vec.ind42, <i32 52, i32 52, i32 52, i32 52>
%step.add44.1 = add <4 x i32> %vec.ind42, <i32 56, i32 56, i32 56, i32 56>
%step.add45.1 = add <4 x i32> %vec.ind42, <i32 60, i32 60, i32 60, i32 60>
%step.add46.1 = add <4 x i32> %vec.ind42, <i32 64, i32 64, i32 64, i32 64>
%step.add47.1 = add <4 x i32> %vec.ind42, <i32 68, i32 68, i32 68, i32 68>
%step.add48.1 = add <4 x i32> %vec.ind42, <i32 72, i32 72, i32 72, i32 72>
%step.add49.1 = add <4 x i32> %vec.ind42, <i32 76, i32 76, i32 76, i32 76>
%step.add50.1 = add <4 x i32> %vec.ind42, <i32 80, i32 80, i32 80, i32 80>
%step.add51.1 = add <4 x i32> %vec.ind42, <i32 84, i32 84, i32 84, i32 84>
%step.add52.1 = add <4 x i32> %vec.ind42, <i32 88, i32 88, i32 88, i32 88>
%step.add53.1 = add <4 x i32> %vec.ind42, <i32 92, i32 92, i32 92, i32 92>
%39 = getelementptr inbounds [4096 x i32], ptr @a, i64 0, i64 %index.next56
store <4 x i32> %vec.ind.next55, ptr %39, align 4
%40 = getelementptr inbounds i32, ptr %39, i64 4
store <4 x i32> %step.add43.1, ptr %40, align 4
%41 = getelementptr inbounds i32, ptr %39, i64 8
store <4 x i32> %step.add44.1, ptr %41, align 4
%42 = getelementptr inbounds i32, ptr %39, i64 12
store <4 x i32> %step.add45.1, ptr %42, align 4
%43 = getelementptr inbounds i32, ptr %39, i64 16
store <4 x i32> %step.add46.1, ptr %43, align 4
%44 = getelementptr inbounds i32, ptr %39, i64 20
store <4 x i32> %step.add47.1, ptr %44, align 4
%45 = getelementptr inbounds i32, ptr %39, i64 24
store <4 x i32> %step.add48.1, ptr %45, align 4
%46 = getelementptr inbounds i32, ptr %39, i64 28
store <4 x i32> %step.add49.1, ptr %46, align 4
%47 = getelementptr inbounds i32, ptr %39, i64 32
store <4 x i32> %step.add50.1, ptr %47, align 4
%48 = getelementptr inbounds i32, ptr %39, i64 36
store <4 x i32> %step.add51.1, ptr %48, align 4
%49 = getelementptr inbounds i32, ptr %39, i64 40
store <4 x i32> %step.add52.1, ptr %49, align 4
%50 = getelementptr inbounds i32, ptr %39, i64 44
store <4 x i32> %step.add53.1, ptr %50, align 4
%index.next56.1 = add nuw nsw i64 %index41, 96
%vec.ind.next55.1 = add <4 x i32> %vec.ind42, <i32 96, i32 96, i32 96, i32 96>
br label %vector.body40
; for.body: scalar tail of the first fill. Stores the constants 4080 .. 4095
; into a[4080] .. a[4095], calls @_ZN1dILi17EE1eEv (Itanium mangling of
; d<17>::e()) with a pointer to %c, then enters the second fill loop.
for.body: ; preds = %vector.body
store i32 4080, ptr getelementptr inbounds ([4096 x i32], ptr @a, i64 0, i64 4080), align 4
store i32 4081, ptr getelementptr inbounds ([4096 x i32], ptr @a, i64 0, i64 4081), align 4
store i32 4082, ptr getelementptr inbounds ([4096 x i32], ptr @a, i64 0, i64 4082), align 4
store i32 4083, ptr getelementptr inbounds ([4096 x i32], ptr @a, i64 0, i64 4083), align 4
store i32 4084, ptr getelementptr inbounds ([4096 x i32], ptr @a, i64 0, i64 4084), align 4
store i32 4085, ptr getelementptr inbounds ([4096 x i32], ptr @a, i64 0, i64 4085), align 4
store i32 4086, ptr getelementptr inbounds ([4096 x i32], ptr @a, i64 0, i64 4086), align 4
store i32 4087, ptr getelementptr inbounds ([4096 x i32], ptr @a, i64 0, i64 4087), align 4
store i32 4088, ptr getelementptr inbounds ([4096 x i32], ptr @a, i64 0, i64 4088), align 4
store i32 4089, ptr getelementptr inbounds ([4096 x i32], ptr @a, i64 0, i64 4089), align 4
store i32 4090, ptr getelementptr inbounds ([4096 x i32], ptr @a, i64 0, i64 4090), align 4
store i32 4091, ptr getelementptr inbounds ([4096 x i32], ptr @a, i64 0, i64 4091), align 4
store i32 4092, ptr getelementptr inbounds ([4096 x i32], ptr @a, i64 0, i64 4092), align 4
store i32 4093, ptr getelementptr inbounds ([4096 x i32], ptr @a, i64 0, i64 4093), align 4
store i32 4094, ptr getelementptr inbounds ([4096 x i32], ptr @a, i64 0, i64 4094), align 4
store i32 4095, ptr getelementptr inbounds ([4096 x i32], ptr @a, i64 0, i64 4095), align 4
call void @_ZN1dILi17EE1eEv(ptr noundef nonnull align 4 dereferenceable(524288) %c)
br label %vector.body40
; for.body5: scalar tail of the second fill. Stores 4080 .. 4095 again, then
; passes %c by value to @_Z1h1dILi17EE (Itanium mangling of h(d<17>)), marks
; the lifetime of %c as finished and returns.
for.body5: ; preds = %vector.body40
store i32 4080, ptr getelementptr inbounds ([4096 x i32], ptr @a, i64 0, i64 4080), align 4
store i32 4081, ptr getelementptr inbounds ([4096 x i32], ptr @a, i64 0, i64 4081), align 4
store i32 4082, ptr getelementptr inbounds ([4096 x i32], ptr @a, i64 0, i64 4082), align 4
store i32 4083, ptr getelementptr inbounds ([4096 x i32], ptr @a, i64 0, i64 4083), align 4
store i32 4084, ptr getelementptr inbounds ([4096 x i32], ptr @a, i64 0, i64 4084), align 4
store i32 4085, ptr getelementptr inbounds ([4096 x i32], ptr @a, i64 0, i64 4085), align 4
store i32 4086, ptr getelementptr inbounds ([4096 x i32], ptr @a, i64 0, i64 4086), align 4
store i32 4087, ptr getelementptr inbounds ([4096 x i32], ptr @a, i64 0, i64 4087), align 4
store i32 4088, ptr getelementptr inbounds ([4096 x i32], ptr @a, i64 0, i64 4088), align 4
store i32 4089, ptr getelementptr inbounds ([4096 x i32], ptr @a, i64 0, i64 4089), align 4
store i32 4090, ptr getelementptr inbounds ([4096 x i32], ptr @a, i64 0, i64 4090), align 4
store i32 4091, ptr getelementptr inbounds ([4096 x i32], ptr @a, i64 0, i64 4091), align 4
store i32 4092, ptr getelementptr inbounds ([4096 x i32], ptr @a, i64 0, i64 4092), align 4
store i32 4093, ptr getelementptr inbounds ([4096 x i32], ptr @a, i64 0, i64 4093), align 4
store i32 4094, ptr getelementptr inbounds ([4096 x i32], ptr @a, i64 0, i64 4094), align 4
store i32 4095, ptr getelementptr inbounds ([4096 x i32], ptr @a, i64 0, i64 4095), align 4
call void @_Z1h1dILi17EE(ptr noundef nonnull byval(%struct.d) align 8 %c)
call void @llvm.lifetime.end.p0(i64 524288, ptr nonnull %c) #3
ret void
}
; Lifetime intrinsics: the function above calls these at its entry and just
; before its return to bracket the 524288-byte local %c.
; Function Attrs: argmemonly mustprogress nocallback nofree nosync nounwind willreturn
declare void @llvm.lifetime.start.p0(i64 immarg, ptr nocapture) #1
; Function Attrs: argmemonly mustprogress nocallback nofree nosync nounwind willreturn
declare void @llvm.lifetime.end.p0(i64 immarg, ptr nocapture) #1
; External function called between the two fills of @a; it receives a pointer
; to the local %c.
declare void @_ZN1dILi17EE1eEv(ptr noundef nonnull align 4 dereferenceable(524288)) local_unnamed_addr #2
; External function called after the second fill; it receives %c by value
; (byval), i.e. as a full %struct.d argument.
declare void @_Z1h1dILi17EE(ptr noundef byval(%struct.d) align 8) local_unnamed_addr #2
; Attribute group #0 is the one attached to @_Z1g1dILi17EE.
attributes #0 = { nounwind }
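; NOTE(review): attribute groups #1, #2 and #3 are referenced in this file, but only #0 is defined in the portion visible here.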