aboutsummaryrefslogtreecommitdiff
path: root/llvm/test/CodeGen/NVPTX/convert-call-to-indirect.ll
blob: 48209a8c886824fa5931db78b4d299ffe3cab810 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 5
; RUN: llc < %s -march=nvptx64 -mcpu=sm_90 | FileCheck %s
; RUN: %if ptxas %{ llc < %s -march=nvptx64 -mcpu=sm_90 | %ptxas-verify -arch=sm_90 %}

%struct.64 = type <{ i64 }>
declare i64 @callee(ptr %p);
declare i64 @callee_variadic(ptr %p, ...);

define %struct.64 @test_return_type_mismatch(ptr %p) {
; CHECK-LABEL: test_return_type_mismatch(
; CHECK:       {
; CHECK-NEXT:    .reg .b64 %rd<40>;
; CHECK-EMPTY:
; CHECK-NEXT:  // %bb.0:
; CHECK-NEXT:    ld.param.b64 %rd2, [test_return_type_mismatch_param_0];
; CHECK-NEXT:    { // callseq 0, 0
; CHECK-NEXT:    .param .b64 param0;
; CHECK-NEXT:    .param .align 1 .b8 retval0[8];
; CHECK-NEXT:    st.param.b64 [param0], %rd2;
; CHECK-NEXT:    prototype_0 : .callprototype (.param .align 1 .b8 _[8]) _ (.param .b64 _);
; CHECK-NEXT:    mov.b64 %rd1, callee;
; CHECK-NEXT:    call (retval0), %rd1, (param0), prototype_0;
; CHECK-NEXT:    ld.param.b8 %rd3, [retval0+7];
; CHECK-NEXT:    ld.param.b8 %rd4, [retval0+6];
; CHECK-NEXT:    ld.param.b8 %rd5, [retval0+5];
; CHECK-NEXT:    ld.param.b8 %rd6, [retval0+4];
; CHECK-NEXT:    ld.param.b8 %rd7, [retval0+3];
; CHECK-NEXT:    ld.param.b8 %rd8, [retval0+2];
; CHECK-NEXT:    ld.param.b8 %rd9, [retval0+1];
; CHECK-NEXT:    ld.param.b8 %rd10, [retval0];
; CHECK-NEXT:    } // callseq 0
; CHECK-NEXT:    shl.b64 %rd13, %rd9, 8;
; CHECK-NEXT:    or.b64 %rd14, %rd13, %rd10;
; CHECK-NEXT:    shl.b64 %rd16, %rd8, 16;
; CHECK-NEXT:    shl.b64 %rd18, %rd7, 24;
; CHECK-NEXT:    or.b64 %rd19, %rd18, %rd16;
; CHECK-NEXT:    or.b64 %rd20, %rd19, %rd14;
; CHECK-NEXT:    shl.b64 %rd23, %rd5, 8;
; CHECK-NEXT:    or.b64 %rd24, %rd23, %rd6;
; CHECK-NEXT:    shl.b64 %rd26, %rd4, 16;
; CHECK-NEXT:    shl.b64 %rd28, %rd3, 24;
; CHECK-NEXT:    or.b64 %rd29, %rd28, %rd26;
; CHECK-NEXT:    or.b64 %rd30, %rd29, %rd24;
; CHECK-NEXT:    shl.b64 %rd31, %rd30, 32;
; CHECK-NEXT:    or.b64 %rd32, %rd31, %rd20;
; CHECK-NEXT:    st.param.b8 [func_retval0], %rd10;
; CHECK-NEXT:    shr.u64 %rd33, %rd32, 56;
; CHECK-NEXT:    st.param.b8 [func_retval0+7], %rd33;
; CHECK-NEXT:    shr.u64 %rd34, %rd32, 48;
; CHECK-NEXT:    st.param.b8 [func_retval0+6], %rd34;
; CHECK-NEXT:    shr.u64 %rd35, %rd32, 40;
; CHECK-NEXT:    st.param.b8 [func_retval0+5], %rd35;
; CHECK-NEXT:    shr.u64 %rd36, %rd32, 32;
; CHECK-NEXT:    st.param.b8 [func_retval0+4], %rd36;
; CHECK-NEXT:    shr.u64 %rd37, %rd32, 24;
; CHECK-NEXT:    st.param.b8 [func_retval0+3], %rd37;
; CHECK-NEXT:    shr.u64 %rd38, %rd32, 16;
; CHECK-NEXT:    st.param.b8 [func_retval0+2], %rd38;
; CHECK-NEXT:    shr.u64 %rd39, %rd32, 8;
; CHECK-NEXT:    st.param.b8 [func_retval0+1], %rd39;
; CHECK-NEXT:    ret;
  %ret = call %struct.64 @callee(ptr %p)
  ret %struct.64 %ret
}

define i64 @test_param_type_mismatch(ptr %p) {
; CHECK-LABEL: test_param_type_mismatch(
; CHECK:       {
; CHECK-NEXT:    .reg .b64 %rd<4>;
; CHECK-EMPTY:
; CHECK-NEXT:  // %bb.0:
; CHECK-NEXT:    { // callseq 1, 0
; CHECK-NEXT:    .param .b64 param0;
; CHECK-NEXT:    .param .b64 retval0;
; CHECK-NEXT:    prototype_1 : .callprototype (.param .b64 _) _ (.param .b64 _);
; CHECK-NEXT:    st.param.b64 [param0], 7;
; CHECK-NEXT:    mov.b64 %rd1, callee;
; CHECK-NEXT:    call (retval0), %rd1, (param0), prototype_1;
; CHECK-NEXT:    ld.param.b64 %rd2, [retval0];
; CHECK-NEXT:    } // callseq 1
; CHECK-NEXT:    st.param.b64 [func_retval0], %rd2;
; CHECK-NEXT:    ret;
  %ret = call i64 @callee(i64 7)
  ret i64 %ret
}

define i64 @test_param_count_mismatch(ptr %p) {
; CHECK-LABEL: test_param_count_mismatch(
; CHECK:       {
; CHECK-NEXT:    .reg .b64 %rd<5>;
; CHECK-EMPTY:
; CHECK-NEXT:  // %bb.0:
; CHECK-NEXT:    ld.param.b64 %rd2, [test_param_count_mismatch_param_0];
; CHECK-NEXT:    { // callseq 2, 0
; CHECK-NEXT:    .param .b64 param0;
; CHECK-NEXT:    .param .b64 param1;
; CHECK-NEXT:    .param .b64 retval0;
; CHECK-NEXT:    st.param.b64 [param0], %rd2;
; CHECK-NEXT:    prototype_2 : .callprototype (.param .b64 _) _ (.param .b64 _, .param .b64 _);
; CHECK-NEXT:    st.param.b64 [param1], 7;
; CHECK-NEXT:    mov.b64 %rd1, callee;
; CHECK-NEXT:    call (retval0), %rd1, (param0, param1), prototype_2;
; CHECK-NEXT:    ld.param.b64 %rd3, [retval0];
; CHECK-NEXT:    } // callseq 2
; CHECK-NEXT:    st.param.b64 [func_retval0], %rd3;
; CHECK-NEXT:    ret;
  %ret = call i64 @callee(ptr %p, i64 7)
  ret i64 %ret
}

define %struct.64 @test_return_type_mismatch_variadic(ptr %p) {
; CHECK-LABEL: test_return_type_mismatch_variadic(
; CHECK:       {
; CHECK-NEXT:    .reg .b64 %rd<40>;
; CHECK-EMPTY:
; CHECK-NEXT:  // %bb.0:
; CHECK-NEXT:    ld.param.b64 %rd2, [test_return_type_mismatch_variadic_param_0];
; CHECK-NEXT:    { // callseq 3, 0
; CHECK-NEXT:    .param .b64 param0;
; CHECK-NEXT:    .param .align 1 .b8 retval0[8];
; CHECK-NEXT:    st.param.b64 [param0], %rd2;
; CHECK-NEXT:    prototype_3 : .callprototype (.param .align 1 .b8 _[8]) _ (.param .b64 _);
; CHECK-NEXT:    mov.b64 %rd1, callee_variadic;
; CHECK-NEXT:    call (retval0), %rd1, (param0), prototype_3;
; CHECK-NEXT:    ld.param.b8 %rd3, [retval0+7];
; CHECK-NEXT:    ld.param.b8 %rd4, [retval0+6];
; CHECK-NEXT:    ld.param.b8 %rd5, [retval0+5];
; CHECK-NEXT:    ld.param.b8 %rd6, [retval0+4];
; CHECK-NEXT:    ld.param.b8 %rd7, [retval0+3];
; CHECK-NEXT:    ld.param.b8 %rd8, [retval0+2];
; CHECK-NEXT:    ld.param.b8 %rd9, [retval0+1];
; CHECK-NEXT:    ld.param.b8 %rd10, [retval0];
; CHECK-NEXT:    } // callseq 3
; CHECK-NEXT:    shl.b64 %rd13, %rd9, 8;
; CHECK-NEXT:    or.b64 %rd14, %rd13, %rd10;
; CHECK-NEXT:    shl.b64 %rd16, %rd8, 16;
; CHECK-NEXT:    shl.b64 %rd18, %rd7, 24;
; CHECK-NEXT:    or.b64 %rd19, %rd18, %rd16;
; CHECK-NEXT:    or.b64 %rd20, %rd19, %rd14;
; CHECK-NEXT:    shl.b64 %rd23, %rd5, 8;
; CHECK-NEXT:    or.b64 %rd24, %rd23, %rd6;
; CHECK-NEXT:    shl.b64 %rd26, %rd4, 16;
; CHECK-NEXT:    shl.b64 %rd28, %rd3, 24;
; CHECK-NEXT:    or.b64 %rd29, %rd28, %rd26;
; CHECK-NEXT:    or.b64 %rd30, %rd29, %rd24;
; CHECK-NEXT:    shl.b64 %rd31, %rd30, 32;
; CHECK-NEXT:    or.b64 %rd32, %rd31, %rd20;
; CHECK-NEXT:    st.param.b8 [func_retval0], %rd10;
; CHECK-NEXT:    shr.u64 %rd33, %rd32, 56;
; CHECK-NEXT:    st.param.b8 [func_retval0+7], %rd33;
; CHECK-NEXT:    shr.u64 %rd34, %rd32, 48;
; CHECK-NEXT:    st.param.b8 [func_retval0+6], %rd34;
; CHECK-NEXT:    shr.u64 %rd35, %rd32, 40;
; CHECK-NEXT:    st.param.b8 [func_retval0+5], %rd35;
; CHECK-NEXT:    shr.u64 %rd36, %rd32, 32;
; CHECK-NEXT:    st.param.b8 [func_retval0+4], %rd36;
; CHECK-NEXT:    shr.u64 %rd37, %rd32, 24;
; CHECK-NEXT:    st.param.b8 [func_retval0+3], %rd37;
; CHECK-NEXT:    shr.u64 %rd38, %rd32, 16;
; CHECK-NEXT:    st.param.b8 [func_retval0+2], %rd38;
; CHECK-NEXT:    shr.u64 %rd39, %rd32, 8;
; CHECK-NEXT:    st.param.b8 [func_retval0+1], %rd39;
; CHECK-NEXT:    ret;
  %ret = call %struct.64 (ptr, ...) @callee_variadic(ptr %p)
  ret %struct.64 %ret
}

define i64 @test_param_type_mismatch_variadic(ptr %p) {
; CHECK-LABEL: test_param_type_mismatch_variadic(
; CHECK:       {
; CHECK-NEXT:    .reg .b64 %rd<4>;
; CHECK-EMPTY:
; CHECK-NEXT:  // %bb.0:
; CHECK-NEXT:    ld.param.b64 %rd1, [test_param_type_mismatch_variadic_param_0];
; CHECK-NEXT:    { // callseq 4, 0
; CHECK-NEXT:    .param .align 8 .b8 param1[8];
; CHECK-NEXT:    .param .b64 param0;
; CHECK-NEXT:    .param .b64 retval0;
; CHECK-NEXT:    st.param.b64 [param0], %rd1;
; CHECK-NEXT:    st.param.b64 [param1], 7;
; CHECK-NEXT:    call.uni (retval0), callee_variadic, (param0, param1);
; CHECK-NEXT:    ld.param.b64 %rd2, [retval0];
; CHECK-NEXT:    } // callseq 4
; CHECK-NEXT:    st.param.b64 [func_retval0], %rd2;
; CHECK-NEXT:    ret;
  %ret = call i64 (ptr, ...) @callee_variadic(ptr %p, i64 7)
  ret i64 %ret
}

define i64 @test_param_count_mismatch_variadic(ptr %p) {
; CHECK-LABEL: test_param_count_mismatch_variadic(
; CHECK:       {
; CHECK-NEXT:    .reg .b64 %rd<4>;
; CHECK-EMPTY:
; CHECK-NEXT:  // %bb.0:
; CHECK-NEXT:    ld.param.b64 %rd1, [test_param_count_mismatch_variadic_param_0];
; CHECK-NEXT:    { // callseq 5, 0
; CHECK-NEXT:    .param .align 8 .b8 param1[8];
; CHECK-NEXT:    .param .b64 param0;
; CHECK-NEXT:    .param .b64 retval0;
; CHECK-NEXT:    st.param.b64 [param0], %rd1;
; CHECK-NEXT:    st.param.b64 [param1], 7;
; CHECK-NEXT:    call.uni (retval0), callee_variadic, (param0, param1);
; CHECK-NEXT:    ld.param.b64 %rd2, [retval0];
; CHECK-NEXT:    } // callseq 5
; CHECK-NEXT:    st.param.b64 [func_retval0], %rd2;
; CHECK-NEXT:    ret;
  %ret = call i64 (ptr, ...) @callee_variadic(ptr %p, i64 7)
  ret i64 %ret
}