aboutsummaryrefslogtreecommitdiff
path: root/llvm/test/CodeGen/AMDGPU/loop_header_nopred.mir
blob: 05cfe5322458228015ff34d3f5412cebe5866597 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
# NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py
# RUN: llc -mtriple=amdgcn -o - -run-pass=block-placement -mcpu=gfx1010 -mattr=-inst-fwd-prefetch-bug -verify-machineinstrs %s | FileCheck -check-prefixes=GFX10 %s
# RUN: llc -mtriple=amdgcn -o - -run-pass=block-placement -mcpu=gfx1100 -mattr=-inst-fwd-prefetch-bug -verify-machineinstrs %s | FileCheck -check-prefixes=GFX11 %s

# RUN: llc -mtriple=amdgcn -o - -passes='require<profile-summary>,function(machine-function(block-placement<tail-merge>))' -mcpu=gfx1100 -mattr=-inst-fwd-prefetch-bug -verify-machineinstrs %s | FileCheck -check-prefixes=GFX11 %s

# Used to fail with:
# Assertion `Out && "Header of loop has no predecessors from outside loop?"' failed.

---
# Input control flow, using the block numbers of the MIR body below (i.e.
# before the block-placement pass renumbers/reorders anything):
#
#   bb.0 -> bb.1                       entry, falls through
#   bb.1 -> bb.3 if VCCZ, else bb.2    50/50 split
#   bb.2 -> bb.3                       empty block
#   bb.3 -> bb.6 if EXECZ, else bb.4   50/50 split
#   bb.4 -> bb.4 if EXECZ, else bb.5   self-loop over eleven S_NOPs; the
#                                      back edge is weighted 0x7c000000
#   bb.5 -> bb.6                       empty block
#   bb.6 -> bb.1 if VCCZ, else bb.7    back edge to bb.1 weighted 0x7c000000
#   bb.7    S_ENDPGM 0                 exit
#
# The two sets of autogenerated assertions are identical except for one line:
# the gfx1010 run expects the output block bb.1 to carry "(align 64)", while
# the gfx1100 runs expect bb.1 without an alignment annotation.
name:            loop_header_nopred
body:             |
  ; GFX10-LABEL: name: loop_header_nopred
  ; GFX10: bb.0:
  ; GFX10-NEXT:   successors: %bb.2(0x80000000)
  ; GFX10-NEXT: {{  $}}
  ; GFX10-NEXT:   S_BRANCH %bb.2
  ; GFX10-NEXT: {{  $}}
  ; GFX10-NEXT: bb.1 (align 64):
  ; GFX10-NEXT:   successors: %bb.7(0x04000000), %bb.2(0x7c000000)
  ; GFX10-NEXT: {{  $}}
  ; GFX10-NEXT:   S_CBRANCH_VCCNZ %bb.7, implicit $vcc_lo
  ; GFX10-NEXT: {{  $}}
  ; GFX10-NEXT: bb.2:
  ; GFX10-NEXT:   successors: %bb.5(0x40000000), %bb.1(0x40000000)
  ; GFX10-NEXT: {{  $}}
  ; GFX10-NEXT:   S_CBRANCH_EXECZ %bb.1, implicit $exec
  ; GFX10-NEXT: {{  $}}
  ; GFX10-NEXT: bb.5:
  ; GFX10-NEXT:   successors: %bb.1(0x04000000), %bb.5(0x7c000000)
  ; GFX10-NEXT: {{  $}}
  ; GFX10-NEXT:   S_NOP 0
  ; GFX10-NEXT:   S_NOP 0
  ; GFX10-NEXT:   S_NOP 0
  ; GFX10-NEXT:   S_NOP 0
  ; GFX10-NEXT:   S_NOP 0
  ; GFX10-NEXT:   S_NOP 0
  ; GFX10-NEXT:   S_NOP 0
  ; GFX10-NEXT:   S_NOP 0
  ; GFX10-NEXT:   S_NOP 0
  ; GFX10-NEXT:   S_NOP 0
  ; GFX10-NEXT:   S_NOP 0
  ; GFX10-NEXT:   S_CBRANCH_EXECZ %bb.5, implicit $exec
  ; GFX10-NEXT:   S_BRANCH %bb.1
  ; GFX10-NEXT: {{  $}}
  ; GFX10-NEXT: bb.7:
  ; GFX10-NEXT:   S_ENDPGM 0
  ;
  ; GFX11-LABEL: name: loop_header_nopred
  ; GFX11: bb.0:
  ; GFX11-NEXT:   successors: %bb.2(0x80000000)
  ; GFX11-NEXT: {{  $}}
  ; GFX11-NEXT:   S_BRANCH %bb.2
  ; GFX11-NEXT: {{  $}}
  ; GFX11-NEXT: bb.1:
  ; GFX11-NEXT:   successors: %bb.7(0x04000000), %bb.2(0x7c000000)
  ; GFX11-NEXT: {{  $}}
  ; GFX11-NEXT:   S_CBRANCH_VCCNZ %bb.7, implicit $vcc_lo
  ; GFX11-NEXT: {{  $}}
  ; GFX11-NEXT: bb.2:
  ; GFX11-NEXT:   successors: %bb.5(0x40000000), %bb.1(0x40000000)
  ; GFX11-NEXT: {{  $}}
  ; GFX11-NEXT:   S_CBRANCH_EXECZ %bb.1, implicit $exec
  ; GFX11-NEXT: {{  $}}
  ; GFX11-NEXT: bb.5:
  ; GFX11-NEXT:   successors: %bb.1(0x04000000), %bb.5(0x7c000000)
  ; GFX11-NEXT: {{  $}}
  ; GFX11-NEXT:   S_NOP 0
  ; GFX11-NEXT:   S_NOP 0
  ; GFX11-NEXT:   S_NOP 0
  ; GFX11-NEXT:   S_NOP 0
  ; GFX11-NEXT:   S_NOP 0
  ; GFX11-NEXT:   S_NOP 0
  ; GFX11-NEXT:   S_NOP 0
  ; GFX11-NEXT:   S_NOP 0
  ; GFX11-NEXT:   S_NOP 0
  ; GFX11-NEXT:   S_NOP 0
  ; GFX11-NEXT:   S_NOP 0
  ; GFX11-NEXT:   S_CBRANCH_EXECZ %bb.5, implicit $exec
  ; GFX11-NEXT:   S_BRANCH %bb.1
  ; GFX11-NEXT: {{  $}}
  ; GFX11-NEXT: bb.7:
  ; GFX11-NEXT:   S_ENDPGM 0
  bb.0:
    successors: %bb.1(0x80000000)

  bb.1:
    successors: %bb.2(0x40000000), %bb.3(0x40000000)

    S_CBRANCH_VCCZ %bb.3, implicit $vcc
    S_BRANCH %bb.2

  bb.2:
    successors: %bb.3(0x80000000)

  bb.3:
    successors: %bb.4(0x40000000), %bb.6(0x40000000)

    S_CBRANCH_EXECZ %bb.6, implicit $exec
    S_BRANCH %bb.4

  bb.4:
    successors: %bb.5(0x04000000), %bb.4(0x7c000000)

    S_NOP 0
    S_NOP 0
    S_NOP 0
    S_NOP 0
    S_NOP 0
    S_NOP 0
    S_NOP 0
    S_NOP 0
    S_NOP 0
    S_NOP 0
    S_NOP 0
    S_CBRANCH_EXECZ %bb.4, implicit $exec

  bb.5:
    successors: %bb.6(0x80000000)

  bb.6:
    successors: %bb.7(0x04000000), %bb.1(0x7c000000)

    S_CBRANCH_VCCZ %bb.1, implicit $vcc

  bb.7:
    S_ENDPGM 0
...