aboutsummaryrefslogtreecommitdiff
path: root/llvm/test/CodeGen/AMDGPU/trans-coexecution-hazard.mir
blob: fa27d689dd8dd67a669cc520eaf3aee67b054533 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
# NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py
# RUN: llc -mtriple=amdgcn -mcpu=gfx1250 -run-pass post-RA-hazard-rec -o - %s | FileCheck -check-prefixes=GCN,GFX1250 %s
# RUN: llc -mtriple=amdgcn -mcpu=gfx1200 -run-pass post-RA-hazard-rec -o - %s | FileCheck -check-prefixes=GCN,GFX1200 %s

# V_SQRT_F32 writes $vgpr1 and the immediately following V_ADD_F32 reads it.
# The gfx1250 checks expect a V_NOP to be inserted between the two
# instructions; the gfx1200 checks expect the sequence to be left unchanged.
---
name:            trans_writes_valu_reads_hazard
body:            |
  bb.0:
    ; GFX1250-LABEL: name: trans_writes_valu_reads_hazard
    ; GFX1250: $vgpr1 = V_SQRT_F32_e32 $vgpr0, implicit $mode, implicit $exec
    ; GFX1250-NEXT: V_NOP_e32 implicit $exec
    ; GFX1250-NEXT: $vgpr3 = V_ADD_F32_e32 $vgpr1, $vgpr2, implicit $mode, implicit $exec
    ;
    ; GFX1200-LABEL: name: trans_writes_valu_reads_hazard
    ; GFX1200: $vgpr1 = V_SQRT_F32_e32 $vgpr0, implicit $mode, implicit $exec
    ; GFX1200-NEXT: $vgpr3 = V_ADD_F32_e32 $vgpr1, $vgpr2, implicit $mode, implicit $exec
    $vgpr1 = V_SQRT_F32_e32 $vgpr0, implicit $mode, implicit $exec
    $vgpr3 = V_ADD_F32_e32 $vgpr1, $vgpr2, implicit $mode, implicit $exec
...

# V_SQRT_F32 writes $vgpr1 and the second V_ADD_F32 reads it, but another
# V_ADD_F32 that does not touch $vgpr1 sits in between. The shared GCN checks
# expect no V_NOP on either target, i.e. the output equals the input.
---
name:            trans_writes_valu_valu_reads_hazard_covered
body:            |
  bb.0:
    ; GCN-LABEL: name: trans_writes_valu_valu_reads_hazard_covered
    ; GCN: $vgpr1 = V_SQRT_F32_e32 $vgpr0, implicit $mode, implicit $exec
    ; GCN-NEXT: $vgpr2 = V_ADD_F32_e32 $vgpr2, $vgpr3, implicit $mode, implicit $exec
    ; GCN-NEXT: $vgpr4 = V_ADD_F32_e32 $vgpr1, $vgpr2, implicit $mode, implicit $exec
    $vgpr1 = V_SQRT_F32_e32 $vgpr0, implicit $mode, implicit $exec
    $vgpr2 = V_ADD_F32_e32 $vgpr2, $vgpr3, implicit $mode, implicit $exec
    $vgpr4 = V_ADD_F32_e32 $vgpr1, $vgpr2, implicit $mode, implicit $exec
...

# V_SQRT_F32 writes $vgpr1, an S_ADD_U32 follows, and then V_ADD_F32 reads
# $vgpr1. The gfx1250 checks still expect a V_NOP, placed after the S_ADD_U32
# and directly before the V_ADD_F32; the gfx1200 checks expect no change.
---
name:            trans_writes_salu_valu_reads_hazard
body:            |
  bb.0:
    ; GFX1250-LABEL: name: trans_writes_salu_valu_reads_hazard
    ; GFX1250: $vgpr1 = V_SQRT_F32_e32 $vgpr0, implicit $mode, implicit $exec
    ; GFX1250-NEXT: $sgpr2 = S_ADD_U32 $sgpr0, $sgpr1, implicit-def $scc
    ; GFX1250-NEXT: V_NOP_e32 implicit $exec
    ; GFX1250-NEXT: $vgpr4 = V_ADD_F32_e32 $vgpr1, $vgpr2, implicit $mode, implicit $exec
    ;
    ; GFX1200-LABEL: name: trans_writes_salu_valu_reads_hazard
    ; GFX1200: $vgpr1 = V_SQRT_F32_e32 $vgpr0, implicit $mode, implicit $exec
    ; GFX1200-NEXT: $sgpr2 = S_ADD_U32 $sgpr0, $sgpr1, implicit-def $scc
    ; GFX1200-NEXT: $vgpr4 = V_ADD_F32_e32 $vgpr1, $vgpr2, implicit $mode, implicit $exec
    $vgpr1 = V_SQRT_F32_e32 $vgpr0, implicit $mode, implicit $exec
    $sgpr2 = S_ADD_U32 $sgpr0, $sgpr1, implicit-def $scc
    $vgpr4 = V_ADD_F32_e32 $vgpr1, $vgpr2, implicit $mode, implicit $exec
...

# The V_ADD_F32 neither reads the register written by V_SQRT_F32 ($vgpr1) nor
# writes the register it reads ($vgpr0); both instructions only read $vgpr0.
# The shared GCN checks expect no V_NOP on either target.
---
name:            trans_no_hazard
body:            |
  bb.0:
    ; GCN-LABEL: name: trans_no_hazard
    ; GCN: $vgpr1 = V_SQRT_F32_e32 $vgpr0, implicit $mode, implicit $exec
    ; GCN-NEXT: $vgpr3 = V_ADD_F32_e32 $vgpr0, $vgpr2, implicit $mode, implicit $exec
    $vgpr1 = V_SQRT_F32_e32 $vgpr0, implicit $mode, implicit $exec
    $vgpr3 = V_ADD_F32_e32 $vgpr0, $vgpr2, implicit $mode, implicit $exec
...

# V_COS_F32 reads $vgpr0 and the immediately following V_ADD_F32 overwrites
# $vgpr0. The gfx1250 checks expect a V_NOP to be inserted between the two
# instructions; the gfx1200 checks expect the sequence to be left unchanged.
---
name:            trans_reads_valu_writes_hazard
body:            |
  bb.0:
    ; GFX1250-LABEL: name: trans_reads_valu_writes_hazard
    ; GFX1250: $vgpr1 = V_COS_F32_e32 $vgpr0, implicit $mode, implicit $exec
    ; GFX1250-NEXT: V_NOP_e32 implicit $exec
    ; GFX1250-NEXT: $vgpr0 = V_ADD_F32_e32 $vgpr2, $vgpr3, implicit $mode, implicit $exec
    ;
    ; GFX1200-LABEL: name: trans_reads_valu_writes_hazard
    ; GFX1200: $vgpr1 = V_COS_F32_e32 $vgpr0, implicit $mode, implicit $exec
    ; GFX1200-NEXT: $vgpr0 = V_ADD_F32_e32 $vgpr2, $vgpr3, implicit $mode, implicit $exec
    $vgpr1 = V_COS_F32_e32 $vgpr0, implicit $mode, implicit $exec
    $vgpr0 = V_ADD_F32_e32 $vgpr2, $vgpr3, implicit $mode, implicit $exec
...

# V_COS_F32 reads $vgpr0 and the second V_ADD_F32 overwrites it, but another
# V_ADD_F32 that does not touch $vgpr0 sits in between. The shared GCN checks
# expect no V_NOP on either target, i.e. the output equals the input.
---
name:            trans_reads_valu_valu_writes_hazard_covered
body:            |
  bb.0:
    ; GCN-LABEL: name: trans_reads_valu_valu_writes_hazard_covered
    ; GCN: $vgpr1 = V_COS_F32_e32 $vgpr0, implicit $mode, implicit $exec
    ; GCN-NEXT: $vgpr2 = V_ADD_F32_e32 $vgpr2, $vgpr3, implicit $mode, implicit $exec
    ; GCN-NEXT: $vgpr0 = V_ADD_F32_e32 $vgpr4, $vgpr2, implicit $mode, implicit $exec
    $vgpr1 = V_COS_F32_e32 $vgpr0, implicit $mode, implicit $exec
    $vgpr2 = V_ADD_F32_e32 $vgpr2, $vgpr3, implicit $mode, implicit $exec
    $vgpr0 = V_ADD_F32_e32 $vgpr4, $vgpr2, implicit $mode, implicit $exec
...

# V_COS_F32 reads $vgpr0, an S_ADD_U32 follows, and then V_ADD_F32 overwrites
# $vgpr0. The gfx1250 checks still expect a V_NOP, placed after the S_ADD_U32
# and directly before the V_ADD_F32; the gfx1200 checks expect no change.
# NOTE(review): the double underscore in the function name looks unintentional
# (compare trans_writes_salu_valu_reads_hazard) - confirm before renaming, as
# the autogenerated -LABEL lines must match the name.
---
name:            trans_reads__salu_valu_writes_hazard
body:            |
  bb.0:
    ; GFX1250-LABEL: name: trans_reads__salu_valu_writes_hazard
    ; GFX1250: $vgpr1 = V_COS_F32_e32 $vgpr0, implicit $mode, implicit $exec
    ; GFX1250-NEXT: $sgpr2 = S_ADD_U32 $sgpr0, $sgpr1, implicit-def $scc
    ; GFX1250-NEXT: V_NOP_e32 implicit $exec
    ; GFX1250-NEXT: $vgpr0 = V_ADD_F32_e32 $vgpr4, $vgpr2, implicit $mode, implicit $exec
    ;
    ; GFX1200-LABEL: name: trans_reads__salu_valu_writes_hazard
    ; GFX1200: $vgpr1 = V_COS_F32_e32 $vgpr0, implicit $mode, implicit $exec
    ; GFX1200-NEXT: $sgpr2 = S_ADD_U32 $sgpr0, $sgpr1, implicit-def $scc
    ; GFX1200-NEXT: $vgpr0 = V_ADD_F32_e32 $vgpr4, $vgpr2, implicit $mode, implicit $exec
    $vgpr1 = V_COS_F32_e32 $vgpr0, implicit $mode, implicit $exec
    $sgpr2 = S_ADD_U32 $sgpr0, $sgpr1, implicit-def $scc
    $vgpr0 = V_ADD_F32_e32 $vgpr4, $vgpr2, implicit $mode, implicit $exec
...

# V_COS_F32 writes $vgpr1 and the immediately following V_SQRT_F32 reads it.
# Unlike the V_ADD_F32 consumer cases in this file, the shared GCN checks
# expect no V_NOP on either target.
---
name:            trans_writes_trans_reads_no_hazard
body:            |
  bb.0:
    ; GCN-LABEL: name: trans_writes_trans_reads_no_hazard
    ; GCN: $vgpr1 = V_COS_F32_e32 $vgpr0, implicit $mode, implicit $exec
    ; GCN-NEXT: $vgpr2 = V_SQRT_F32_e32 $vgpr1, implicit $mode, implicit $exec
    $vgpr1 = V_COS_F32_e32 $vgpr0, implicit $mode, implicit $exec
    $vgpr2 = V_SQRT_F32_e32 $vgpr1, implicit $mode, implicit $exec
...

# V_COS_F32 reads $vgpr0 and the immediately following V_SQRT_F32 overwrites
# it. Unlike the V_ADD_F32 writer cases in this file, the shared GCN checks
# expect no V_NOP on either target.
---
name:            trans_reads_trans_writes_no_hazard
body:            |
  bb.0:
    ; GCN-LABEL: name: trans_reads_trans_writes_no_hazard
    ; GCN: $vgpr1 = V_COS_F32_e32 $vgpr0, implicit $mode, implicit $exec
    ; GCN-NEXT: $vgpr0 = V_SQRT_F32_e32 $vgpr2, implicit $mode, implicit $exec
    $vgpr1 = V_COS_F32_e32 $vgpr0, implicit $mode, implicit $exec
    $vgpr0 = V_SQRT_F32_e32 $vgpr2, implicit $mode, implicit $exec
...