1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
|
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 3
; RUN: llc < %s -mtriple=x86_64-unknown-unknown | FileCheck %s
; Function with a cold profile count: %dup should not be duplicated into its predecessors.
define i32 @cold(i32 %a, ptr %p, ptr %q) !prof !21 {
; Profile inputs: !prof !21 supplies this function's entry count, and both
; conditional branches below carry !prof !30.
; Expected layout asserted below: %dup is emitted exactly once (.LBB0_3).
; %true1 falls through into it and %false1 reaches it with an explicit jmp.
; CHECK-LABEL: cold:
; CHECK: # %bb.0: # %entry
; CHECK-NEXT: cmpl $2, %edi
; CHECK-NEXT: jl .LBB0_2
; CHECK-NEXT: # %bb.1: # %true1
; CHECK-NEXT: movl (%rsi), %eax
; CHECK-NEXT: addl $2, %eax
; CHECK-NEXT: .LBB0_3: # %dup
; CHECK-NEXT: cmpl $5, %eax
; CHECK-NEXT: jl .LBB0_5
; CHECK-NEXT: # %bb.4: # %true2
; CHECK-NEXT: xorl %edi, %eax
; CHECK-NEXT: retq
; CHECK-NEXT: .LBB0_2: # %false1
; CHECK-NEXT: movl (%rdx), %eax
; CHECK-NEXT: addl $-3, %eax
; CHECK-NEXT: jmp .LBB0_3
; CHECK-NEXT: .LBB0_5: # %false2
; CHECK-NEXT: andl %edi, %eax
; CHECK-NEXT: retq
entry:
; First diamond: signed test a > 1 selects which pointer is loaded.
%cond1 = icmp sgt i32 %a, 1
br i1 %cond1, label %true1, label %false1, !prof !30
true1:
; a > 1: v2 = *p + 2
%v1 = load i32, ptr %p, align 4
%v2 = add i32 %v1, 2
br label %dup
false1:
; a <= 1: v4 = *q - 3
%v3 = load i32, ptr %q, align 4
%v4 = sub i32 %v3, 3
br label %dup
dup:
; Join block with two predecessors; this is the block whose duplication the
; test is about. It merges the two values and branches on signed v5 > 4.
%v5 = phi i32 [%v2, %true1], [%v4, %false1]
%cond2 = icmp sgt i32 %v5, 4
br i1 %cond2, label %true2, label %false2, !prof !30
true2:
; v5 > 4: result is v5 ^ a
%v6 = xor i32 %v5, %a
br label %exit
false2:
; v5 <= 4: result is v5 & a
%v7 = and i32 %v5, %a
br label %exit
exit:
; Common return; in the expected output each arm ends in its own retq.
%v8 = phi i32 [%v6, %true2], [%v7, %false2]
ret i32 %v8
}
; Same code as the previous function, but with a hot profile count,
; so %dup should be duplicated into its predecessors.
define i32 @hot(i32 %a, ptr %p, ptr %q) !prof !22 {
; Profile inputs: !prof !22 supplies this function's entry count, and both
; conditional branches below carry !prof !30.
; Expected layout asserted below: there is no standalone %dup block. The
; "cmpl $5, %eax" compare appears once after %true1 and once after %false1.
; The %true1 copy jumps to %true2 on >= 5 and otherwise falls through into
; %false2; the %false1 copy jumps to %false2 on < 5 and otherwise falls
; through into %true2.
; CHECK-LABEL: hot:
; CHECK: # %bb.0: # %entry
; CHECK-NEXT: cmpl $2, %edi
; CHECK-NEXT: jl .LBB1_2
; CHECK-NEXT: # %bb.1: # %true1
; CHECK-NEXT: movl (%rsi), %eax
; CHECK-NEXT: addl $2, %eax
; CHECK-NEXT: cmpl $5, %eax
; CHECK-NEXT: jge .LBB1_4
; CHECK-NEXT: .LBB1_5: # %false2
; CHECK-NEXT: andl %edi, %eax
; CHECK-NEXT: retq
; CHECK-NEXT: .LBB1_2: # %false1
; CHECK-NEXT: movl (%rdx), %eax
; CHECK-NEXT: addl $-3, %eax
; CHECK-NEXT: cmpl $5, %eax
; CHECK-NEXT: jl .LBB1_5
; CHECK-NEXT: .LBB1_4: # %true2
; CHECK-NEXT: xorl %edi, %eax
; CHECK-NEXT: retq
entry:
; First diamond: signed test a > 1 selects which pointer is loaded.
%cond1 = icmp sgt i32 %a, 1
br i1 %cond1, label %true1, label %false1, !prof !30
true1:
; a > 1: v2 = *p + 2
%v1 = load i32, ptr %p, align 4
%v2 = add i32 %v1, 2
br label %dup
false1:
; a <= 1: v4 = *q - 3
%v3 = load i32, ptr %q, align 4
%v4 = sub i32 %v3, 3
br label %dup
dup:
; Join block with two predecessors; the expected output above shows its
; compare-and-branch copied into both of them.
%v5 = phi i32 [%v2, %true1], [%v4, %false1]
%cond2 = icmp sgt i32 %v5, 4
br i1 %cond2, label %true2, label %false2, !prof !30
true2:
; v5 > 4: result is v5 ^ a
%v6 = xor i32 %v5, %a
br label %exit
false2:
; v5 <= 4: result is v5 & a
%v7 = and i32 %v5, %a
br label %exit
exit:
; Common return; in the expected output each arm ends in its own retq.
%v8 = phi i32 [%v6, %true2], [%v7, %false2]
ret i32 %v8
}
; Module-level profile data. The only module flag is the ProfileSummary (!1).
!llvm.module.flags = !{!1}
; Entry count attached to @cold.
!21 = !{!"function_entry_count", i64 10}
; Entry count attached to @hot.
!22 = !{!"function_entry_count", i64 400}
; Equal 1:1 weights, used by every conditional branch in both functions, so
; the two functions differ only in their entry counts.
!30 = !{!"branch_weights", i32 1, i32 1}
; ProfileSummary module flag; its payload is the field list !2.
!1 = !{i32 1, !"ProfileSummary", !2}
; Summary fields !3 through !10, each a (name, value) pair.
!2 = !{!3, !4, !5, !6, !7, !8, !9, !10}
!3 = !{!"ProfileFormat", !"InstrProf"}
!4 = !{!"TotalCount", i64 10000}
!5 = !{!"MaxCount", i64 10}
!6 = !{!"MaxInternalCount", i64 1}
!7 = !{!"MaxFunctionCount", i64 1000}
!8 = !{!"NumCounts", i64 3}
!9 = !{!"NumFunctions", i64 3}
; Detailed summary: a list of three entries (!12, !13, !14).
; NOTE(review): each entry is presumably (cutoff scaled by 1,000,000,
; minimum count at that cutoff, number of counts) - confirm against the LLVM
; profile summary documentation.
; NOTE(review): with these entries an entry count of 400 (@hot) presumably
; meets the hot threshold (min count 100) while 10 (@cold) does not - confirm
; against the default cutoffs used by the profile summary analysis.
!10 = !{!"DetailedSummary", !11}
!11 = !{!12, !13, !14}
!12 = !{i32 10000, i64 100, i32 1}
!13 = !{i32 999000, i64 100, i32 1}
!14 = !{i32 999999, i64 1, i32 2}
|