aboutsummaryrefslogtreecommitdiff
path: root/llvm/test/CodeGen/PowerPC/cse-despite-rounding-mode.ll
blob: 876213736190f83bff1a2916b4ac14f195669a53 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
; The non-strictfp version of test/CodeGen/PowerPC/respect-rounding-mode.ll
; Without strictfp, CSE should be free to eliminate the repeated multiply
; and conversion instructions.
; RUN: llc -verify-machineinstrs --mtriple powerpc64le-unknown-linux-gnu \
; RUN:   -mcpu=pwr8 -ppc-asm-full-reg-names < %s | grep 'xvrdpic' | count 2
; RUN: llc -verify-machineinstrs --mtriple powerpc-unknown-linux-gnu \
; RUN:   -mcpu=pwr9 -ppc-asm-full-reg-names < %s | grep 'xvrdpic' | count 2
; RUN: llc -verify-machineinstrs --mtriple powerpc64le-unknown-linux-gnu \
; RUN:   -mcpu=pwr10 -ppc-asm-full-reg-names < %s | grep 'xvrdpic' | count 2

; RUN: llc -verify-machineinstrs --mtriple powerpc64le-unknown-linux-gnu \
; RUN:   -mcpu=pwr8 -ppc-asm-full-reg-names < %s | grep 'xvmuldp' | count 2
; RUN: llc -verify-machineinstrs --mtriple powerpc-unknown-linux-gnu \
; RUN:   -mcpu=pwr9 -ppc-asm-full-reg-names < %s | grep 'xvmuldp' | count 2
; RUN: llc -verify-machineinstrs --mtriple powerpc64le-unknown-linux-gnu \
; RUN:   -mcpu=pwr10 -ppc-asm-full-reg-names < %s | grep 'xvmuldp' | count 2
@IndirectCallPtr = dso_local local_unnamed_addr global ptr null, align 8

define dso_local signext i32 @func1() local_unnamed_addr #0 {
entry:
  tail call void @directCall() #0
  %0 = tail call <2 x double> @llvm.experimental.constrained.rint.v2f64(<2 x double> <double -9.990000e+01, double 9.990000e+01>, metadata !"round.dynamic", metadata !"fpexcept.ignore") #0
  %vecext = extractelement <2 x double> %0, i32 0
  %sub = tail call double @llvm.experimental.constrained.fsub.f64(double %vecext, double -9.900000e+01, metadata !"round.dynamic", metadata !"fpexcept.ignore") #0
  %conv = tail call i32 @llvm.experimental.constrained.fptosi.i32.f64(double %sub, metadata !"fpexcept.ignore") #0
  tail call void @directCall() #0
  %1 = tail call <2 x double> @llvm.experimental.constrained.rint.v2f64(<2 x double> <double -9.990000e+01, double 9.990000e+01>, metadata !"round.dynamic", metadata !"fpexcept.ignore") #0
  %vecext3 = extractelement <2 x double> %1, i32 1
  %cmp = tail call i1 @llvm.experimental.constrained.fcmp.f64(double %vecext3, double 9.900000e+01, metadata !"une", metadata !"fpexcept.ignore") #0
  br i1 %cmp, label %if.then, label %if.end

if.then:                                          ; preds = %entry
  tail call void @exit(i32 signext 2) #0
  unreachable

if.end:                                           ; preds = %entry
  ret i32 %conv
}

declare void @directCall(...) local_unnamed_addr

declare double @llvm.experimental.constrained.fsub.f64(double, double, metadata, metadata)

declare i32 @llvm.experimental.constrained.fptosi.i32.f64(double, metadata)

declare i1 @llvm.experimental.constrained.fcmp.f64(double, double, metadata, metadata)

declare void @exit(i32 signext) local_unnamed_addr

define dso_local signext i32 @func2() local_unnamed_addr #0 {
entry:
  %call = tail call <2 x double> @getvector1() #0
  %call1 = tail call <2 x double> @getvector2() #0
  tail call void @directCall() #0
  %mul = tail call <2 x double> @llvm.experimental.constrained.fmul.v2f64(<2 x double> %call, <2 x double> %call1, metadata !"round.dynamic", metadata !"fpexcept.ignore") #0
  %vecext = extractelement <2 x double> %mul, i32 0
  %cmp = tail call i1 @llvm.experimental.constrained.fcmp.f64(double %vecext, double 4.000000e+00, metadata !"oeq", metadata !"fpexcept.ignore") #0
  br i1 %cmp, label %cleanup, label %if.end

if.end:                                           ; preds = %entry
  tail call void @directCall() #0
  %mul10 = tail call <2 x double> @llvm.experimental.constrained.fmul.v2f64(<2 x double> %call, <2 x double> %call1, metadata !"round.dynamic", metadata !"fpexcept.ignore") #0
  %0 = tail call i32 @llvm.ppc.vsx.xvcmpeqdp.p(i32 2, <2 x double> %mul, <2 x double> %mul10) #0
  br label %cleanup

cleanup:                                          ; preds = %entry, %if.end
  %retval.0 = phi i32 [ %0, %if.end ], [ 11, %entry ]
  ret i32 %retval.0
}

declare <2 x double> @getvector1(...) local_unnamed_addr

declare <2 x double> @getvector2(...) local_unnamed_addr

declare <2 x double> @llvm.experimental.constrained.fmul.v2f64(<2 x double>, <2 x double>, metadata, metadata)

declare i32 @llvm.ppc.vsx.xvcmpeqdp.p(i32, <2 x double>, <2 x double>)

define dso_local signext i32 @func3() local_unnamed_addr #0 {
entry:
  %0 = load ptr, ptr @IndirectCallPtr, align 8
  tail call void %0() #0
  %1 = tail call <2 x double> @llvm.experimental.constrained.rint.v2f64(<2 x double> <double -9.990000e+01, double 9.990000e+01>, metadata !"round.dynamic", metadata !"fpexcept.ignore") #0
  %vecext = extractelement <2 x double> %1, i32 0
  %sub = tail call double @llvm.experimental.constrained.fsub.f64(double %vecext, double -9.900000e+01, metadata !"round.dynamic", metadata !"fpexcept.ignore") #0
  %conv = tail call i32 @llvm.experimental.constrained.fptosi.i32.f64(double %sub, metadata !"fpexcept.ignore") #0
  %2 = load ptr, ptr @IndirectCallPtr, align 8
  tail call void %2() #0
  %3 = tail call <2 x double> @llvm.experimental.constrained.rint.v2f64(<2 x double> <double -9.990000e+01, double 9.990000e+01>, metadata !"round.dynamic", metadata !"fpexcept.ignore") #0
  %vecext4 = extractelement <2 x double> %3, i32 1
  %cmp = tail call i1 @llvm.experimental.constrained.fcmp.f64(double %vecext4, double 9.900000e+01, metadata !"une", metadata !"fpexcept.ignore") #0
  br i1 %cmp, label %if.then, label %if.end

if.then:                                          ; preds = %entry
  tail call void @exit(i32 signext 2) #0
  unreachable

if.end:                                           ; preds = %entry
  ret i32 %conv
}

define dso_local signext i32 @func4() local_unnamed_addr #0 {
entry:
  %call = tail call <2 x double> @getvector1() #0
  %call1 = tail call <2 x double> @getvector2() #0
  %0 = load ptr, ptr @IndirectCallPtr, align 8
  tail call void %0() #0
  %mul = tail call <2 x double> @llvm.experimental.constrained.fmul.v2f64(<2 x double> %call, <2 x double> %call1, metadata !"round.dynamic", metadata !"fpexcept.ignore") #0
  %vecext = extractelement <2 x double> %mul, i32 0
  %cmp = tail call i1 @llvm.experimental.constrained.fcmp.f64(double %vecext, double 4.000000e+00, metadata !"oeq", metadata !"fpexcept.ignore") #0
  br i1 %cmp, label %cleanup, label %if.end

if.end:                                           ; preds = %entry
  %1 = load ptr, ptr @IndirectCallPtr, align 8
  tail call void %1() #0
  %mul11 = tail call <2 x double> @llvm.experimental.constrained.fmul.v2f64(<2 x double> %call, <2 x double> %call1, metadata !"round.dynamic", metadata !"fpexcept.ignore") #0
  %2 = tail call i32 @llvm.ppc.vsx.xvcmpeqdp.p(i32 2, <2 x double> %mul, <2 x double> %mul11) #0
  br label %cleanup

cleanup:                                          ; preds = %entry, %if.end
  %retval.0 = phi i32 [ %2, %if.end ], [ 11, %entry ]
  ret i32 %retval.0
}

declare <2 x double> @llvm.experimental.constrained.rint.v2f64(<2 x double>, metadata, metadata)

attributes #0 = { nounwind }