diff options
Diffstat (limited to 'llvm/test/Transforms')
24 files changed, 1259 insertions, 732 deletions
| diff --git a/llvm/test/Transforms/InstSimplify/ConstProp/vecreduce.ll b/llvm/test/Transforms/InstSimplify/ConstProp/vecreduce.ll index 77a7f0d..479b3f8 100644 --- a/llvm/test/Transforms/InstSimplify/ConstProp/vecreduce.ll +++ b/llvm/test/Transforms/InstSimplify/ConstProp/vecreduce.ll @@ -12,8 +12,7 @@ define i32 @add_0() {  define i32 @add_0_scalable_vector() {  ; CHECK-LABEL: @add_0_scalable_vector( -; CHECK-NEXT:    [[X:%.*]] = call i32 @llvm.vector.reduce.add.nxv8i32(<vscale x 8 x i32> zeroinitializer) -; CHECK-NEXT:    ret i32 [[X]] +; CHECK-NEXT:    ret i32 0  ;    %x = call i32 @llvm.vector.reduce.add.nxv8i32(<vscale x 8 x i32> zeroinitializer)    ret i32 %x @@ -89,8 +88,7 @@ define i32 @add_poison() {  define i32 @add_poison_scalable_vector() {  ; CHECK-LABEL: @add_poison_scalable_vector( -; CHECK-NEXT:    [[X:%.*]] = call i32 @llvm.vector.reduce.add.nxv8i32(<vscale x 8 x i32> poison) -; CHECK-NEXT:    ret i32 [[X]] +; CHECK-NEXT:    ret i32 poison  ;    %x = call i32 @llvm.vector.reduce.add.nxv8i32(<vscale x 8 x i32> poison)    ret i32 %x @@ -123,8 +121,7 @@ define i32 @mul_0() {  define i32 @mul_0_scalable_vector() {  ; CHECK-LABEL: @mul_0_scalable_vector( -; CHECK-NEXT:    [[X:%.*]] = call i32 @llvm.vector.reduce.mul.nxv8i32(<vscale x 8 x i32> zeroinitializer) -; CHECK-NEXT:    ret i32 [[X]] +; CHECK-NEXT:    ret i32 0  ;    %x = call i32 @llvm.vector.reduce.mul.nxv8i32(<vscale x 8 x i32> zeroinitializer)    ret i32 %x @@ -140,13 +137,29 @@ define i32 @mul_1() {  define i32 @mul_1_scalable_vector() {  ; CHECK-LABEL: @mul_1_scalable_vector( -; CHECK-NEXT:    [[X:%.*]] = call i32 @llvm.vector.reduce.mul.nxv8i32(<vscale x 8 x i32> splat (i32 1)) -; CHECK-NEXT:    ret i32 [[X]] +; CHECK-NEXT:    ret i32 1  ;    %x = call i32 @llvm.vector.reduce.mul.nxv8i32(<vscale x 8 x i32> splat (i32 1))    ret i32 %x  } +define i32 @mul_2() { +; CHECK-LABEL: @mul_2( +; CHECK-NEXT:    ret i32 256 +; +  %x = call i32 @llvm.vector.reduce.mul.v8i32(<8 x i32> <i32 2, i32 2, i32 2, i32 2, i32 2, i32 2, i32 2, i32 2>) +  ret i32 %x +} + +define i32 @mul_2_scalable_vector() { +; CHECK-LABEL: @mul_2_scalable_vector( +; CHECK-NEXT:    [[X:%.*]] = call i32 @llvm.vector.reduce.mul.nxv8i32(<vscale x 8 x i32> splat (i32 2)) +; CHECK-NEXT:    ret i32 [[X]] +; +  %x = call i32 @llvm.vector.reduce.mul.nxv8i32(<vscale x 8 x i32> splat (i32 2)) +  ret i32 %x +} +  define i32 @mul_inc() {  ; CHECK-LABEL: @mul_inc(  ; CHECK-NEXT:    ret i32 40320 @@ -200,8 +213,7 @@ define i32 @mul_poison() {  define i32 @mul_poison_scalable_vector() {  ; CHECK-LABEL: @mul_poison_scalable_vector( -; CHECK-NEXT:    [[X:%.*]] = call i32 @llvm.vector.reduce.mul.nxv8i32(<vscale x 8 x i32> poison) -; CHECK-NEXT:    ret i32 [[X]] +; CHECK-NEXT:    ret i32 poison  ;    %x = call i32 @llvm.vector.reduce.mul.nxv8i32(<vscale x 8 x i32> poison)    ret i32 %x @@ -225,8 +237,7 @@ define i32 @and_0() {  define i32 @and_0_scalable_vector() {  ; CHECK-LABEL: @and_0_scalable_vector( -; CHECK-NEXT:    [[X:%.*]] = call i32 @llvm.vector.reduce.and.nxv8i32(<vscale x 8 x i32> zeroinitializer) -; CHECK-NEXT:    ret i32 [[X]] +; CHECK-NEXT:    ret i32 0  ;    %x = call i32 @llvm.vector.reduce.and.nxv8i32(<vscale x 8 x i32> zeroinitializer)    ret i32 %x @@ -242,8 +253,7 @@ define i32 @and_1() {  define i32 @and_1_scalable_vector() {  ; CHECK-LABEL: @and_1_scalable_vector( -; CHECK-NEXT:    [[X:%.*]] = call i32 @llvm.vector.reduce.and.nxv8i32(<vscale x 8 x i32> splat (i32 1)) -; CHECK-NEXT:    ret i32 [[X]] +; CHECK-NEXT:    ret i32 1  ;    %x = call i32 @llvm.vector.reduce.and.nxv8i32(<vscale x 8 x i32> splat (i32 1))    ret i32 %x @@ -302,8 +312,7 @@ define i32 @and_poison() {  define i32 @and_poison_scalable_vector() {  ; CHECK-LABEL: @and_poison_scalable_vector( -; CHECK-NEXT:    [[X:%.*]] = call i32 @llvm.vector.reduce.and.nxv8i32(<vscale x 8 x i32> poison) -; CHECK-NEXT:    ret i32 [[X]] +; CHECK-NEXT:    ret i32 poison  ;    %x = call i32 @llvm.vector.reduce.and.nxv8i32(<vscale x 8 x i32> poison)    ret i32 %x @@ -327,8 +336,7 @@ define i32 @or_0() {  define i32 @or_0_scalable_vector() {  ; CHECK-LABEL: @or_0_scalable_vector( -; CHECK-NEXT:    [[X:%.*]] = call i32 @llvm.vector.reduce.or.nxv8i32(<vscale x 8 x i32> zeroinitializer) -; CHECK-NEXT:    ret i32 [[X]] +; CHECK-NEXT:    ret i32 0  ;    %x = call i32 @llvm.vector.reduce.or.nxv8i32(<vscale x 8 x i32> zeroinitializer)    ret i32 %x @@ -344,8 +352,7 @@ define i32 @or_1() {  define i32 @or_1_scalable_vector() {  ; CHECK-LABEL: @or_1_scalable_vector( -; CHECK-NEXT:    [[X:%.*]] = call i32 @llvm.vector.reduce.or.nxv8i32(<vscale x 8 x i32> splat (i32 1)) -; CHECK-NEXT:    ret i32 [[X]] +; CHECK-NEXT:    ret i32 1  ;    %x = call i32 @llvm.vector.reduce.or.nxv8i32(<vscale x 8 x i32> splat (i32 1))    ret i32 %x @@ -404,8 +411,7 @@ define i32 @or_poison() {  define i32 @or_poison_scalable_vector() {  ; CHECK-LABEL: @or_poison_scalable_vector( -; CHECK-NEXT:    [[X:%.*]] = call i32 @llvm.vector.reduce.or.nxv8i32(<vscale x 8 x i32> poison) -; CHECK-NEXT:    ret i32 [[X]] +; CHECK-NEXT:    ret i32 poison  ;    %x = call i32 @llvm.vector.reduce.or.nxv8i32(<vscale x 8 x i32> poison)    ret i32 %x @@ -429,8 +435,7 @@ define i32 @xor_0() {  define i32 @xor_0_scalable_vector() {  ; CHECK-LABEL: @xor_0_scalable_vector( -; CHECK-NEXT:    [[X:%.*]] = call i32 @llvm.vector.reduce.xor.nxv8i32(<vscale x 8 x i32> zeroinitializer) -; CHECK-NEXT:    ret i32 [[X]] +; CHECK-NEXT:    ret i32 0  ;    %x = call i32 @llvm.vector.reduce.xor.nxv8i32(<vscale x 8 x i32> zeroinitializer)    ret i32 %x @@ -446,13 +451,21 @@ define i32 @xor_1() {  define i32 @xor_1_scalable_vector() {  ; CHECK-LABEL: @xor_1_scalable_vector( -; CHECK-NEXT:    [[X:%.*]] = call i32 @llvm.vector.reduce.xor.nxv8i32(<vscale x 8 x i32> splat (i32 1)) -; CHECK-NEXT:    ret i32 [[X]] +; CHECK-NEXT:    ret i32 0  ;    %x = call i32 @llvm.vector.reduce.xor.nxv8i32(<vscale x 8 x i32> splat(i32 1))    ret i32 %x  } +define i32 @xor_1_scalable_vector_lane_count_not_known_even() { +; CHECK-LABEL: @xor_1_scalable_vector_lane_count_not_known_even( +; CHECK-NEXT:    [[X:%.*]] = call i32 @llvm.vector.reduce.xor.nxv1i32(<vscale x 1 x i32> splat (i32 1)) +; CHECK-NEXT:    ret i32 [[X]] +; +  %x = call i32 @llvm.vector.reduce.xor.nxv8i32(<vscale x 1 x i32> splat(i32 1)) +  ret i32 %x +} +  define i32 @xor_inc() {  ; CHECK-LABEL: @xor_inc(  ; CHECK-NEXT:    ret i32 10 @@ -506,8 +519,7 @@ define i32 @xor_poison() {  define i32 @xor_poison_scalable_vector() {  ; CHECK-LABEL: @xor_poison_scalable_vector( -; CHECK-NEXT:    [[X:%.*]] = call i32 @llvm.vector.reduce.xor.nxv8i32(<vscale x 8 x i32> poison) -; CHECK-NEXT:    ret i32 [[X]] +; CHECK-NEXT:    ret i32 poison  ;    %x = call i32 @llvm.vector.reduce.xor.nxv8i32(<vscale x 8 x i32> poison)    ret i32 %x @@ -531,8 +543,7 @@ define i32 @smin_0() {  define i32 @smin_0_scalable_vector() {  ; CHECK-LABEL: @smin_0_scalable_vector( -; CHECK-NEXT:    [[X:%.*]] = call i32 @llvm.vector.reduce.smin.nxv8i32(<vscale x 8 x i32> zeroinitializer) -; CHECK-NEXT:    ret i32 [[X]] +; CHECK-NEXT:    ret i32 0  ;    %x = call i32 @llvm.vector.reduce.smin.nxv8i32(<vscale x 8 x i32> zeroinitializer)    ret i32 %x @@ -548,8 +559,7 @@ define i32 @smin_1() {  define i32 @smin_1_scalable_vector() {  ; CHECK-LABEL: @smin_1_scalable_vector( -; CHECK-NEXT:    [[X:%.*]] = call i32 @llvm.vector.reduce.smin.nxv8i32(<vscale x 8 x i32> splat (i32 1)) -; CHECK-NEXT:    ret i32 [[X]] +; CHECK-NEXT:    ret i32 1  ;    %x = call i32 @llvm.vector.reduce.smin.nxv8i32(<vscale x 8 x i32> splat(i32 1))    ret i32 %x @@ -608,8 +618,7 @@ define i32 @smin_poison() {  define i32 @smin_poison_scalable_vector() {  ; CHECK-LABEL: @smin_poison_scalable_vector( -; CHECK-NEXT:    [[X:%.*]] = call i32 @llvm.vector.reduce.smin.nxv8i32(<vscale x 8 x i32> poison) -; CHECK-NEXT:    ret i32 [[X]] +; CHECK-NEXT:    ret i32 poison  ;    %x = call i32 @llvm.vector.reduce.smin.nxv8i32(<vscale x 8 x i32> poison)    ret i32 %x @@ -633,8 +642,7 @@ define i32 @smax_0() {  define i32 @smax_0_scalable_vector() {  ; CHECK-LABEL: @smax_0_scalable_vector( -; CHECK-NEXT:    [[X:%.*]] = call i32 @llvm.vector.reduce.smax.nxv8i32(<vscale x 8 x i32> zeroinitializer) -; CHECK-NEXT:    ret i32 [[X]] +; CHECK-NEXT:    ret i32 0  ;    %x = call i32 @llvm.vector.reduce.smax.nxv8i32(<vscale x 8 x i32> zeroinitializer)    ret i32 %x @@ -650,8 +658,7 @@ define i32 @smax_1() {  define i32 @smax_1_scalable_vector() {  ; CHECK-LABEL: @smax_1_scalable_vector( -; CHECK-NEXT:    [[X:%.*]] = call i32 @llvm.vector.reduce.smax.nxv8i32(<vscale x 8 x i32> splat (i32 1)) -; CHECK-NEXT:    ret i32 [[X]] +; CHECK-NEXT:    ret i32 1  ;    %x = call i32 @llvm.vector.reduce.smax.nxv8i32(<vscale x 8 x i32> splat(i32 1))    ret i32 %x @@ -710,8 +717,7 @@ define i32 @smax_poison() {  define i32 @smax_poison_scalable_vector() {  ; CHECK-LABEL: @smax_poison_scalable_vector( -; CHECK-NEXT:    [[X:%.*]] = call i32 @llvm.vector.reduce.smax.nxv8i32(<vscale x 8 x i32> poison) -; CHECK-NEXT:    ret i32 [[X]] +; CHECK-NEXT:    ret i32 poison  ;    %x = call i32 @llvm.vector.reduce.smax.nxv8i32(<vscale x 8 x i32> poison)    ret i32 %x @@ -735,8 +741,7 @@ define i32 @umin_0() {  define i32 @umin_0_scalable_vector() {  ; CHECK-LABEL: @umin_0_scalable_vector( -; CHECK-NEXT:    [[X:%.*]] = call i32 @llvm.vector.reduce.umin.nxv8i32(<vscale x 8 x i32> zeroinitializer) -; CHECK-NEXT:    ret i32 [[X]] +; CHECK-NEXT:    ret i32 0  ;    %x = call i32 @llvm.vector.reduce.umin.nxv8i32(<vscale x 8 x i32> zeroinitializer)    ret i32 %x @@ -752,8 +757,7 @@ define i32 @umin_1() {  define i32 @umin_1_scalable_vector() {  ; CHECK-LABEL: @umin_1_scalable_vector( -; CHECK-NEXT:    [[X:%.*]] = call i32 @llvm.vector.reduce.umin.nxv8i32(<vscale x 8 x i32> splat (i32 1)) -; CHECK-NEXT:    ret i32 [[X]] +; CHECK-NEXT:    ret i32 1  ;    %x = call i32 @llvm.vector.reduce.umin.nxv8i32(<vscale x 8 x i32> splat (i32 1))    ret i32 %x @@ -812,8 +816,7 @@ define i32 @umin_poison() {  define i32 @umin_poison_scalable_vector() {  ; CHECK-LABEL: @umin_poison_scalable_vector( -; CHECK-NEXT:    [[X:%.*]] = call i32 @llvm.vector.reduce.umin.nxv8i32(<vscale x 8 x i32> poison) -; CHECK-NEXT:    ret i32 [[X]] +; CHECK-NEXT:    ret i32 poison  ;    %x = call i32 @llvm.vector.reduce.umin.nxv8i32(<vscale x 8 x i32> poison)    ret i32 %x @@ -837,8 +840,7 @@ define i32 @umax_0() {  define i32 @umax_0_scalable_vector() {  ; CHECK-LABEL: @umax_0_scalable_vector( -; CHECK-NEXT:    [[X:%.*]] = call i32 @llvm.vector.reduce.umax.nxv8i32(<vscale x 8 x i32> zeroinitializer) -; CHECK-NEXT:    ret i32 [[X]] +; CHECK-NEXT:    ret i32 0  ;    %x = call i32 @llvm.vector.reduce.umax.nxv8i32(<vscale x 8 x i32> zeroinitializer)    ret i32 %x @@ -854,8 +856,7 @@ define i32 @umax_1() {  define i32 @umax_1_scalable_vector() {  ; CHECK-LABEL: @umax_1_scalable_vector( -; CHECK-NEXT:    [[X:%.*]] = call i32 @llvm.vector.reduce.umax.nxv8i32(<vscale x 8 x i32> splat (i32 1)) -; CHECK-NEXT:    ret i32 [[X]] +; CHECK-NEXT:    ret i32 1  ;    %x = call i32 @llvm.vector.reduce.umax.nxv8i32(<vscale x 8 x i32> splat(i32 1))    ret i32 %x @@ -914,8 +915,7 @@ define i32 @umax_poison() {  define i32 @umax_poison_scalable_vector() {  ; CHECK-LABEL: @umax_poison_scalable_vector( -; CHECK-NEXT:    [[X:%.*]] = call i32 @llvm.vector.reduce.umax.nxv8i32(<vscale x 8 x i32> poison) -; CHECK-NEXT:    ret i32 [[X]] +; CHECK-NEXT:    ret i32 poison  ;    %x = call i32 @llvm.vector.reduce.umax.nxv8i32(<vscale x 8 x i32> poison)    ret i32 %x diff --git a/llvm/test/Transforms/LoopUnroll/peel-branch-weights-freq.ll b/llvm/test/Transforms/LoopUnroll/branch-weights-freq/peel.ll index 1339afe..1339afe 100644 --- a/llvm/test/Transforms/LoopUnroll/peel-branch-weights-freq.ll +++ b/llvm/test/Transforms/LoopUnroll/branch-weights-freq/peel.ll diff --git a/llvm/test/Transforms/LoopUnroll/branch-weights-freq/unroll-epilog.ll b/llvm/test/Transforms/LoopUnroll/branch-weights-freq/unroll-epilog.ll new file mode 100644 index 0000000..96b31d8 --- /dev/null +++ b/llvm/test/Transforms/LoopUnroll/branch-weights-freq/unroll-epilog.ll @@ -0,0 +1,160 @@ +; Test branch weight metadata, estimated trip count metadata, and block +; frequencies after loop unrolling with an epilogue. + +; ------------------------------------------------------------------------------ +; Define substitutions. +; +; Check original loop body frequency. +; DEFINE: %{bf-fc} = opt %s -S -passes='print<block-freq>' 2>&1 | \ +; DEFINE:   FileCheck %s -check-prefixes +; +; Unroll loops and then check block frequency.  The -implicit-check-not options +; make sure that no additional labels or @f calls show up. +; DEFINE: %{ur-bf} = opt %s -S -passes='loop-unroll,print<block-freq>' 2>&1 +; DEFINE: %{fc} = FileCheck %s \ +; DEFINE:     -implicit-check-not='{{^( *- )?[^ ;]*:}}' \ +; DEFINE:     -implicit-check-not='call void @f' -check-prefixes + +; ------------------------------------------------------------------------------ +; Check various interesting unroll count values relative to the original loop's +; estimated trip count of 11 (e.g., minimum and boundary values). +; +; RUN: %{bf-fc} ALL,ORIG +; RUN: %{ur-bf} -unroll-count=2 -unroll-runtime | %{fc} ALL,UR,UR2 +; RUN: %{ur-bf} -unroll-count=4 -unroll-runtime | %{fc} ALL,UR,UR4 +; RUN: %{ur-bf} -unroll-count=10 -unroll-runtime | %{fc} ALL,UR,UR10 +; RUN: %{ur-bf} -unroll-count=11 -unroll-runtime | %{fc} ALL,UR,UR11 +; RUN: %{ur-bf} -unroll-count=12 -unroll-runtime | %{fc} ALL,UR,UR12 + +; ------------------------------------------------------------------------------ +; Check the iteration frequencies, which, when each is multiplied by the number +; of original loop bodies that execute within it, should sum to almost exactly +; the original loop body frequency. +; +; ALL-LABEL: block-frequency-info: test +; +;      ORIG: - [[ENTRY:.*]]: +;      ORIG: - [[DO_BODY:.*]]: float = 11.0, +;      ORIG: - [[DO_END:.*]]: +; +;        UR: - [[ENTRY:.*]]: +;        UR: - [[ENTRY_NEW:.*]]: +;       UR2: - [[DO_BODY:.*]]: float = 5.2381, +;       UR4: - [[DO_BODY:.*]]: float = 2.3702, +;      UR10: - [[DO_BODY:.*]]: float = 0.6902, +;      UR11: - [[DO_BODY:.*]]: float = 0.59359, +;      UR12: - [[DO_BODY:.*]]: float = 0.5144, +;        UR: - [[DO_END_UNR_LCSSA:.*]]: +;        UR: - [[DO_BODY_EPIL_PREHEADER:.*]]: +;       UR2: - [[DO_BODY_EPIL:.*]]: float = 0.52381, +;       UR4: - [[DO_BODY_EPIL:.*]]: float = 1.5193, +;      UR10: - [[DO_BODY_EPIL:.*]]: float = 4.098, +;      UR11: - [[DO_BODY_EPIL:.*]]: float = 4.4705, +;      UR12: - [[DO_BODY_EPIL:.*]]: float = 4.8272, +;       UR4: - [[DO_END_EPILOG_LCSSA:.*]]: +;      UR10: - [[DO_END_EPILOG_LCSSA:.*]]: +;      UR11: - [[DO_END_EPILOG_LCSSA:.*]]: +;      UR12: - [[DO_END_EPILOG_LCSSA:.*]]: +;        UR: - [[DO_END:.*]]: + +; ------------------------------------------------------------------------------ +; Check the CFGs, including the number of original loop bodies that appear +; within each unrolled iteration. +; +;      UR-LABEL: define void @test(i32 %{{.*}}) { +;            UR: [[ENTRY]]: +;            UR:   br i1 %{{.*}}, label %[[DO_BODY_EPIL_PREHEADER]], label %[[ENTRY_NEW]], !prof ![[#PROF_UR_GUARD:]]{{$}} +;            UR: [[ENTRY_NEW]]: +;            UR:   br label %[[DO_BODY]] +;            UR: [[DO_BODY]]: +;   UR2-COUNT-2:   call void @f +;   UR4-COUNT-4:   call void @f +; UR10-COUNT-10:   call void @f +; UR11-COUNT-11:   call void @f +; UR12-COUNT-12:   call void @f +;            UR:   br i1 %{{.*}}, label %[[DO_END_UNR_LCSSA]], label %[[DO_BODY]], !prof ![[#PROF_UR_LATCH:]], !llvm.loop ![[#LOOP_UR_LATCH:]]{{$}} +;            UR: [[DO_END_UNR_LCSSA]]: +;            UR:   br i1 %{{.*}}, label %[[DO_BODY_EPIL_PREHEADER]], label %[[DO_END:.*]], !prof ![[#PROF_RM_GUARD:]]{{$}} +;            UR: [[DO_BODY_EPIL_PREHEADER]]: +;            UR:   br label %[[DO_BODY_EPIL]] +;            UR: [[DO_BODY_EPIL]]: +;            UR:   call void @f +;           UR4:   br i1 %{{.*}}, label %[[DO_BODY_EPIL]], label %[[DO_END_EPILOG_LCSSA]], !prof ![[#PROF_RM_LATCH:]], !llvm.loop ![[#LOOP_RM_LATCH:]]{{$}} +;          UR10:   br i1 %{{.*}}, label %[[DO_BODY_EPIL]], label %[[DO_END_EPILOG_LCSSA]], !prof ![[#PROF_RM_LATCH:]], !llvm.loop ![[#LOOP_RM_LATCH:]]{{$}} +;          UR11:   br i1 %{{.*}}, label %[[DO_BODY_EPIL]], label %[[DO_END_EPILOG_LCSSA]], !prof ![[#PROF_RM_LATCH:]], !llvm.loop ![[#LOOP_RM_LATCH:]]{{$}} +;          UR12:   br i1 %{{.*}}, label %[[DO_BODY_EPIL]], label %[[DO_END_EPILOG_LCSSA]], !prof ![[#PROF_RM_LATCH:]], !llvm.loop ![[#LOOP_RM_LATCH:]]{{$}} +;           UR4: [[DO_END_EPILOG_LCSSA]]: +;          UR10: [[DO_END_EPILOG_LCSSA]]: +;          UR11: [[DO_END_EPILOG_LCSSA]]: +;          UR12: [[DO_END_EPILOG_LCSSA]]: +;            UR:   br label %[[DO_END]] +;            UR: [[DO_END]]: +;            UR:   ret void + +declare void @f(i32) + +define void @test(i32 %n) { +entry: +  br label %do.body + +do.body: +  %i = phi i32 [ 0, %entry ], [ %inc, %do.body ] +  %inc = add i32 %i, 1 +  call void @f(i32 %i) +  %c = icmp sge i32 %inc, %n +  br i1 %c, label %do.end, label %do.body, !prof !0 + +do.end: +  ret void +} + +!0 = !{!"branch_weights", i32 1, i32 10} + +; ------------------------------------------------------------------------------ +; Check branch weight metadata and estimated trip count metadata. +; +;  UR2: ![[#PROF_UR_GUARD]] = !{!"branch_weights", i32 195225786, i32 1952257862} +;  UR4: ![[#PROF_UR_GUARD]] = !{!"branch_weights", i32 534047398, i32 1613436250} +; UR10: ![[#PROF_UR_GUARD]] = !{!"branch_weights", i32 1236740947, i32 910742701} +; UR11: ![[#PROF_UR_GUARD]] = !{!"branch_weights", i32 1319535738, i32 827947910} +; UR12: ![[#PROF_UR_GUARD]] = !{!"branch_weights", i32 1394803730, i32 752679918} +; +;  UR2: ![[#PROF_UR_LATCH]] = !{!"branch_weights", i32 372703773, i32 1774779875} +;  UR4: ![[#PROF_UR_LATCH]] = !{!"branch_weights", i32 680723421, i32 1466760227} +; UR10: ![[#PROF_UR_LATCH]] = !{!"branch_weights", i32 1319535738, i32 827947910} +; UR11: ![[#PROF_UR_LATCH]] = !{!"branch_weights", i32 1394803730, i32 752679918} +; UR12: ![[#PROF_UR_LATCH]] = !{!"branch_weights", i32 1463229177, i32 684254471} +; +;  UR2: ![[#LOOP_UR_LATCH]] = distinct !{![[#LOOP_UR_LATCH]], ![[#LOOP_UR_TC:]], ![[#DISABLE:]]} +;  UR4: ![[#LOOP_UR_LATCH]] = distinct !{![[#LOOP_UR_LATCH]], ![[#LOOP_UR_TC:]], ![[#DISABLE:]]} +; UR10: ![[#LOOP_UR_LATCH]] = distinct !{![[#LOOP_UR_LATCH]], ![[#LOOP_UR_TC:]], ![[#DISABLE:]]} +; UR11: ![[#LOOP_UR_LATCH]] = distinct !{![[#LOOP_UR_LATCH]], ![[#LOOP_UR_TC:]], ![[#DISABLE:]]} +; UR12: ![[#LOOP_UR_LATCH]] = distinct !{![[#LOOP_UR_LATCH]], ![[#LOOP_UR_TC:]], ![[#DISABLE:]]} +; +;  UR2: ![[#LOOP_UR_TC]] = !{!"llvm.loop.estimated_trip_count", i32 5} +;  UR4: ![[#LOOP_UR_TC]] = !{!"llvm.loop.estimated_trip_count", i32 2} +; UR10: ![[#LOOP_UR_TC]] = !{!"llvm.loop.estimated_trip_count", i32 1} +; UR11: ![[#LOOP_UR_TC]] = !{!"llvm.loop.estimated_trip_count", i32 1} +; UR12: ![[#LOOP_UR_TC]] = !{!"llvm.loop.estimated_trip_count", i32 0} +;   UR: ![[#DISABLE]] = !{!"llvm.loop.unroll.disable"} +; +;  UR2: ![[#PROF_RM_GUARD]] = !{!"branch_weights", i32 1022611260, i32 1124872388} +;  UR4: ![[#PROF_RM_GUARD]] = !{!"branch_weights", i32 1531603292, i32 615880356} +; UR10: ![[#PROF_RM_GUARD]] = !{!"branch_weights", i32 1829762672, i32 317720976} +; UR11: ![[#PROF_RM_GUARD]] = !{!"branch_weights", i32 1846907894, i32 300575754} +; UR12: ![[#PROF_RM_GUARD]] = !{!"branch_weights", i32 1860963812, i32 286519836} +; +;  UR4: ![[#PROF_RM_LATCH]] = !{!"branch_weights", i32 1038564635, i32 1108919013} +; UR10: ![[#PROF_RM_LATCH]] = !{!"branch_weights", i32 1656332913, i32 491150735} +; UR11: ![[#PROF_RM_LATCH]] = !{!"branch_weights", i32 1693034047, i32 454449601} +; UR12: ![[#PROF_RM_LATCH]] = !{!"branch_weights", i32 1723419551, i32 424064097} + +;  UR4: ![[#LOOP_RM_LATCH]] = distinct !{![[#LOOP_RM_LATCH]], ![[#LOOP_RM_TC:]], ![[#DISABLE:]]} +; UR10: ![[#LOOP_RM_LATCH]] = distinct !{![[#LOOP_RM_LATCH]], ![[#LOOP_UR_TC:]], ![[#DISABLE:]]} +; UR11: ![[#LOOP_RM_LATCH]] = distinct !{![[#LOOP_RM_LATCH]], ![[#LOOP_RM_TC:]], ![[#DISABLE:]]} +; UR12: ![[#LOOP_RM_LATCH]] = distinct !{![[#LOOP_RM_LATCH]], ![[#LOOP_RM_TC:]], ![[#DISABLE:]]} +; +;  UR4: ![[#LOOP_RM_TC]] = !{!"llvm.loop.estimated_trip_count", i32 3} +; For UR10, llvm.loop.estimated_trip_count is the same for both loops. +; UR11: ![[#LOOP_RM_TC]] = !{!"llvm.loop.estimated_trip_count", i32 0} +; UR12: ![[#LOOP_RM_TC]] = !{!"llvm.loop.estimated_trip_count", i32 11} diff --git a/llvm/test/Transforms/LoopUnroll/branch-weights-freq/unroll-partial.ll b/llvm/test/Transforms/LoopUnroll/branch-weights-freq/unroll-partial.ll new file mode 100644 index 0000000..cde9d46 --- /dev/null +++ b/llvm/test/Transforms/LoopUnroll/branch-weights-freq/unroll-partial.ll @@ -0,0 +1,68 @@ +; Test branch weight metadata, estimated trip count metadata, and block +; frequencies after partial loop unrolling without -unroll-runtime. + +; RUN: opt < %s -S -passes='print<block-freq>' 2>&1 | \ +; RUN:   FileCheck -check-prefix=CHECK %s + +; The -implicit-check-not options make sure that no additional labels or calls +; to @f show up. +; RUN: opt < %s -S -passes='loop-unroll,print<block-freq>' \ +; RUN:     -unroll-count=4 2>&1 | \ +; RUN:   FileCheck %s -check-prefix=CHECK-UR \ +; RUN:       -implicit-check-not='{{^( *- )?[^ ;]*:}}' \ +; RUN:       -implicit-check-not='call void @f' + +; CHECK: block-frequency-info: test +; CHECK: do.body: float = 10.0, + +; The sum should still be ~10. +; +; CHECK-UR: block-frequency-info: test +; CHECK-UR: - [[ENTRY:.*]]: +; CHECK-UR: - [[DO_BODY:.*]]: float = 2.9078, +; CHECK-UR: - [[DO_BODY_1:.*]]: float = 2.617, +; CHECK-UR: - [[DO_BODY_2:.*]]: float = 2.3553, +; CHECK-UR: - [[DO_BODY_3:.*]]: float = 2.1198, +; CHECK-UR: - [[DO_END:.*]]: + +declare void @f(i32) + +define void @test(i32 %n) { +; CHECK-UR-LABEL: define void @test(i32 %{{.*}}) { +;       CHECK-UR: [[ENTRY]]: +;       CHECK-UR:   br label %[[DO_BODY]] +;       CHECK-UR: [[DO_BODY]]: +;       CHECK-UR:   call void @f +;       CHECK-UR:   br i1 %{{.*}}, label %[[DO_END]], label %[[DO_BODY_1]], !prof ![[#PROF:]] +;       CHECK-UR: [[DO_BODY_1]]: +;       CHECK-UR:   call void @f +;       CHECK-UR:   br i1 %{{.*}}, label %[[DO_END]], label %[[DO_BODY_2]], !prof ![[#PROF]] +;       CHECK-UR: [[DO_BODY_2]]: +;       CHECK-UR:   call void @f +;       CHECK-UR:   br i1 %{{.*}}, label %[[DO_END]], label %[[DO_BODY_3]], !prof ![[#PROF]] +;       CHECK-UR: [[DO_BODY_3]]: +;       CHECK-UR:   call void @f +;       CHECK-UR:   br i1 %{{.*}}, label %[[DO_END]], label %[[DO_BODY]], !prof ![[#PROF]], !llvm.loop ![[#LOOP_UR_LATCH:]] +;       CHECK-UR: [[DO_END]]: +;       CHECK-UR:   ret void + +entry: +  br label %do.body + +do.body: +  %i = phi i32 [ 0, %entry ], [ %inc, %do.body ] +  %inc = add i32 %i, 1 +  call void @f(i32 %i) +  %c = icmp sge i32 %inc, %n +  br i1 %c, label %do.end, label %do.body, !prof !0 + +do.end: +  ret void +} + +!0 = !{!"branch_weights", i32 1, i32 9} + +; CHECK-UR: ![[#PROF]] = !{!"branch_weights", i32 1, i32 9} +; CHECK-UR: ![[#LOOP_UR_LATCH]] = distinct !{![[#LOOP_UR_LATCH]], ![[#LOOP_UR_TC:]], ![[#DISABLE:]]} +; CHECK-UR: ![[#LOOP_UR_TC]] = !{!"llvm.loop.estimated_trip_count", i32 3} +; CHECK-UR: ![[#DISABLE]] = !{!"llvm.loop.unroll.disable"} diff --git a/llvm/test/Transforms/LoopUnroll/runtime-exit-phi-scev-invalidation.ll b/llvm/test/Transforms/LoopUnroll/runtime-exit-phi-scev-invalidation.ll index 0c52b5a0..0473601 100644 --- a/llvm/test/Transforms/LoopUnroll/runtime-exit-phi-scev-invalidation.ll +++ b/llvm/test/Transforms/LoopUnroll/runtime-exit-phi-scev-invalidation.ll @@ -188,7 +188,7 @@ define void @pr56286(i64 %x, ptr %src, ptr %dst, ptr %ptr.src) !prof !0 {  ; CHECK-NEXT:    [[L_1_LCSSA_UNR:%.*]] = phi i32 [ poison, [[OUTER_HEADER]] ], [ [[L_1_LCSSA_UNR_PH]], [[INNER_1_HEADER_PROL_LOOPEXIT_UNR_LCSSA]] ]  ; CHECK-NEXT:    [[INNER_1_IV_UNR:%.*]] = phi i64 [ [[X]], [[OUTER_HEADER]] ], [ [[INNER_1_IV_UNR_PH]], [[INNER_1_HEADER_PROL_LOOPEXIT_UNR_LCSSA]] ]  ; CHECK-NEXT:    [[TMP4:%.*]] = icmp ult i64 [[TMP3]], 7 -; CHECK-NEXT:    br i1 [[TMP4]], label [[OUTER_MIDDLE:%.*]], label [[OUTER_HEADER_NEW:%.*]], !prof [[PROF3]] +; CHECK-NEXT:    br i1 [[TMP4]], label [[OUTER_MIDDLE:%.*]], label [[OUTER_HEADER_NEW:%.*]], !prof [[PROF6:![0-9]+]]  ; CHECK:       outer.header.new:  ; CHECK-NEXT:    br label [[INNER_1_HEADER:%.*]]  ; CHECK:       inner.1.header: @@ -232,7 +232,7 @@ define void @pr56286(i64 %x, ptr %src, ptr %dst, ptr %ptr.src) !prof !0 {  ; CHECK-NEXT:    store i32 [[L_1_7]], ptr [[DST]], align 8  ; CHECK-NEXT:    [[INNER_1_IV_NEXT_7]] = add i64 [[INNER_1_IV]], 8  ; CHECK-NEXT:    [[CMP_2_7:%.*]] = icmp sgt i64 [[INNER_1_IV_NEXT_6]], 0 -; CHECK-NEXT:    br i1 [[CMP_2_7]], label [[OUTER_MIDDLE_UNR_LCSSA:%.*]], label [[INNER_1_HEADER]], !prof [[PROF6:![0-9]+]], !llvm.loop [[LOOP7:![0-9]+]] +; CHECK-NEXT:    br i1 [[CMP_2_7]], label [[OUTER_MIDDLE_UNR_LCSSA:%.*]], label [[INNER_1_HEADER]], !prof [[PROF7:![0-9]+]], !llvm.loop [[LOOP8:![0-9]+]]  ; CHECK:       outer.middle.unr-lcssa:  ; CHECK-NEXT:    [[L_1_LCSSA_PH:%.*]] = phi i32 [ [[L_1_7]], [[INNER_1_LATCH_7]] ]  ; CHECK-NEXT:    br label [[OUTER_MIDDLE]] diff --git a/llvm/test/Transforms/LoopUnroll/runtime-loop-branchweight.ll b/llvm/test/Transforms/LoopUnroll/runtime-loop-branchweight.ll index 2617199..2f8f98d 100644 --- a/llvm/test/Transforms/LoopUnroll/runtime-loop-branchweight.ll +++ b/llvm/test/Transforms/LoopUnroll/runtime-loop-branchweight.ll @@ -2,12 +2,24 @@  ;; Check that the remainder loop is properly assigned a branch weight for its latch branch.  ; CHECK-LABEL: @test( -; CHECK-LABEL: for.body: -; CHECK: br i1 [[COND1:%.*]], label %for.end.loopexit.unr-lcssa, label %for.body, !prof ![[#PROF:]], !llvm.loop ![[#LOOP:]] -; CHECK-LABEL: for.body.epil: -; CHECK: br i1 [[COND2:%.*]], label  %for.body.epil, label %for.end.loopexit.epilog-lcssa, !prof ![[#PROF2:]], !llvm.loop ![[#LOOP2:]] -; CHECK: ![[#PROF]] = !{!"branch_weights", i32 1, i32 2499} -; CHECK: ![[#PROF2]] = !{!"branch_weights", i32 1, i32 1} +; CHECK-LABEL: entry: +;       CHECK: [[FOR_BODY_PREHEADER:.*]]: +;       CHECK:   br i1 %{{.*}}, label %[[FOR_BODY_EPIL_PREHEADER:.*]], label %[[FOR_BODY_PREHEADER_NEW:.*]], !prof ![[#PROF_UR_GUARD:]] +;       CHECK: [[FOR_BODY_PREHEADER_NEW]]: +;       CHECK:   br label %for.body +;       CHECK: for.body: +;       CHECK:   %add = add +;       CHECK:   %add.1 = add +;       CHECK:   %add.2 = add +;       CHECK:   %add.3 = add +;   CHECK-NOT:   %add.4 = add +;       CHECK:   br i1 %{{.*}}, label %[[FOR_END_LOOPEXIT_UNR_LCSSA:.*]], label %for.body, !prof ![[#PROF_UR_LATCH:]], !llvm.loop ![[#LOOP_UR_LATCH:]] +;       CHECK: [[FOR_END_LOOPEXIT_UNR_LCSSA]]: +;       CHECK:   br i1 %{{.*}}, label %[[FOR_BODY_EPIL_PREHEADER]], label %[[FOR_END_LOOPEXIT:.*]], !prof ![[#PROF_RM_GUARD:]] +;       CHECK: [[FOR_BODY_EPIL_PREHEADER]]: +;       CHECK:   br label %[[FOR_BODY_EPIL:.*]] +;       CHECK: [[FOR_BODY_EPIL]]: +;       CHECK:   br i1 {{.*}}, label %[[FOR_BODY_EPIL]], label %[[FOR_END_LOOPEXIT_EPILOG_LCSSA:.*]], !prof ![[#PROF_RM_LATCH:]], !llvm.loop ![[#LOOP_RM_LATCH:]]  define i3 @test(ptr %a, i3 %n) {  entry: @@ -31,3 +43,37 @@ for.end:  }  !0 = !{!"branch_weights", i32 1, i32 9999} + +; Original loop probability: p = 9999/(1+9999) = 0.9999 +; Original estimated trip count: (1+9999)/1 = 10000 +; Unroll count: 4 + +; Probability of >=3 iterations after first: p^3 = 0.9970003 =~ +; 2146839468 / (644180 + 2146839468). +; CHECK: ![[#PROF_UR_GUARD]] = !{!"branch_weights", i32 644180, i32 2146839468} + +; Probability of >=4 more iterations: p^4 = 0.99960006 =~ +; 2146624784 / (858864 + 2146624784). +; CHECK: ![[#PROF_UR_LATCH]] = !{!"branch_weights", i32 858864, i32 2146624784} + +; 10000//4 = 2500 +; CHECK: ![[#LOOP_UR_LATCH]] = distinct !{![[#LOOP_UR_LATCH]], ![[#LOOP_UR_TC:]], ![[#DISABLE:]]} +; CHECK: ![[#LOOP_UR_TC]] = !{!"llvm.loop.estimated_trip_count", i32 2500} +; +; CHECK: ![[#DISABLE]] = !{!"llvm.loop.unroll.disable"} + +; Probability of 1 to 3 more of 3 more remainder iterations: +; (p-p^4)/(1-p^4) = 0.749962497 =~ 1610532724 / (1610532724 + 536950924). +; CHECK: ![[#PROF_RM_GUARD]] = !{!"branch_weights", i32 1610532724, i32 536950924} + +; Frequency of first remainder iter:  r1 =                      1 +; Frequency of second remainder iter: r2 = r1*(p-p^3)/(1-p^3) = 0.666633331 +; Frequency of third remainder iter:  r3 = r2*(p-p^2)/(1-p^2) = 0.333299999 +; Solve for loop probability that produces that frequency: f = 1/(1-p') => +; p' = 1-1/f = 1-1/(r1+r2+r3) = 0.499983332 =~ +; 1073706403 / (1073706403 + 1073777245). +; CHECK: ![[#PROF_RM_LATCH]] = !{!"branch_weights", i32 1073706403, i32 1073777245} + +; 10000%4 = 0 +; CHECK: ![[#LOOP_RM_LATCH]] = distinct !{![[#LOOP_RM_LATCH]], ![[#LOOP_RM_TC:]], ![[#DISABLE:]]} +; CHECK: ![[#LOOP_RM_TC]] = !{!"llvm.loop.estimated_trip_count", i32 0} diff --git a/llvm/test/Transforms/LoopUnroll/runtime-loop.ll b/llvm/test/Transforms/LoopUnroll/runtime-loop.ll index 492de06..ec7aba4 100644 --- a/llvm/test/Transforms/LoopUnroll/runtime-loop.ll +++ b/llvm/test/Transforms/LoopUnroll/runtime-loop.ll @@ -295,11 +295,12 @@ exit2.loopexit:  ; COMMON-LABEL: {{^}}!0 =  ; EPILOG: [[EPILOG_PROF_0]] = !{!"branch_weights", i32 1, i32 11} -; EPILOG: [[EPILOG_PROF_1]] = !{!"branch_weights", i32 1, i32 127} -; EPILOG: [[EPILOG_PROF_2]] = !{!"branch_weights", i32 1, i32 7} -; EPILOG: [[EPILOG_PROF_3]] = !{!"branch_weights", i32 3, i32 1} +; EPILOG: [[EPILOG_PROF_1]] = !{!"branch_weights", i32 326124004, i32 1821359644} +; EPILOG: [[EPILOG_PROF_2]] = !{!"branch_weights", i32 1856428066, i32 291055582} +; EPILOG: [[EPILOG_PROF_3]] = !{!"branch_weights", i32 1597681585, i32 549802063} -; EPILOG: [[EPILOG_LOOP]] = distinct !{[[EPILOG_LOOP]], [[EPILOG_LOOP_1:![0-9]+]]} +; EPILOG: [[EPILOG_LOOP]] = distinct !{[[EPILOG_LOOP]], [[EPILOG_TC:![0-9]+]], [[EPILOG_LOOP_1:![0-9]+]]} +; EPILOG: [[EPILOG_TC]] = !{!"llvm.loop.estimated_trip_count", i32 3}  ; EPILOG: [[EPILOG_LOOP_1]] = !{!"llvm.loop.unroll.disable"}  ; PROLOG: [[PROLOG_PROF_0]] = !{!"branch_weights", i32 1, i32 11} diff --git a/llvm/test/Transforms/LoopUnroll/unroll-heuristics-pgo.ll b/llvm/test/Transforms/LoopUnroll/unroll-heuristics-pgo.ll index 611ee5f..02f5bf9 100644 --- a/llvm/test/Transforms/LoopUnroll/unroll-heuristics-pgo.ll +++ b/llvm/test/Transforms/LoopUnroll/unroll-heuristics-pgo.ll @@ -3,14 +3,27 @@  @known_constant = internal unnamed_addr constant [9 x i32] [i32 0, i32 -1, i32 0, i32 -1, i32 5, i32 -1, i32 0, i32 -1, i32 0], align 16  ; CHECK-LABEL: @bar_prof -; CHECK: loop: -; CHECK:   %mul = mul -; CHECK:   %mul.1 = mul -; CHECK:   %mul.2 = mul -; CHECK:   %mul.3 = mul -; CHECK:   br i1 %niter.ncmp.7, label %loop.end.unr-lcssa, label %loop, !prof [[PROF0:![0-9]+]] -; CHECK: loop.epil: -; CHECK:   br i1 %epil.iter.cmp, label %loop.epil, label %loop.end.epilog-lcssa, !prof [[PROF1:![0-9]+]], !llvm.loop {{![0-9]+}} +;       CHECK: entry: +;       CHECK:   br i1 %{{.*}}, label %[[LOOP_EPIL_PREHEADER:.*]], label %[[ENTRY_NEW:.*]], !prof ![[#PROF_UR_GUARD:]] +;       CHECK: [[ENTRY_NEW]]: +;       CHECK:   br label %loop +;       CHECK: loop: +;       CHECK:   %mul = mul +;       CHECK:   %mul.1 = mul +;       CHECK:   %mul.2 = mul +;       CHECK:   %mul.3 = mul +;       CHECK:   %mul.4 = mul +;       CHECK:   %mul.5 = mul +;       CHECK:   %mul.6 = mul +;       CHECK:   %mul.7 = mul +;   CHECK-NOT:   %mul.8 = mul +;       CHECK:   br i1 %{{.*}}, label %[[LOOP_END_UNR_LCSSA:.*]], label %loop, !prof ![[#PROF_UR_LATCH:]], !llvm.loop ![[#LOOP_UR_LATCH:]] +;       CHECK: [[LOOP_END_UNR_LCSSA]]: +;       CHECK:   br i1 %{{.*}}, label %[[LOOP_EPIL_PREHEADER]], label %loop.end, !prof ![[#PROF_RM_GUARD:]] +;       CHECK: [[LOOP_EPIL_PREHEADER]]: +;       CHECK:   br label %[[LOOP_EPIL:.*]] +;       CHECK: [[LOOP_EPIL]]: +;       CHECK:   br i1 %{{.*}}, label %[[LOOP_EPIL]], label %[[LOOP_END_EPILOG_LCSSA:.*]], !prof ![[#PROF_RM_LATCH:]], !llvm.loop ![[#LOOP_RM_LATCH:]]  define i32 @bar_prof(ptr noalias nocapture readonly %src, i64 %c) !prof !1 {  entry:    br label %loop @@ -60,5 +73,38 @@ loop.end:  !1 = !{!"function_entry_count", i64 1}  !2 = !{!"branch_weights", i32 1, i32 1000} -; CHECK: [[PROF0]] = !{!"branch_weights", i32 1, i32 124} -; CHECK: [[PROF1]] = !{!"branch_weights", i32 3, i32 1} +; Original loop probability: p = 1000/(1+1000) = 0.999000999 +; Original estimated trip count: (1+1000)/1 = 1001 +; Unroll count: 8 + +; Probability of >=7 iterations after first: p^7 = 0.993027916 =~ +; 2132511214 / (14972434 + 2132511214). +; CHECK: ![[#PROF_UR_GUARD]] = !{!"branch_weights", i32 14972434, i32 2132511214} + +; Probability of >=8 more iterations: p^8 = 0.99203588 =~ +; 2130380833 / (17102815 + 2130380833). +; CHECK: ![[#PROF_UR_LATCH]] = !{!"branch_weights", i32 17102815, i32 2130380833} + +; 1001//8 = 125 +; CHECK: ![[#LOOP_UR_LATCH]] = distinct !{![[#LOOP_UR_LATCH]], ![[#LOOP_UR_TC:]]} +; CHECK: ![[#LOOP_UR_TC]] = !{!"llvm.loop.estimated_trip_count", i32 125} + +; Probability of 1 to 7 more of 7 more remainder iterations: +; (p-p^8)/(1-p^8) = 0.874562282 =~ 1878108210 / (1878108210 + 269375438). +; CHECK: ![[#PROF_RM_GUARD]] = !{!"branch_weights", i32 1878108210, i32 269375438} + +; Frequency of first remainder iter:   r1 =                      1 +; Frequency of second remainder iter:  r2 = r1*(p-p^7)/(1-p^7) = 0.856714143 +; Frequency of third remainder iter:   r3 = r2*(p-p^6)/(1-p^6) = 0.713571429 +; Frequency of fourth remainder iter:  r4 = r2*(p-p^5)/(1-p^5) = 0.570571715 +; Frequency of fifth remainder iter:   r5 = r2*(p-p^4)/(1-p^4) = 0.427714858 +; Frequency of sixth remainder iter:   r6 = r2*(p-p^3)/(1-p^3) = 0.285000715 +; Frequency of seventh remainder iter: r7 = r2*(p-p^2)/(1-p^2) = 0.142429143 +; Solve for loop probability that produces that frequency: f = 1/(1-p') => +; p' = 1-1/f = 1-1/(r1+r2+r3+r4+r5+r6+r7) = 0.749749875 =~ +; 1610075606 / (1610075606 + 537408042). +; CHECK: ![[#PROF_RM_LATCH]] = !{!"branch_weights", i32 1610075606, i32 537408042} + +; Remainder estimated trip count: 1001%8 = 1 +; CHECK: ![[#LOOP_RM_LATCH]] = distinct !{![[#LOOP_RM_LATCH]], ![[#LOOP_RM_TC:]], ![[#DISABLE:]]} +; CHECK: ![[#LOOP_RM_TC]] = !{!"llvm.loop.estimated_trip_count", i32 1} diff --git a/llvm/test/Transforms/LoopVectorize/AArch64/replicating-load-store-costs.ll b/llvm/test/Transforms/LoopVectorize/AArch64/replicating-load-store-costs.ll index 7f34513..68cfc65 100644 --- a/llvm/test/Transforms/LoopVectorize/AArch64/replicating-load-store-costs.ll +++ b/llvm/test/Transforms/LoopVectorize/AArch64/replicating-load-store-costs.ll @@ -660,6 +660,114 @@ exit:    ret i32 %red  } + +define i32 @test_or_reduction_with_stride_2(i32 %scale, ptr %src) { +; CHECK-LABEL: define i32 @test_or_reduction_with_stride_2( +; CHECK-SAME: i32 [[SCALE:%.*]], ptr [[SRC:%.*]]) { +; CHECK-NEXT:  [[ENTRY:.*:]] +; CHECK-NEXT:    br label %[[VECTOR_PH:.*]] +; CHECK:       [[VECTOR_PH]]: +; CHECK-NEXT:    [[BROADCAST_SPLATINSERT:%.*]] = insertelement <16 x i32> poison, i32 [[SCALE]], i64 0 +; CHECK-NEXT:    [[BROADCAST_SPLAT:%.*]] = shufflevector <16 x i32> [[BROADCAST_SPLATINSERT]], <16 x i32> poison, <16 x i32> zeroinitializer +; CHECK-NEXT:    br label %[[VECTOR_BODY:.*]] +; CHECK:       [[VECTOR_BODY]]: +; CHECK-NEXT:    [[INDEX:%.*]] = phi i64 [ 0, %[[VECTOR_PH]] ], [ [[INDEX_NEXT:%.*]], %[[VECTOR_BODY]] ] +; CHECK-NEXT:    [[VEC_PHI:%.*]] = phi <16 x i32> [ zeroinitializer, %[[VECTOR_PH]] ], [ [[TMP66:%.*]], %[[VECTOR_BODY]] ] +; CHECK-NEXT:    [[OFFSET_IDX:%.*]] = mul i64 [[INDEX]], 2 +; CHECK-NEXT:    [[TMP0:%.*]] = add i64 [[OFFSET_IDX]], 0 +; CHECK-NEXT:    [[TMP1:%.*]] = add i64 [[OFFSET_IDX]], 2 +; CHECK-NEXT:    [[TMP2:%.*]] = add i64 [[OFFSET_IDX]], 4 +; CHECK-NEXT:    [[TMP3:%.*]] = add i64 [[OFFSET_IDX]], 6 +; CHECK-NEXT:    [[TMP4:%.*]] = add i64 [[OFFSET_IDX]], 8 +; CHECK-NEXT:    [[TMP5:%.*]] = add i64 [[OFFSET_IDX]], 10 +; CHECK-NEXT:    [[TMP6:%.*]] = add i64 [[OFFSET_IDX]], 12 +; CHECK-NEXT:    [[TMP7:%.*]] = add i64 [[OFFSET_IDX]], 14 +; CHECK-NEXT:    [[TMP8:%.*]] = add i64 [[OFFSET_IDX]], 16 +; CHECK-NEXT:    [[TMP9:%.*]] = add i64 [[OFFSET_IDX]], 18 +; CHECK-NEXT:    [[TMP10:%.*]] = add i64 [[OFFSET_IDX]], 20 +; CHECK-NEXT:    [[TMP11:%.*]] = add i64 [[OFFSET_IDX]], 22 +; CHECK-NEXT:    [[TMP12:%.*]] = add i64 [[OFFSET_IDX]], 24 +; CHECK-NEXT:    [[TMP13:%.*]] = add i64 [[OFFSET_IDX]], 26 +; CHECK-NEXT:    [[TMP14:%.*]] = add i64 [[OFFSET_IDX]], 28 +; CHECK-NEXT:    [[TMP15:%.*]] = add i64 [[OFFSET_IDX]], 30 +; CHECK-NEXT:    [[TMP16:%.*]] = getelementptr [32 x i8], ptr [[SRC]], i64 [[TMP0]] +; CHECK-NEXT:    [[TMP17:%.*]] = getelementptr [32 x i8], ptr [[SRC]], i64 [[TMP1]] +; CHECK-NEXT:    [[TMP18:%.*]] = getelementptr [32 x i8], ptr [[SRC]], i64 [[TMP2]] +; CHECK-NEXT:    [[TMP19:%.*]] = getelementptr [32 x i8], ptr [[SRC]], i64 [[TMP3]] +; CHECK-NEXT:    [[TMP20:%.*]] = getelementptr [32 x i8], ptr [[SRC]], i64 [[TMP4]] +; CHECK-NEXT:    [[TMP21:%.*]] = getelementptr [32 x i8], ptr [[SRC]], i64 [[TMP5]] +; CHECK-NEXT:    [[TMP22:%.*]] = getelementptr [32 x i8], ptr [[SRC]], i64 [[TMP6]] +; CHECK-NEXT:    [[TMP23:%.*]] = getelementptr [32 x i8], ptr [[SRC]], i64 [[TMP7]] +; CHECK-NEXT:    [[TMP24:%.*]] = getelementptr [32 x i8], ptr [[SRC]], i64 [[TMP8]] +; CHECK-NEXT:    [[TMP25:%.*]] = getelementptr [32 x i8], ptr [[SRC]], i64 [[TMP9]] +; CHECK-NEXT:    [[TMP26:%.*]] = getelementptr [32 x i8], ptr [[SRC]], i64 [[TMP10]] +; CHECK-NEXT:    [[TMP27:%.*]] = getelementptr [32 x i8], ptr [[SRC]], i64 [[TMP11]] +; CHECK-NEXT:    [[TMP28:%.*]] = getelementptr [32 x i8], ptr [[SRC]], i64 [[TMP12]] +; CHECK-NEXT:    [[TMP29:%.*]] = getelementptr [32 x i8], ptr [[SRC]], i64 [[TMP13]] +; CHECK-NEXT:    [[TMP30:%.*]] = getelementptr [32 x i8], ptr [[SRC]], i64 [[TMP14]] +; CHECK-NEXT:    [[TMP31:%.*]] = getelementptr [32 x i8], ptr [[SRC]], i64 [[TMP15]] +; CHECK-NEXT:    [[TMP32:%.*]] = load i8, ptr [[TMP16]], align 1 +; CHECK-NEXT:    [[TMP33:%.*]] = load i8, ptr [[TMP17]], align 1 +; CHECK-NEXT:    [[TMP34:%.*]] = load i8, ptr [[TMP18]], align 1 +; CHECK-NEXT:    [[TMP35:%.*]] = load i8, ptr [[TMP19]], align 1 +; CHECK-NEXT:    [[TMP36:%.*]] = load i8, ptr [[TMP20]], align 1 +; CHECK-NEXT:    [[TMP37:%.*]] = load i8, ptr [[TMP21]], align 1 +; CHECK-NEXT:    [[TMP38:%.*]] = load i8, ptr [[TMP22]], align 1 +; CHECK-NEXT:    [[TMP39:%.*]] = load i8, ptr [[TMP23]], align 1 +; CHECK-NEXT:    [[TMP40:%.*]] = load i8, ptr [[TMP24]], align 1 +; CHECK-NEXT:    [[TMP41:%.*]] = load i8, ptr [[TMP25]], align 1 +; CHECK-NEXT:    [[TMP42:%.*]] = load i8, ptr [[TMP26]], align 1 +; CHECK-NEXT:    [[TMP43:%.*]] = load i8, ptr [[TMP27]], align 1 +; CHECK-NEXT:    [[TMP44:%.*]] = load i8, ptr [[TMP28]], align 1 +; CHECK-NEXT:    [[TMP45:%.*]] = load i8, ptr [[TMP29]], align 1 +; CHECK-NEXT:    [[TMP46:%.*]] = load i8, ptr [[TMP30]], align 1 +; CHECK-NEXT:    [[TMP47:%.*]] = load i8, ptr [[TMP31]], align 1 +; CHECK-NEXT:    [[TMP48:%.*]] = insertelement <16 x i8> poison, i8 [[TMP32]], i32 0 +; CHECK-NEXT:    [[TMP49:%.*]] = insertelement <16 x i8> [[TMP48]], i8 [[TMP33]], i32 1 +; CHECK-NEXT:    [[TMP50:%.*]] = insertelement <16 x i8> [[TMP49]], i8 [[TMP34]], i32 2 +; CHECK-NEXT:    [[TMP51:%.*]] = insertelement <16 x i8> [[TMP50]], i8 [[TMP35]], i32 3 +; CHECK-NEXT:    [[TMP52:%.*]] = insertelement <16 x i8> [[TMP51]], i8 [[TMP36]], i32 4 +; CHECK-NEXT:    [[TMP53:%.*]] = insertelement <16 x i8> [[TMP52]], i8 [[TMP37]], i32 5 +; CHECK-NEXT:    [[TMP54:%.*]] = insertelement <16 x i8> [[TMP53]], i8 [[TMP38]], i32 6 +; CHECK-NEXT:    [[TMP55:%.*]] = insertelement <16 x i8> [[TMP54]], i8 [[TMP39]], i32 7 +; CHECK-NEXT:    [[TMP56:%.*]] = insertelement <16 x i8> [[TMP55]], i8 [[TMP40]], i32 8 +; CHECK-NEXT:    [[TMP57:%.*]] = insertelement <16 x i8> [[TMP56]], i8 [[TMP41]], i32 9 +; CHECK-NEXT:    [[TMP58:%.*]] = insertelement <16 x i8> [[TMP57]], i8 [[TMP42]], i32 10 +; CHECK-NEXT:    [[TMP59:%.*]] = insertelement <16 x i8> [[TMP58]], i8 [[TMP43]], i32 11 +; CHECK-NEXT:    [[TMP60:%.*]] = insertelement <16 x i8> [[TMP59]], i8 [[TMP44]], i32 12 +; CHECK-NEXT:    [[TMP61:%.*]] = insertelement <16 x i8> [[TMP60]], i8 [[TMP45]], i32 13 +; CHECK-NEXT:    [[TMP62:%.*]] = insertelement <16 x i8> [[TMP61]], i8 [[TMP46]], i32 14 +; CHECK-NEXT:    [[TMP63:%.*]] = insertelement <16 x i8> [[TMP62]], i8 [[TMP47]], i32 15 +; CHECK-NEXT:    [[TMP64:%.*]] = sext <16 x i8> [[TMP63]] to <16 x i32> +; CHECK-NEXT:    [[TMP65:%.*]] = mul <16 x i32> [[BROADCAST_SPLAT]], [[TMP64]] +; CHECK-NEXT:    [[TMP66]] = or <16 x i32> [[TMP65]], [[VEC_PHI]] +; CHECK-NEXT:    [[INDEX_NEXT]] = add nuw i64 [[INDEX]], 16 +; CHECK-NEXT:    [[TMP67:%.*]] = icmp eq i64 [[INDEX_NEXT]], 48 +; CHECK-NEXT:    br i1 [[TMP67]], label %[[MIDDLE_BLOCK:.*]], label %[[VECTOR_BODY]], !llvm.loop [[LOOP22:![0-9]+]] +; CHECK:       [[MIDDLE_BLOCK]]: +; CHECK-NEXT:    [[TMP68:%.*]] = call i32 @llvm.vector.reduce.or.v16i32(<16 x i32> [[TMP66]]) +; CHECK-NEXT:    br label %[[SCALAR_PH:.*]] +; CHECK:       [[SCALAR_PH]]: +; +entry: +  br label %loop + +loop: +  %iv = phi i64 [ %iv.next, %loop ], [ 0, %entry ] +  %reduction = phi i32 [ %reduction.next, %loop ], [ 0, %entry ] +  %gep = getelementptr [32 x i8], ptr %src, i64 %iv +  %load = load i8, ptr %gep, align 1 +  %sext = sext i8 %load to i32 +  %mul = mul i32 %scale, %sext +  %reduction.next = or i32 %mul, %reduction +  %iv.next = add i64 %iv, 2 +  %cmp = icmp eq i64 %iv.next, 100 +  br i1 %cmp, label %exit, label %loop + +exit: +  ret i32 %reduction.next +} +  attributes #0 = { "target-cpu"="neoverse-512tvb" }  !0 = !{!1, !2, i64 0} diff --git a/llvm/test/Transforms/LoopVectorize/X86/uniform_load.ll b/llvm/test/Transforms/LoopVectorize/X86/uniform_load.ll index d4004da..8081c0e 100644 --- a/llvm/test/Transforms/LoopVectorize/X86/uniform_load.ll +++ b/llvm/test/Transforms/LoopVectorize/X86/uniform_load.ll @@ -64,39 +64,24 @@ exit:  define void @uniform_load_can_fold_users(ptr noalias %src, ptr %dst, i64 %start, double %d) {  ; CHECK-LABEL: define void @uniform_load_can_fold_users(  ; CHECK-SAME: ptr noalias [[SRC:%.*]], ptr [[DST:%.*]], i64 [[START:%.*]], double [[D:%.*]]) { -; CHECK-NEXT:  [[ENTRY:.*:]] -; CHECK-NEXT:    [[TMP0:%.*]] = add i64 [[START]], 1 -; CHECK-NEXT:    [[SMIN:%.*]] = call i64 @llvm.smin.i64(i64 [[START]], i64 0) -; CHECK-NEXT:    [[TMP1:%.*]] = sub i64 [[TMP0]], [[SMIN]] -; CHECK-NEXT:    [[MIN_ITERS_CHECK:%.*]] = icmp ult i64 [[TMP1]], 2 -; CHECK-NEXT:    br i1 [[MIN_ITERS_CHECK]], [[SCALAR_PH:label %.*]], label %[[VECTOR_PH:.*]] -; CHECK:       [[VECTOR_PH]]: -; CHECK-NEXT:    [[N_MOD_VF:%.*]] = urem i64 [[TMP1]], 2 -; CHECK-NEXT:    [[N_VEC:%.*]] = sub i64 [[TMP1]], [[N_MOD_VF]] -; CHECK-NEXT:    [[TMP2:%.*]] = sub i64 [[START]], [[N_VEC]] -; CHECK-NEXT:    br label %[[VECTOR_BODY:.*]] -; CHECK:       [[VECTOR_BODY]]: -; CHECK-NEXT:    [[INDEX:%.*]] = phi i64 [ 0, %[[VECTOR_PH]] ], [ [[INDEX_NEXT:%.*]], %[[VECTOR_BODY]] ] -; CHECK-NEXT:    [[TMP3:%.*]] = add i64 [[INDEX]], 0 -; CHECK-NEXT:    [[TMP4:%.*]] = add i64 [[INDEX]], 1 +; CHECK-NEXT:  [[ENTRY:.*]]: +; CHECK-NEXT:    br label %[[LOOP:.*]] +; CHECK:       [[LOOP]]: +; CHECK-NEXT:    [[TMP4:%.*]] = phi i64 [ 0, %[[ENTRY]] ], [ [[IV_1_NEXT:%.*]], %[[LOOP]] ] +; CHECK-NEXT:    [[IV_2:%.*]] = phi i64 [ [[START]], %[[ENTRY]] ], [ [[IV_2_NEXT:%.*]], %[[LOOP]] ]  ; CHECK-NEXT:    [[TMP5:%.*]] = load double, ptr [[SRC]], align 8 -; CHECK-NEXT:    [[BROADCAST_SPLATINSERT:%.*]] = insertelement <2 x double> poison, double [[TMP5]], i64 0 -; CHECK-NEXT:    [[BROADCAST_SPLAT:%.*]] = shufflevector <2 x double> [[BROADCAST_SPLATINSERT]], <2 x double> poison, <2 x i32> zeroinitializer -; CHECK-NEXT:    [[TMP6:%.*]] = fmul <2 x double> [[BROADCAST_SPLAT]], splat (double 9.000000e+00) -; CHECK-NEXT:    [[TMP7:%.*]] = extractelement <2 x double> [[TMP6]], i32 0 +; CHECK-NEXT:    [[TMP7:%.*]] = fmul double [[TMP5]], 9.000000e+00  ; CHECK-NEXT:    [[TMP8:%.*]] = fdiv double [[TMP7]], [[D]] -; CHECK-NEXT:    [[TMP9:%.*]] = sub i64 [[TMP3]], 1  ; CHECK-NEXT:    [[TMP10:%.*]] = sub i64 [[TMP4]], 1 -; CHECK-NEXT:    [[TMP11:%.*]] = getelementptr double, ptr [[DST]], i64 [[TMP3]]  ; CHECK-NEXT:    [[TMP12:%.*]] = getelementptr double, ptr [[DST]], i64 [[TMP4]] -; CHECK-NEXT:    [[TMP13:%.*]] = getelementptr double, ptr [[TMP11]], i64 [[TMP9]]  ; CHECK-NEXT:    [[TMP14:%.*]] = getelementptr double, ptr [[TMP12]], i64 [[TMP10]] -; CHECK-NEXT:    store double [[TMP8]], ptr [[TMP13]], align 8  ; CHECK-NEXT:    store double [[TMP8]], ptr [[TMP14]], align 8 -; CHECK-NEXT:    [[INDEX_NEXT]] = add nuw i64 [[INDEX]], 2 -; CHECK-NEXT:    [[TMP15:%.*]] = icmp eq i64 [[INDEX_NEXT]], [[N_VEC]] -; CHECK-NEXT:    br i1 [[TMP15]], label %[[MIDDLE_BLOCK:.*]], label %[[VECTOR_BODY]], !llvm.loop [[LOOP3:![0-9]+]] -; CHECK:       [[MIDDLE_BLOCK]]: +; CHECK-NEXT:    [[IV_1_NEXT]] = add i64 [[TMP4]], 1 +; CHECK-NEXT:    [[IV_2_NEXT]] = add i64 [[IV_2]], -1 +; CHECK-NEXT:    [[EC:%.*]] = icmp sgt i64 [[IV_2]], 0 +; CHECK-NEXT:    br i1 [[EC]], label %[[LOOP]], label %[[EXIT:.*]] +; CHECK:       [[EXIT]]: +; CHECK-NEXT:    ret void  ;  entry:    br label %loop diff --git a/llvm/test/Transforms/LoopVectorize/single-scalar-cast-minbw.ll b/llvm/test/Transforms/LoopVectorize/single-scalar-cast-minbw.ll index 9a69982..70adac2 100644 --- a/llvm/test/Transforms/LoopVectorize/single-scalar-cast-minbw.ll +++ b/llvm/test/Transforms/LoopVectorize/single-scalar-cast-minbw.ll @@ -84,12 +84,8 @@ define void @single_scalar_cast_stored(ptr %src, ptr %dst, i32 %n) {  ; CHECK:       [[VECTOR_BODY]]:  ; CHECK-NEXT:    [[INDEX:%.*]] = phi i32 [ 0, %[[VECTOR_PH]] ], [ [[INDEX_NEXT:%.*]], %[[VECTOR_BODY]] ]  ; CHECK-NEXT:    [[TMP0:%.*]] = load i16, ptr [[SRC]], align 2, !alias.scope [[META4:![0-9]+]] -; CHECK-NEXT:    [[BROADCAST_SPLATINSERT:%.*]] = insertelement <4 x i16> poison, i16 [[TMP0]], i64 0 -; CHECK-NEXT:    [[BROADCAST_SPLAT:%.*]] = shufflevector <4 x i16> [[BROADCAST_SPLATINSERT]], <4 x i16> poison, <4 x i32> zeroinitializer -; CHECK-NEXT:    [[TMP1:%.*]] = icmp eq <4 x i16> [[BROADCAST_SPLAT]], zeroinitializer -; CHECK-NEXT:    [[TMP2:%.*]] = and <4 x i16> [[BROADCAST_SPLAT]], splat (i16 15) -; CHECK-NEXT:    [[TMP3:%.*]] = extractelement <4 x i1> [[TMP1]], i32 0 -; CHECK-NEXT:    [[TMP4:%.*]] = extractelement <4 x i16> [[TMP2]], i32 0 +; CHECK-NEXT:    [[TMP3:%.*]] = icmp eq i16 [[TMP0]], 0 +; CHECK-NEXT:    [[TMP4:%.*]] = and i16 [[TMP0]], 15  ; CHECK-NEXT:    [[TMP5:%.*]] = select i1 [[TMP3]], i16 0, i16 [[TMP4]]  ; CHECK-NEXT:    store i16 [[TMP5]], ptr [[DST]], align 2, !alias.scope [[META7:![0-9]+]], !noalias [[META4]]  ; CHECK-NEXT:    [[INDEX_NEXT]] = add nuw i32 [[INDEX]], 4 diff --git a/llvm/test/Transforms/LoopVectorize/vplan-printing-reductions.ll b/llvm/test/Transforms/LoopVectorize/vplan-printing-reductions.ll index 291ada8..ef678ff 100644 --- a/llvm/test/Transforms/LoopVectorize/vplan-printing-reductions.ll +++ b/llvm/test/Transforms/LoopVectorize/vplan-printing-reductions.ll @@ -804,9 +804,9 @@ exit:  define i32 @print_mulacc_extended_const(ptr %start, ptr %end) {  ; CHECK-LABEL: 'print_mulacc_extended_const'  ; CHECK:       VPlan 'Initial VPlan for VF={4},UF>=1' { -; CHECK-NEXT:  Live-in vp<%0> = VF -; CHECK-NEXT:  Live-in vp<%1> = VF * UF -; CHECK-NEXT:  Live-in vp<%2> = vector-trip-count +; CHECK-NEXT:  Live-in vp<[[VF:%.+]]> = VF +; CHECK-NEXT:  Live-in vp<[[VFxUF:%.+]]> = VF * UF +; CHECK-NEXT:  Live-in vp<[[VTC:%.+]]> = vector-trip-count  ; CHECK-NEXT:  vp<%3> = original trip-count  ; CHECK-EMPTY:  ; CHECK-NEXT:  ir-bb<entry>: @@ -814,107 +814,84 @@ define i32 @print_mulacc_extended_const(ptr %start, ptr %end) {  ; CHECK-NEXT:  Successor(s): scalar.ph, vector.ph  ; CHECK-EMPTY:  ; CHECK-NEXT:  vector.ph: -; CHECK-NEXT:    vp<%4> = DERIVED-IV ir<%start> + vp<%2> * ir<1> -; CHECK-NEXT:    EMIT vp<%5> = reduction-start-vector ir<0>, ir<0>, ir<1> +; CHECK-NEXT:    vp<[[DER_IV:%.+]]> = DERIVED-IV ir<%start> + vp<[[VTC]]> * ir<1> +; CHECK-NEXT:    EMIT vp<[[RDX_START:%.+]]> = reduction-start-vector ir<0>, ir<0>, ir<1>  ; CHECK-NEXT:  Successor(s): vector loop  ; CHECK-EMPTY:  ; CHECK-NEXT:  <x1> vector loop: {  ; CHECK-NEXT:    vector.body: -; CHECK-NEXT:      EMIT vp<%6> = CANONICAL-INDUCTION ir<0>, vp<%index.next> -; CHECK-NEXT:      WIDEN-REDUCTION-PHI ir<%red> = phi vp<%5>, vp<%9> -; CHECK-NEXT:      vp<%7> = SCALAR-STEPS vp<%6>, ir<1>, vp<%0> -; CHECK-NEXT:      EMIT vp<%next.gep> = ptradd ir<%start>, vp<%7> -; CHECK-NEXT:      vp<%8> = vector-pointer vp<%next.gep> -; CHECK-NEXT:      WIDEN ir<%l> = load vp<%8> -; CHECK-NEXT:      EXPRESSION vp<%9> = ir<%red> + reduce.add (mul (ir<%l> zext to i32), (ir<63> zext to i32)) -; CHECK-NEXT:      EMIT vp<%index.next> = add nuw vp<%6>, vp<%1> -; CHECK-NEXT:      EMIT branch-on-count vp<%index.next>, vp<%2> +; CHECK-NEXT:      EMIT vp<[[CAN_IV:%.+]]> = CANONICAL-INDUCTION ir<0>, vp<[[IV_NEXT:%.+]]> +; CHECK-NEXT:      WIDEN-REDUCTION-PHI ir<[[RDX:%.+]]> = phi vp<[[RDX_START]]>, vp<[[RDX_NEXT:%.+]]> +; CHECK-NEXT:      vp<[[STEPS:%.+]]> = SCALAR-STEPS vp<[[CAN_IV]]>, ir<1>, vp<[[VF]]> +; CHECK-NEXT:      EMIT vp<%next.gep> = ptradd ir<%start>, vp<[[STEPS]]> +; CHECK-NEXT:      vp<[[VEC_PTR:%.+]]> = vector-pointer vp<%next.gep> +; CHECK-NEXT:      WIDEN ir<%l> = load vp<[[VEC_PTR]]> +; CHECK-NEXT:      EXPRESSION vp<[[RDX_NEXT]]> = ir<[[RDX]]> + reduce.add (mul (ir<%l> zext to i32), (ir<63> zext to i32)) +; CHECK-NEXT:      EMIT vp<[[IV_NEXT]]> = add nuw vp<[[CAN_IV]]>, vp<[[VFxUF]]> +; CHECK-NEXT:      EMIT branch-on-count vp<[[IV_NEXT]]>, vp<[[VTC]]>  ; CHECK-NEXT:    No successors  ; CHECK-NEXT:  }  ; CHECK-NEXT:  Successor(s): middle.block  ; CHECK-EMPTY:  ; CHECK-NEXT:  middle.block: -; CHECK-NEXT:    EMIT vp<%11> = compute-reduction-result ir<%red>, vp<%9> -; CHECK-NEXT:    EMIT vp<%cmp.n> = icmp eq vp<%3>, vp<%2> +; CHECK-NEXT:    EMIT vp<%11> = compute-reduction-result ir<[[RDX]]>, vp<[[RDX_NEXT]]> +; CHECK-NEXT:    EMIT vp<%cmp.n> = icmp eq vp<%3>, vp<[[VTC]]>  ; CHECK-NEXT:    EMIT branch-on-cond vp<%cmp.n> -; CHECK-NEXT:  Successor(s): ir-bb<exit>, scalar.ph -; CHECK-EMPTY: -; CHECK-NEXT:  ir-bb<exit>: -; CHECK-NEXT:    IR   %red.next.lcssa = phi i32 [ %red.next, %loop ] (extra operand: vp<%11> from middle.block) -; CHECK-NEXT:  No successors -; CHECK-EMPTY: -; CHECK-NEXT:  scalar.ph: -; CHECK-NEXT:    EMIT-SCALAR vp<%bc.resume.val> = phi [ vp<%4>, middle.block ], [ ir<%start>, ir-bb<entry> ] -; CHECK-NEXT:    EMIT-SCALAR vp<%bc.merge.rdx> = phi [ vp<%11>, middle.block ], [ ir<0>, ir-bb<entry> ] -; CHECK-NEXT:  Successor(s): ir-bb<loop> -; CHECK-EMPTY: -; CHECK-NEXT:  ir-bb<loop>: -; CHECK-NEXT:    IR   %ptr.iv = phi ptr [ %start, %entry ], [ %gep.iv.next, %loop ] (extra operand: vp<%bc.resume.val> from scalar.ph) -; CHECK-NEXT:    IR   %red = phi i32 [ 0, %entry ], [ %red.next, %loop ] (extra operand: vp<%bc.merge.rdx> from scalar.ph) -; CHECK-NEXT:    IR   %l = load i8, ptr %ptr.iv, align 1 -; CHECK-NEXT:    IR   %l.ext = zext i8 %l to i32 -; CHECK-NEXT:    IR   %mul = mul i32 %l.ext, 63 -; CHECK-NEXT:    IR   %red.next = add i32 %red, %mul -; CHECK-NEXT:    IR   %gep.iv.next = getelementptr i8, ptr %ptr.iv, i64 1 -; CHECK-NEXT:    IR   %ec = icmp eq ptr %ptr.iv, %end -; CHECK-NEXT:  No successors -; CHECK-NEXT:  } -; CHECK:       VPlan 'Final VPlan for VF={4},UF={1}' { -; CHECK-NEXT:  Live-in ir<%1> = original trip-count +entry: +  br label %loop + +loop: +  %ptr.iv = phi ptr [ %start, %entry ], [ %gep.iv.next, %loop ] +  %red = phi i32 [ 0, %entry ], [ %red.next, %loop ] +  %l = load i8, ptr %ptr.iv, align 1 +  %l.ext = zext i8 %l to i32 +  %mul = mul i32 %l.ext, 63 +  %red.next = add i32 %red, %mul +  %gep.iv.next = getelementptr i8, ptr %ptr.iv, i64 1 +  %ec = icmp eq ptr %ptr.iv, %end +  br i1 %ec, label %exit, label %loop + +exit: +  ret i32 %red.next +} + +define i32 @print_mulacc_extended_const_lhs(ptr %start, ptr %end) { +; CHECK-LABEL: 'print_mulacc_extended_const_lhs' +; CHECK:       VPlan 'Initial VPlan for VF={4},UF>=1' { +; CHECK-NEXT:  Live-in vp<[[VF:%.+]]> = VF +; CHECK-NEXT:  Live-in vp<[[VFxUF:%.+]]> = VF * UF +; CHECK-NEXT:  Live-in vp<[[VTC:%.+]]> = vector-trip-count +; CHECK-NEXT:  vp<%3> = original trip-count  ; CHECK-EMPTY:  ; CHECK-NEXT:  ir-bb<entry>: -; CHECK-NEXT:    IR   %start2 = ptrtoint ptr %start to i64 -; CHECK-NEXT:    IR   %end1 = ptrtoint ptr %end to i64 -; CHECK-NEXT:    IR   %0 = add i64 %end1, 1 -; CHECK-NEXT:    IR   %1 = sub i64 %0, %start2 -; CHECK-NEXT:    EMIT vp<%min.iters.check> = icmp ult ir<%1>, ir<4> -; CHECK-NEXT:    EMIT branch-on-cond vp<%min.iters.check> -; CHECK-NEXT:  Successor(s): ir-bb<scalar.ph>, vector.ph +; CHECK-NEXT:    EMIT vp<%3> = EXPAND SCEV (1 + (-1 * (ptrtoint ptr %start to i64)) + (ptrtoint ptr %end to i64)) +; CHECK-NEXT:  Successor(s): scalar.ph, vector.ph  ; CHECK-EMPTY:  ; CHECK-NEXT:  vector.ph: -; CHECK-NEXT:    EMIT vp<%n.mod.vf> = urem ir<%1>, ir<4> -; CHECK-NEXT:    EMIT vp<%n.vec> = sub ir<%1>, vp<%n.mod.vf> -; CHECK-NEXT:    vp<%3> = DERIVED-IV ir<%start> + vp<%n.vec> * ir<1> -; CHECK-NEXT:  Successor(s): vector.body -; CHECK-EMPTY: -; CHECK-NEXT:  vector.body: -; CHECK-NEXT:    EMIT-SCALAR vp<%index> = phi [ ir<0>, vector.ph ], [ vp<%index.next>, vector.body ] -; CHECK-NEXT:    WIDEN-REDUCTION-PHI ir<%red> = phi ir<0>, ir<%red.next> -; CHECK-NEXT:    EMIT vp<%next.gep> = ptradd ir<%start>, vp<%index> -; CHECK-NEXT:    WIDEN ir<%l> = load vp<%next.gep> -; CHECK-NEXT:    WIDEN-CAST ir<%l.ext> = zext ir<%l> to i32 -; CHECK-NEXT:    WIDEN ir<%mul> = mul ir<%l.ext>, ir<63> -; CHECK-NEXT:    REDUCE ir<%red.next> = ir<%red> +  reduce.add (ir<%mul>) -; CHECK-NEXT:    EMIT vp<%index.next> = add nuw vp<%index>, ir<4> -; CHECK-NEXT:    EMIT branch-on-count vp<%index.next>, vp<%n.vec> -; CHECK-NEXT:  Successor(s): middle.block, vector.body +; CHECK-NEXT:    vp<[[DER_IV:%.+]]> = DERIVED-IV ir<%start> + vp<[[VTC]]> * ir<1> +; CHECK-NEXT:    EMIT vp<[[RDX_START:%.+]]> = reduction-start-vector ir<0>, ir<0>, ir<1> +; CHECK-NEXT:  Successor(s): vector loop +; CHECK-EMPTY: +; CHECK-NEXT:  <x1> vector loop: { +; CHECK-NEXT:    vector.body: +; CHECK-NEXT:      EMIT vp<[[CAN_IV:%.+]]> = CANONICAL-INDUCTION ir<0>, vp<[[IV_NEXT:%.+]]> +; CHECK-NEXT:      WIDEN-REDUCTION-PHI ir<[[RDX:%.+]]> = phi vp<[[RDX_START]]>, vp<[[RDX_NEXT:%.+]]> +; CHECK-NEXT:      vp<[[STEPS:%.+]]> = SCALAR-STEPS vp<[[CAN_IV]]>, ir<1>, vp<[[VF]]> +; CHECK-NEXT:      EMIT vp<%next.gep> = ptradd ir<%start>, vp<[[STEPS]]> +; CHECK-NEXT:      vp<[[VEC_PTR:%.+]]> = vector-pointer vp<%next.gep> +; CHECK-NEXT:      WIDEN ir<%l> = load vp<[[VEC_PTR]]> +; CHECK-NEXT:      WIDEN-CAST ir<%l.ext> = zext ir<%l> to i32 +; CHECK-NEXT:      EXPRESSION vp<[[RDX_NEXT]]> = ir<[[RDX]]> + reduce.add (mul ir<63>, ir<%l.ext>) +; CHECK-NEXT:      EMIT vp<[[IV_NEXT]]> = add nuw vp<[[CAN_IV]]>, vp<[[VFxUF]]> +; CHECK-NEXT:      EMIT branch-on-count vp<[[IV_NEXT]]>, vp<[[VTC]]> +; CHECK-NEXT:    No successors +; CHECK-NEXT:  } +; CHECK-NEXT:  Successor(s): middle.block  ; CHECK-EMPTY:  ; CHECK-NEXT:  middle.block: -; CHECK-NEXT:    EMIT vp<%5> = compute-reduction-result ir<%red>, ir<%red.next> -; CHECK-NEXT:    EMIT vp<%cmp.n> = icmp eq ir<%1>, vp<%n.vec> +; CHECK-NEXT:    EMIT vp<%11> = compute-reduction-result ir<[[RDX]]>, vp<[[RDX_NEXT]]> +; CHECK-NEXT:    EMIT vp<%cmp.n> = icmp eq vp<%3>, vp<[[VTC]]>  ; CHECK-NEXT:    EMIT branch-on-cond vp<%cmp.n> -; CHECK-NEXT:  Successor(s): ir-bb<exit>, ir-bb<scalar.ph> -; CHECK-EMPTY: -; CHECK-NEXT:  ir-bb<exit>: -; CHECK-NEXT:    IR   %red.next.lcssa = phi i32 [ %red.next, %loop ] (extra operand: vp<%5> from middle.block) -; CHECK-NEXT:  No successors -; CHECK-EMPTY: -; CHECK-NEXT:  ir-bb<scalar.ph>: -; CHECK-NEXT:    EMIT-SCALAR vp<%bc.resume.val> = phi [ vp<%3>, middle.block ], [ ir<%start>, ir-bb<entry> ] -; CHECK-NEXT:    EMIT-SCALAR vp<%bc.merge.rdx> = phi [ vp<%5>, middle.block ], [ ir<0>, ir-bb<entry> ] -; CHECK-NEXT:  Successor(s): ir-bb<loop> -; CHECK-EMPTY: -; CHECK-NEXT:  ir-bb<loop>: -; CHECK-NEXT:    IR   %ptr.iv = phi ptr [ %start, %scalar.ph ], [ %gep.iv.next, %loop ] (extra operand: vp<%bc.resume.val> from ir-bb<scalar.ph>) -; CHECK-NEXT:    IR   %red = phi i32 [ 0, %scalar.ph ], [ %red.next, %loop ] (extra operand: vp<%bc.merge.rdx> from ir-bb<scalar.ph>) -; CHECK-NEXT:    IR   %l = load i8, ptr %ptr.iv, align 1 -; CHECK-NEXT:    IR   %l.ext = zext i8 %l to i32 -; CHECK-NEXT:    IR   %mul = mul i32 %l.ext, 63 -; CHECK-NEXT:    IR   %red.next = add i32 %red, %mul -; CHECK-NEXT:    IR   %gep.iv.next = getelementptr i8, ptr %ptr.iv, i64 1 -; CHECK-NEXT:    IR   %ec = icmp eq ptr %ptr.iv, %end -; CHECK-NEXT:  No successors -; CHECK-NEXT:  }  entry:    br label %loop @@ -923,7 +900,7 @@ loop:    %red = phi i32 [ 0, %entry ], [ %red.next, %loop ]    %l = load i8, ptr %ptr.iv, align 1    %l.ext = zext i8 %l to i32 -  %mul = mul i32 %l.ext, 63 +  %mul = mul i32 63, %l.ext    %red.next = add i32 %red, %mul    %gep.iv.next = getelementptr i8, ptr %ptr.iv, i64 1    %ec = icmp eq ptr %ptr.iv, %end @@ -937,9 +914,9 @@ exit:  define i32 @print_mulacc_not_extended_const(ptr %start, ptr %end) {  ; CHECK-LABEL: 'print_mulacc_not_extended_const'  ; CHECK:       VPlan 'Initial VPlan for VF={4},UF>=1' { -; CHECK-NEXT:  Live-in vp<%0> = VF -; CHECK-NEXT:  Live-in vp<%1> = VF * UF -; CHECK-NEXT:  Live-in vp<%2> = vector-trip-count +; CHECK-NEXT:  Live-in vp<[[VF:%.+]]> = VF +; CHECK-NEXT:  Live-in vp<[[VFxUF:%.+]]> = VF * UF +; CHECK-NEXT:  Live-in vp<[[VTC:%.+]]> = vector-trip-count  ; CHECK-NEXT:  vp<%3> = original trip-count  ; CHECK-EMPTY:  ; CHECK-NEXT:  ir-bb<entry>: @@ -947,108 +924,30 @@ define i32 @print_mulacc_not_extended_const(ptr %start, ptr %end) {  ; CHECK-NEXT:  Successor(s): scalar.ph, vector.ph  ; CHECK-EMPTY:  ; CHECK-NEXT:  vector.ph: -; CHECK-NEXT:    vp<%4> = DERIVED-IV ir<%start> + vp<%2> * ir<1> -; CHECK-NEXT:    EMIT vp<%5> = reduction-start-vector ir<0>, ir<0>, ir<1> +; CHECK-NEXT:    vp<[[DER_IV:%.+]]> = DERIVED-IV ir<%start> + vp<[[VTC]]> * ir<1> +; CHECK-NEXT:    EMIT vp<[[RDX_START:%.+]]> = reduction-start-vector ir<0>, ir<0>, ir<1>  ; CHECK-NEXT:  Successor(s): vector loop  ; CHECK-EMPTY:  ; CHECK-NEXT:  <x1> vector loop: {  ; CHECK-NEXT:    vector.body: -; CHECK-NEXT:      EMIT vp<%6> = CANONICAL-INDUCTION ir<0>, vp<%index.next> -; CHECK-NEXT:      WIDEN-REDUCTION-PHI ir<%red> = phi vp<%5>, vp<%9> -; CHECK-NEXT:      vp<%7> = SCALAR-STEPS vp<%6>, ir<1>, vp<%0> -; CHECK-NEXT:      EMIT vp<%next.gep> = ptradd ir<%start>, vp<%7> -; CHECK-NEXT:      vp<%8> = vector-pointer vp<%next.gep> -; CHECK-NEXT:      WIDEN ir<%l> = load vp<%8> +; CHECK-NEXT:      EMIT vp<[[CAN_IV:%.+]]> = CANONICAL-INDUCTION ir<0>, vp<[[IV_NEXT:%.+]]> +; CHECK-NEXT:      WIDEN-REDUCTION-PHI ir<[[RDX:%.+]]> = phi vp<[[RDX_START]]>, vp<[[RDX_NEXT:%.+]]> +; CHECK-NEXT:      vp<[[STEPS:%.+]]> = SCALAR-STEPS vp<[[CAN_IV]]>, ir<1>, vp<[[VF]]> +; CHECK-NEXT:      EMIT vp<%next.gep> = ptradd ir<%start>, vp<[[STEPS]]> +; CHECK-NEXT:      vp<[[VEC_PTR:%.+]]> = vector-pointer vp<%next.gep> +; CHECK-NEXT:      WIDEN ir<%l> = load vp<[[VEC_PTR]]>  ; CHECK-NEXT:      WIDEN-CAST ir<%l.ext> = sext ir<%l> to i32 -; CHECK-NEXT:      EXPRESSION vp<%9> = ir<%red> + reduce.add (mul ir<%l.ext>, ir<128>) -; CHECK-NEXT:      EMIT vp<%index.next> = add nuw vp<%6>, vp<%1> -; CHECK-NEXT:      EMIT branch-on-count vp<%index.next>, vp<%2> +; CHECK-NEXT:      EXPRESSION vp<[[RDX_NEXT]]> = ir<[[RDX]]> + reduce.add (mul ir<%l.ext>, ir<128>) +; CHECK-NEXT:      EMIT vp<[[IV_NEXT]]> = add nuw vp<[[CAN_IV]]>, vp<[[VFxUF]]> +; CHECK-NEXT:      EMIT branch-on-count vp<[[IV_NEXT]]>, vp<[[VTC]]>  ; CHECK-NEXT:    No successors  ; CHECK-NEXT:  }  ; CHECK-NEXT:  Successor(s): middle.block  ; CHECK-EMPTY:  ; CHECK-NEXT:  middle.block: -; CHECK-NEXT:    EMIT vp<%11> = compute-reduction-result ir<%red>, vp<%9> -; CHECK-NEXT:    EMIT vp<%cmp.n> = icmp eq vp<%3>, vp<%2> +; CHECK-NEXT:    EMIT vp<%11> = compute-reduction-result ir<[[RDX:%.+]]>, vp<[[RDX_NEXT]]> +; CHECK-NEXT:    EMIT vp<%cmp.n> = icmp eq vp<%3>, vp<[[VTC]]>  ; CHECK-NEXT:    EMIT branch-on-cond vp<%cmp.n> -; CHECK-NEXT:  Successor(s): ir-bb<exit>, scalar.ph -; CHECK-EMPTY: -; CHECK-NEXT:  ir-bb<exit>: -; CHECK-NEXT:    IR   %red.next.lcssa = phi i32 [ %red.next, %loop ] (extra operand: vp<%11> from middle.block) -; CHECK-NEXT:  No successors -; CHECK-EMPTY: -; CHECK-NEXT:  scalar.ph: -; CHECK-NEXT:    EMIT-SCALAR vp<%bc.resume.val> = phi [ vp<%4>, middle.block ], [ ir<%start>, ir-bb<entry> ] -; CHECK-NEXT:    EMIT-SCALAR vp<%bc.merge.rdx> = phi [ vp<%11>, middle.block ], [ ir<0>, ir-bb<entry> ] -; CHECK-NEXT:  Successor(s): ir-bb<loop> -; CHECK-EMPTY: -; CHECK-NEXT:  ir-bb<loop>: -; CHECK-NEXT:    IR   %ptr.iv = phi ptr [ %start, %entry ], [ %gep.iv.next, %loop ] (extra operand: vp<%bc.resume.val> from scalar.ph) -; CHECK-NEXT:    IR   %red = phi i32 [ 0, %entry ], [ %red.next, %loop ] (extra operand: vp<%bc.merge.rdx> from scalar.ph) -; CHECK-NEXT:    IR   %l = load i8, ptr %ptr.iv, align 1 -; CHECK-NEXT:    IR   %l.ext = sext i8 %l to i32 -; CHECK-NEXT:    IR   %mul = mul i32 %l.ext, 128 -; CHECK-NEXT:    IR   %red.next = add i32 %red, %mul -; CHECK-NEXT:    IR   %gep.iv.next = getelementptr i8, ptr %ptr.iv, i64 1 -; CHECK-NEXT:    IR   %ec = icmp eq ptr %ptr.iv, %end -; CHECK-NEXT:  No successors -; CHECK-NEXT:  } -; CHECK:       VPlan 'Final VPlan for VF={4},UF={1}' { -; CHECK-NEXT:  Live-in ir<%1> = original trip-count -; CHECK-EMPTY: -; CHECK-NEXT:  ir-bb<entry>: -; CHECK-NEXT:    IR   %start2 = ptrtoint ptr %start to i64 -; CHECK-NEXT:    IR   %end1 = ptrtoint ptr %end to i64 -; CHECK-NEXT:    IR   %0 = add i64 %end1, 1 -; CHECK-NEXT:    IR   %1 = sub i64 %0, %start2 -; CHECK-NEXT:    EMIT vp<%min.iters.check> = icmp ult ir<%1>, ir<4> -; CHECK-NEXT:    EMIT branch-on-cond vp<%min.iters.check> -; CHECK-NEXT:  Successor(s): ir-bb<scalar.ph>, vector.ph -; CHECK-EMPTY: -; CHECK-NEXT:  vector.ph: -; CHECK-NEXT:    EMIT vp<%n.mod.vf> = urem ir<%1>, ir<4> -; CHECK-NEXT:    EMIT vp<%n.vec> = sub ir<%1>, vp<%n.mod.vf> -; CHECK-NEXT:    vp<%3> = DERIVED-IV ir<%start> + vp<%n.vec> * ir<1> -; CHECK-NEXT:  Successor(s): vector.body -; CHECK-EMPTY: -; CHECK-NEXT:  vector.body: -; CHECK-NEXT:    EMIT-SCALAR vp<%index> = phi [ ir<0>, vector.ph ], [ vp<%index.next>, vector.body ] -; CHECK-NEXT:    WIDEN-REDUCTION-PHI ir<%red> = phi ir<0>, ir<%red.next> -; CHECK-NEXT:    EMIT vp<%next.gep> = ptradd ir<%start>, vp<%index> -; CHECK-NEXT:    WIDEN ir<%l> = load vp<%next.gep> -; CHECK-NEXT:    WIDEN-CAST ir<%l.ext> = sext ir<%l> to i32 -; CHECK-NEXT:    WIDEN ir<%mul> = mul ir<%l.ext>, ir<128> -; CHECK-NEXT:    REDUCE ir<%red.next> = ir<%red> +  reduce.add (ir<%mul>) -; CHECK-NEXT:    EMIT vp<%index.next> = add nuw vp<%index>, ir<4> -; CHECK-NEXT:    EMIT branch-on-count vp<%index.next>, vp<%n.vec> -; CHECK-NEXT:  Successor(s): middle.block, vector.body -; CHECK-EMPTY: -; CHECK-NEXT:  middle.block: -; CHECK-NEXT:    EMIT vp<%5> = compute-reduction-result ir<%red>, ir<%red.next> -; CHECK-NEXT:    EMIT vp<%cmp.n> = icmp eq ir<%1>, vp<%n.vec> -; CHECK-NEXT:    EMIT branch-on-cond vp<%cmp.n> -; CHECK-NEXT:  Successor(s): ir-bb<exit>, ir-bb<scalar.ph> -; CHECK-EMPTY: -; CHECK-NEXT:  ir-bb<exit>: -; CHECK-NEXT:    IR   %red.next.lcssa = phi i32 [ %red.next, %loop ] (extra operand: vp<%5> from middle.block) -; CHECK-NEXT:  No successors -; CHECK-EMPTY: -; CHECK-NEXT:  ir-bb<scalar.ph>: -; CHECK-NEXT:    EMIT-SCALAR vp<%bc.resume.val> = phi [ vp<%3>, middle.block ], [ ir<%start>, ir-bb<entry> ] -; CHECK-NEXT:    EMIT-SCALAR vp<%bc.merge.rdx> = phi [ vp<%5>, middle.block ], [ ir<0>, ir-bb<entry> ] -; CHECK-NEXT:  Successor(s): ir-bb<loop> -; CHECK-EMPTY: -; CHECK-NEXT:  ir-bb<loop>: -; CHECK-NEXT:    IR   %ptr.iv = phi ptr [ %start, %scalar.ph ], [ %gep.iv.next, %loop ] (extra operand: vp<%bc.resume.val> from ir-bb<scalar.ph>) -; CHECK-NEXT:    IR   %red = phi i32 [ 0, %scalar.ph ], [ %red.next, %loop ] (extra operand: vp<%bc.merge.rdx> from ir-bb<scalar.ph>) -; CHECK-NEXT:    IR   %l = load i8, ptr %ptr.iv, align 1 -; CHECK-NEXT:    IR   %l.ext = sext i8 %l to i32 -; CHECK-NEXT:    IR   %mul = mul i32 %l.ext, 128 -; CHECK-NEXT:    IR   %red.next = add i32 %red, %mul -; CHECK-NEXT:    IR   %gep.iv.next = getelementptr i8, ptr %ptr.iv, i64 1 -; CHECK-NEXT:    IR   %ec = icmp eq ptr %ptr.iv, %end -; CHECK-NEXT:  No successors -; CHECK-NEXT:  }  entry:    br label %loop @@ -1071,9 +970,9 @@ exit:  define i64 @print_ext_mulacc_extended_const(ptr %start, ptr %end) {  ; CHECK-LABEL: 'print_ext_mulacc_extended_const'  ; CHECK:       VPlan 'Initial VPlan for VF={4},UF>=1' { -; CHECK-NEXT:  Live-in vp<%0> = VF -; CHECK-NEXT:  Live-in vp<%1> = VF * UF -; CHECK-NEXT:  Live-in vp<%2> = vector-trip-count +; CHECK-NEXT:  Live-in vp<[[VF:%.+]]> = VF +; CHECK-NEXT:  Live-in vp<[[VFxUF:%.+]]> = VF * UF +; CHECK-NEXT:  Live-in vp<[[VTC:%.+]]> = vector-trip-count  ; CHECK-NEXT:  vp<%3> = original trip-count  ; CHECK-EMPTY:  ; CHECK-NEXT:  ir-bb<entry>: @@ -1081,109 +980,29 @@ define i64 @print_ext_mulacc_extended_const(ptr %start, ptr %end) {  ; CHECK-NEXT:  Successor(s): scalar.ph, vector.ph  ; CHECK-EMPTY:  ; CHECK-NEXT:  vector.ph: -; CHECK-NEXT:    vp<%4> = DERIVED-IV ir<%start> + vp<%2> * ir<1> -; CHECK-NEXT:    EMIT vp<%5> = reduction-start-vector ir<0>, ir<0>, ir<1> +; CHECK-NEXT:    vp<[[DER_IV:%.+]]> = DERIVED-IV ir<%start> + vp<[[VTC]]> * ir<1> +; CHECK-NEXT:    EMIT vp<[[RDX_START:%.+]]> = reduction-start-vector ir<0>, ir<0>, ir<1>  ; CHECK-NEXT:  Successor(s): vector loop  ; CHECK-EMPTY:  ; CHECK-NEXT:  <x1> vector loop: {  ; CHECK-NEXT:    vector.body: -; CHECK-NEXT:      EMIT vp<%6> = CANONICAL-INDUCTION ir<0>, vp<%index.next> -; CHECK-NEXT:      WIDEN-REDUCTION-PHI ir<%red> = phi vp<%5>, vp<%9> -; CHECK-NEXT:      vp<%7> = SCALAR-STEPS vp<%6>, ir<1>, vp<%0> -; CHECK-NEXT:      EMIT vp<%next.gep> = ptradd ir<%start>, vp<%7> -; CHECK-NEXT:      vp<%8> = vector-pointer vp<%next.gep> -; CHECK-NEXT:      WIDEN ir<%l> = load vp<%8> -; CHECK-NEXT:      EXPRESSION vp<%9> = ir<%red> + reduce.add (mul (ir<%l> zext to i64), (ir<63> zext to i64)) -; CHECK-NEXT:      EMIT vp<%index.next> = add nuw vp<%6>, vp<%1> -; CHECK-NEXT:      EMIT branch-on-count vp<%index.next>, vp<%2> +; CHECK-NEXT:      EMIT vp<[[CAN_IV:%.+]]> = CANONICAL-INDUCTION ir<0>, vp<[[IV_NEXT:%.+]]> +; CHECK-NEXT:      WIDEN-REDUCTION-PHI ir<[[RDX:%.+]]> = phi vp<[[RDX_START]]>, vp<[[RDX_NEXT:%.+]]> +; CHECK-NEXT:      vp<[[STEPS:%.+]]> = SCALAR-STEPS vp<[[CAN_IV]]>, ir<1>, vp<[[VF]]> +; CHECK-NEXT:      EMIT vp<%next.gep> = ptradd ir<%start>, vp<[[STEPS]]> +; CHECK-NEXT:      vp<[[VEC_PTR:%.+]]> = vector-pointer vp<%next.gep> +; CHECK-NEXT:      WIDEN ir<%l> = load vp<[[VEC_PTR]]> +; CHECK-NEXT:      EXPRESSION vp<[[RDX_NEXT]]> = ir<[[RDX]]> + reduce.add (mul (ir<%l> zext to i64), (ir<63> zext to i64)) +; CHECK-NEXT:      EMIT vp<[[IV_NEXT]]> = add nuw vp<[[CAN_IV]]>, vp<[[VFxUF]]> +; CHECK-NEXT:      EMIT branch-on-count vp<[[IV_NEXT]]>, vp<[[VTC]]>  ; CHECK-NEXT:    No successors  ; CHECK-NEXT:  }  ; CHECK-NEXT:  Successor(s): middle.block  ; CHECK-EMPTY:  ; CHECK-NEXT:  middle.block: -; CHECK-NEXT:    EMIT vp<%11> = compute-reduction-result ir<%red>, vp<%9> -; CHECK-NEXT:    EMIT vp<%cmp.n> = icmp eq vp<%3>, vp<%2> +; CHECK-NEXT:    EMIT vp<%11> = compute-reduction-result ir<[[RDX]]>, vp<[[RDX_NEXT]]> +; CHECK-NEXT:    EMIT vp<%cmp.n> = icmp eq vp<%3>, vp<[[VTC]]>  ; CHECK-NEXT:    EMIT branch-on-cond vp<%cmp.n> -; CHECK-NEXT:  Successor(s): ir-bb<exit>, scalar.ph -; CHECK-EMPTY: -; CHECK-NEXT:  ir-bb<exit>: -; CHECK-NEXT:    IR   %red.next.lcssa = phi i64 [ %red.next, %loop ] (extra operand: vp<%11> from middle.block) -; CHECK-NEXT:  No successors -; CHECK-EMPTY: -; CHECK-NEXT:  scalar.ph: -; CHECK-NEXT:    EMIT-SCALAR vp<%bc.resume.val> = phi [ vp<%4>, middle.block ], [ ir<%start>, ir-bb<entry> ] -; CHECK-NEXT:    EMIT-SCALAR vp<%bc.merge.rdx> = phi [ vp<%11>, middle.block ], [ ir<0>, ir-bb<entry> ] -; CHECK-NEXT:  Successor(s): ir-bb<loop> -; CHECK-EMPTY: -; CHECK-NEXT:  ir-bb<loop>: -; CHECK-NEXT:    IR   %ptr.iv = phi ptr [ %start, %entry ], [ %gep.iv.next, %loop ] (extra operand: vp<%bc.resume.val> from scalar.ph) -; CHECK-NEXT:    IR   %red = phi i64 [ 0, %entry ], [ %red.next, %loop ] (extra operand: vp<%bc.merge.rdx> from scalar.ph) -; CHECK-NEXT:    IR   %l = load i8, ptr %ptr.iv, align 1 -; CHECK-NEXT:    IR   %l.ext = zext i8 %l to i32 -; CHECK-NEXT:    IR   %mul = mul i32 %l.ext, 63 -; CHECK-NEXT:    IR   %mul.ext = zext i32 %mul to i64 -; CHECK-NEXT:    IR   %red.next = add i64 %red, %mul.ext -; CHECK-NEXT:    IR   %gep.iv.next = getelementptr i8, ptr %ptr.iv, i64 1 -; CHECK-NEXT:    IR   %ec = icmp eq ptr %ptr.iv, %end -; CHECK-NEXT:  No successors -; CHECK-NEXT:  } -; CHECK:       VPlan 'Final VPlan for VF={4},UF={1}' { -; CHECK-NEXT:  Live-in ir<%1> = original trip-count -; CHECK-EMPTY: -; CHECK-NEXT:  ir-bb<entry>: -; CHECK-NEXT:    IR   %start2 = ptrtoint ptr %start to i64 -; CHECK-NEXT:    IR   %end1 = ptrtoint ptr %end to i64 -; CHECK-NEXT:    IR   %0 = add i64 %end1, 1 -; CHECK-NEXT:    IR   %1 = sub i64 %0, %start2 -; CHECK-NEXT:    EMIT vp<%min.iters.check> = icmp ult ir<%1>, ir<4> -; CHECK-NEXT:    EMIT branch-on-cond vp<%min.iters.check> -; CHECK-NEXT:  Successor(s): ir-bb<scalar.ph>, vector.ph -; CHECK-EMPTY: -; CHECK-NEXT:  vector.ph: -; CHECK-NEXT:    EMIT vp<%n.mod.vf> = urem ir<%1>, ir<4> -; CHECK-NEXT:    EMIT vp<%n.vec> = sub ir<%1>, vp<%n.mod.vf> -; CHECK-NEXT:    vp<%3> = DERIVED-IV ir<%start> + vp<%n.vec> * ir<1> -; CHECK-NEXT:  Successor(s): vector.body -; CHECK-EMPTY: -; CHECK-NEXT:  vector.body: -; CHECK-NEXT:    EMIT-SCALAR vp<%index> = phi [ ir<0>, vector.ph ], [ vp<%index.next>, vector.body ] -; CHECK-NEXT:    WIDEN-REDUCTION-PHI ir<%red> = phi ir<0>, ir<%red.next> -; CHECK-NEXT:    EMIT vp<%next.gep> = ptradd ir<%start>, vp<%index> -; CHECK-NEXT:    WIDEN ir<%l> = load vp<%next.gep> -; CHECK-NEXT:    WIDEN-CAST vp<%4> = zext ir<%l> to i64 -; CHECK-NEXT:    WIDEN ir<%mul> = mul vp<%4>, ir<63> -; CHECK-NEXT:    REDUCE ir<%red.next> = ir<%red> +  reduce.add (ir<%mul>) -; CHECK-NEXT:    EMIT vp<%index.next> = add nuw vp<%index>, ir<4> -; CHECK-NEXT:    EMIT branch-on-count vp<%index.next>, vp<%n.vec> -; CHECK-NEXT:  Successor(s): middle.block, vector.body -; CHECK-EMPTY: -; CHECK-NEXT:  middle.block: -; CHECK-NEXT:    EMIT vp<%6> = compute-reduction-result ir<%red>, ir<%red.next> -; CHECK-NEXT:    EMIT vp<%cmp.n> = icmp eq ir<%1>, vp<%n.vec> -; CHECK-NEXT:    EMIT branch-on-cond vp<%cmp.n> -; CHECK-NEXT:  Successor(s): ir-bb<exit>, ir-bb<scalar.ph> -; CHECK-EMPTY: -; CHECK-NEXT:  ir-bb<exit>: -; CHECK-NEXT:    IR   %red.next.lcssa = phi i64 [ %red.next, %loop ] (extra operand: vp<%6> from middle.block) -; CHECK-NEXT:  No successors -; CHECK-EMPTY: -; CHECK-NEXT:  ir-bb<scalar.ph>: -; CHECK-NEXT:    EMIT-SCALAR vp<%bc.resume.val> = phi [ vp<%3>, middle.block ], [ ir<%start>, ir-bb<entry> ] -; CHECK-NEXT:    EMIT-SCALAR vp<%bc.merge.rdx> = phi [ vp<%6>, middle.block ], [ ir<0>, ir-bb<entry> ] -; CHECK-NEXT:  Successor(s): ir-bb<loop> -; CHECK-EMPTY: -; CHECK-NEXT:  ir-bb<loop>: -; CHECK-NEXT:    IR   %ptr.iv = phi ptr [ %start, %scalar.ph ], [ %gep.iv.next, %loop ] (extra operand: vp<%bc.resume.val> from ir-bb<scalar.ph>) -; CHECK-NEXT:    IR   %red = phi i64 [ 0, %scalar.ph ], [ %red.next, %loop ] (extra operand: vp<%bc.merge.rdx> from ir-bb<scalar.ph>) -; CHECK-NEXT:    IR   %l = load i8, ptr %ptr.iv, align 1 -; CHECK-NEXT:    IR   %l.ext = zext i8 %l to i32 -; CHECK-NEXT:    IR   %mul = mul i32 %l.ext, 63 -; CHECK-NEXT:    IR   %mul.ext = zext i32 %mul to i64 -; CHECK-NEXT:    IR   %red.next = add i64 %red, %mul.ext -; CHECK-NEXT:    IR   %gep.iv.next = getelementptr i8, ptr %ptr.iv, i64 1 -; CHECK-NEXT:    IR   %ec = icmp eq ptr %ptr.iv, %end -; CHECK-NEXT:  No successors -; CHECK-NEXT:  }  entry:    br label %loop @@ -1207,9 +1026,9 @@ exit:  define i64 @print_ext_mulacc_not_extended_const(ptr %start, ptr %end) {  ; CHECK-LABEL: 'print_ext_mulacc_not_extended_const'  ; CHECK:       VPlan 'Initial VPlan for VF={4},UF>=1' { -; CHECK-NEXT:  Live-in vp<%0> = VF -; CHECK-NEXT:  Live-in vp<%1> = VF * UF -; CHECK-NEXT:  Live-in vp<%2> = vector-trip-count +; CHECK-NEXT:  Live-in vp<[[VF:%.+]]> = VF +; CHECK-NEXT:  Live-in vp<[[VFxUF:%.+]]> = VF * UF +; CHECK-NEXT:  Live-in vp<[[VTC:%.+]]> = vector-trip-count  ; CHECK-NEXT:  vp<%3> = original trip-count  ; CHECK-EMPTY:  ; CHECK-NEXT:  ir-bb<entry>: @@ -1217,112 +1036,31 @@ define i64 @print_ext_mulacc_not_extended_const(ptr %start, ptr %end) {  ; CHECK-NEXT:  Successor(s): scalar.ph, vector.ph  ; CHECK-EMPTY:  ; CHECK-NEXT:  vector.ph: -; CHECK-NEXT:    vp<%4> = DERIVED-IV ir<%start> + vp<%2> * ir<1> -; CHECK-NEXT:    EMIT vp<%5> = reduction-start-vector ir<0>, ir<0>, ir<1> +; CHECK-NEXT:    vp<[[DER_IV:%.+]]> = DERIVED-IV ir<%start> + vp<[[VTC]]> * ir<1> +; CHECK-NEXT:    EMIT vp<[[RDX_START:%.+]]> = reduction-start-vector ir<0>, ir<0>, ir<1>  ; CHECK-NEXT:  Successor(s): vector loop  ; CHECK-EMPTY:  ; CHECK-NEXT:  <x1> vector loop: {  ; CHECK-NEXT:    vector.body: -; CHECK-NEXT:      EMIT vp<%6> = CANONICAL-INDUCTION ir<0>, vp<%index.next> -; CHECK-NEXT:      WIDEN-REDUCTION-PHI ir<%red> = phi vp<%5>, vp<%9> -; CHECK-NEXT:      vp<%7> = SCALAR-STEPS vp<%6>, ir<1>, vp<%0> -; CHECK-NEXT:      EMIT vp<%next.gep> = ptradd ir<%start>, vp<%7> -; CHECK-NEXT:      vp<%8> = vector-pointer vp<%next.gep> -; CHECK-NEXT:      WIDEN ir<%l> = load vp<%8> +; CHECK-NEXT:      EMIT vp<[[CAN_IV:%.+]]> = CANONICAL-INDUCTION ir<0>, vp<[[IV_NEXT:%.+]]> +; CHECK-NEXT:      WIDEN-REDUCTION-PHI ir<[[RDX:%.+]]> = phi vp<[[RDX_START]]>, vp<[[RDX_NEXT:%.+]]> +; CHECK-NEXT:      vp<[[STEPS:%.+]]> = SCALAR-STEPS vp<[[CAN_IV]]>, ir<1>, vp<[[VF]]> +; CHECK-NEXT:      EMIT vp<%next.gep> = ptradd ir<%start>, vp<[[STEPS]]> +; CHECK-NEXT:      vp<[[VEC_PTR:%.+]]> = vector-pointer vp<%next.gep> +; CHECK-NEXT:      WIDEN ir<%l> = load vp<[[VEC_PTR]]>  ; CHECK-NEXT:      WIDEN-CAST ir<%l.ext> = sext ir<%l> to i32  ; CHECK-NEXT:      WIDEN ir<%mul> = mul ir<%l.ext>, ir<128> -; CHECK-NEXT:      EXPRESSION vp<%9> = ir<%red> + reduce.add (ir<%mul> sext to i64) -; CHECK-NEXT:      EMIT vp<%index.next> = add nuw vp<%6>, vp<%1> -; CHECK-NEXT:      EMIT branch-on-count vp<%index.next>, vp<%2> +; CHECK-NEXT:      EXPRESSION vp<[[RDX_NEXT]]> = ir<[[RDX]]> + reduce.add (ir<%mul> sext to i64) +; CHECK-NEXT:      EMIT vp<[[IV_NEXT]]> = add nuw vp<[[CAN_IV]]>, vp<[[VFxUF]]> +; CHECK-NEXT:      EMIT branch-on-count vp<[[IV_NEXT]]>, vp<[[VTC]]>  ; CHECK-NEXT:    No successors  ; CHECK-NEXT:  }  ; CHECK-NEXT:  Successor(s): middle.block  ; CHECK-EMPTY:  ; CHECK-NEXT:  middle.block: -; CHECK-NEXT:    EMIT vp<%11> = compute-reduction-result ir<%red>, vp<%9> -; CHECK-NEXT:    EMIT vp<%cmp.n> = icmp eq vp<%3>, vp<%2> -; CHECK-NEXT:    EMIT branch-on-cond vp<%cmp.n> -; CHECK-NEXT:  Successor(s): ir-bb<exit>, scalar.ph -; CHECK-EMPTY: -; CHECK-NEXT:  ir-bb<exit>: -; CHECK-NEXT:    IR   %red.next.lcssa = phi i64 [ %red.next, %loop ] (extra operand: vp<%11> from middle.block) -; CHECK-NEXT:  No successors -; CHECK-EMPTY: -; CHECK-NEXT:  scalar.ph: -; CHECK-NEXT:    EMIT-SCALAR vp<%bc.resume.val> = phi [ vp<%4>, middle.block ], [ ir<%start>, ir-bb<entry> ] -; CHECK-NEXT:    EMIT-SCALAR vp<%bc.merge.rdx> = phi [ vp<%11>, middle.block ], [ ir<0>, ir-bb<entry> ] -; CHECK-NEXT:  Successor(s): ir-bb<loop> -; CHECK-EMPTY: -; CHECK-NEXT:  ir-bb<loop>: -; CHECK-NEXT:    IR   %ptr.iv = phi ptr [ %start, %entry ], [ %gep.iv.next, %loop ] (extra operand: vp<%bc.resume.val> from scalar.ph) -; CHECK-NEXT:    IR   %red = phi i64 [ 0, %entry ], [ %red.next, %loop ] (extra operand: vp<%bc.merge.rdx> from scalar.ph) -; CHECK-NEXT:    IR   %l = load i8, ptr %ptr.iv, align 1 -; CHECK-NEXT:    IR   %l.ext = sext i8 %l to i32 -; CHECK-NEXT:    IR   %mul = mul i32 %l.ext, 128 -; CHECK-NEXT:    IR   %mul.ext = sext i32 %mul to i64 -; CHECK-NEXT:    IR   %red.next = add i64 %red, %mul.ext -; CHECK-NEXT:    IR   %gep.iv.next = getelementptr i8, ptr %ptr.iv, i64 1 -; CHECK-NEXT:    IR   %ec = icmp eq ptr %ptr.iv, %end -; CHECK-NEXT:  No successors -; CHECK-NEXT:  } -; CHECK:       VPlan 'Final VPlan for VF={4},UF={1}' { -; CHECK-NEXT:  Live-in ir<%1> = original trip-count -; CHECK-EMPTY: -; CHECK-NEXT:  ir-bb<entry>: -; CHECK-NEXT:    IR   %start2 = ptrtoint ptr %start to i64 -; CHECK-NEXT:    IR   %end1 = ptrtoint ptr %end to i64 -; CHECK-NEXT:    IR   %0 = add i64 %end1, 1 -; CHECK-NEXT:    IR   %1 = sub i64 %0, %start2 -; CHECK-NEXT:    EMIT vp<%min.iters.check> = icmp ult ir<%1>, ir<4> -; CHECK-NEXT:    EMIT branch-on-cond vp<%min.iters.check> -; CHECK-NEXT:  Successor(s): ir-bb<scalar.ph>, vector.ph -; CHECK-EMPTY: -; CHECK-NEXT:  vector.ph: -; CHECK-NEXT:    EMIT vp<%n.mod.vf> = urem ir<%1>, ir<4> -; CHECK-NEXT:    EMIT vp<%n.vec> = sub ir<%1>, vp<%n.mod.vf> -; CHECK-NEXT:    vp<%3> = DERIVED-IV ir<%start> + vp<%n.vec> * ir<1> -; CHECK-NEXT:  Successor(s): vector.body -; CHECK-EMPTY: -; CHECK-NEXT:  vector.body: -; CHECK-NEXT:    EMIT-SCALAR vp<%index> = phi [ ir<0>, vector.ph ], [ vp<%index.next>, vector.body ] -; CHECK-NEXT:    WIDEN-REDUCTION-PHI ir<%red> = phi ir<0>, ir<%red.next> -; CHECK-NEXT:    EMIT vp<%next.gep> = ptradd ir<%start>, vp<%index> -; CHECK-NEXT:    WIDEN ir<%l> = load vp<%next.gep> -; CHECK-NEXT:    WIDEN-CAST ir<%l.ext> = sext ir<%l> to i32 -; CHECK-NEXT:    WIDEN ir<%mul> = mul ir<%l.ext>, ir<128> -; CHECK-NEXT:    WIDEN-CAST ir<%mul.ext> = sext ir<%mul> to i64 -; CHECK-NEXT:    REDUCE ir<%red.next> = ir<%red> +  reduce.add (ir<%mul.ext>) -; CHECK-NEXT:    EMIT vp<%index.next> = add nuw vp<%index>, ir<4> -; CHECK-NEXT:    EMIT branch-on-count vp<%index.next>, vp<%n.vec> -; CHECK-NEXT:  Successor(s): middle.block, vector.body -; CHECK-EMPTY: -; CHECK-NEXT:  middle.block: -; CHECK-NEXT:    EMIT vp<%5> = compute-reduction-result ir<%red>, ir<%red.next> -; CHECK-NEXT:    EMIT vp<%cmp.n> = icmp eq ir<%1>, vp<%n.vec> +; CHECK-NEXT:    EMIT vp<%11> = compute-reduction-result ir<[[RDX]]>, vp<[[RDX_NEXT]]> +; CHECK-NEXT:    EMIT vp<%cmp.n> = icmp eq vp<%3>, vp<[[VTC]]>  ; CHECK-NEXT:    EMIT branch-on-cond vp<%cmp.n> -; CHECK-NEXT:  Successor(s): ir-bb<exit>, ir-bb<scalar.ph> -; CHECK-EMPTY: -; CHECK-NEXT:  ir-bb<exit>: -; CHECK-NEXT:    IR   %red.next.lcssa = phi i64 [ %red.next, %loop ] (extra operand: vp<%5> from middle.block) -; CHECK-NEXT:  No successors -; CHECK-EMPTY: -; CHECK-NEXT:  ir-bb<scalar.ph>: -; CHECK-NEXT:    EMIT-SCALAR vp<%bc.resume.val> = phi [ vp<%3>, middle.block ], [ ir<%start>, ir-bb<entry> ] -; CHECK-NEXT:    EMIT-SCALAR vp<%bc.merge.rdx> = phi [ vp<%5>, middle.block ], [ ir<0>, ir-bb<entry> ] -; CHECK-NEXT:  Successor(s): ir-bb<loop> -; CHECK-EMPTY: -; CHECK-NEXT:  ir-bb<loop>: -; CHECK-NEXT:    IR   %ptr.iv = phi ptr [ %start, %scalar.ph ], [ %gep.iv.next, %loop ] (extra operand: vp<%bc.resume.val> from ir-bb<scalar.ph>) -; CHECK-NEXT:    IR   %red = phi i64 [ 0, %scalar.ph ], [ %red.next, %loop ] (extra operand: vp<%bc.merge.rdx> from ir-bb<scalar.ph>) -; CHECK-NEXT:    IR   %l = load i8, ptr %ptr.iv, align 1 -; CHECK-NEXT:    IR   %l.ext = sext i8 %l to i32 -; CHECK-NEXT:    IR   %mul = mul i32 %l.ext, 128 -; CHECK-NEXT:    IR   %mul.ext = sext i32 %mul to i64 -; CHECK-NEXT:    IR   %red.next = add i64 %red, %mul.ext -; CHECK-NEXT:    IR   %gep.iv.next = getelementptr i8, ptr %ptr.iv, i64 1 -; CHECK-NEXT:    IR   %ec = icmp eq ptr %ptr.iv, %end -; CHECK-NEXT:  No successors -; CHECK-NEXT:  }  entry:    br label %loop diff --git a/llvm/test/Transforms/PGOProfile/memprof_diff_inline.ll b/llvm/test/Transforms/PGOProfile/memprof_diff_inline.ll new file mode 100644 index 0000000..5213a07 --- /dev/null +++ b/llvm/test/Transforms/PGOProfile/memprof_diff_inline.ll @@ -0,0 +1,118 @@ +;; Tests that the compiler ignores smaller contexts that differ only in the +;; IsInlineFrame bool. These map to the same full context id internally, as we +;; ignore the inline frame status which may differ in feedback compiles. +;; Presumably this happens when profiles collected from different binaries are +;; merged. If we didn't pick the largest we would default them all to noncold. + +;; Avoid failures on big-endian systems that can't read the profile properly +; REQUIRES: x86_64-linux + +;; Generate the profile and the IR. +; RUN: split-file %s %t + +;; Generate indexed profile +; RUN: llvm-profdata merge %t/memprof_diff_inline.yaml -o %t.memprofdata + +; RUN: opt < %t/memprof_diff_inline.ll -passes='memprof-use<profile-filename=%t.memprofdata>' -S -memprof-report-hinted-sizes -memprof-print-match-info 2>&1 | FileCheck %s --check-prefixes=MEMPROF + +; MEMPROF: MemProf notcold context with id 10194276560488437434 has total profiled size 200 is matched with 1 frames +; MEMPROF: MemProf cold context with id 16342802530253093571 has total profiled size 10000 is matched with 1 frames + +;--- memprof_diff_inline.yaml +--- +HeapProfileRecords: +  - GUID:            _Z3foov +    AllocSites: +      # Small non-cold, full context id 16342802530253093571, should ignore +      - Callstack: +          - { Function: _Z3foov, LineOffset: 1, Column: 10, IsInlineFrame: false } +          - { Function: _Z4foo2v, LineOffset: 1, Column: 10, IsInlineFrame: false } +          - { Function: _Z3barv, LineOffset: 1, Column: 10, IsInlineFrame: false } +          - { Function: main, LineOffset: 8, Column: 13, IsInlineFrame: false } +        MemInfoBlock: +          AllocCount:      1 +          TotalSize:       10 +          TotalLifetime:   0 +          TotalLifetimeAccessDensity: 20000 +      # Large cold, full context id 16342802530253093571, should keep +      - Callstack: +          - { Function: _Z3foov, LineOffset: 1, Column: 10, IsInlineFrame: false } +          - { Function: _Z4foo2v, LineOffset: 1, Column: 10, IsInlineFrame: true } +          - { Function: _Z3barv, LineOffset: 1, Column: 10, IsInlineFrame: false } +          - { Function: main, LineOffset: 8, Column: 13, IsInlineFrame: false } +        MemInfoBlock: +          AllocCount:      1 +          TotalSize:       10000 +          TotalLifetime:   200000 +          TotalLifetimeAccessDensity: 0 +      # Small non-cold, full context id 16342802530253093571, should ignore +      - Callstack: +          - { Function: _Z3foov, LineOffset: 1, Column: 10, IsInlineFrame: false } +          - { Function: _Z4foo2v, LineOffset: 1, Column: 10, IsInlineFrame: false } +          - { Function: _Z3barv, LineOffset: 1, Column: 10, IsInlineFrame: true } +          - { Function: main, LineOffset: 8, Column: 13, IsInlineFrame: false } +        MemInfoBlock: +          AllocCount:      1 +          TotalSize:       100 +          TotalLifetime:   0 +          TotalLifetimeAccessDensity: 20000 +      # Small non-cold, full context id 10194276560488437434 +      - Callstack: +          - { Function: _Z3foov, LineOffset: 1, Column: 10, IsInlineFrame: false } +          - { Function: _Z4foo2v, LineOffset: 1, Column: 10, IsInlineFrame: false } +          - { Function: _Z3barv, LineOffset: 1, Column: 10, IsInlineFrame: false } +          - { Function: main, LineOffset: 9, Column: 13, IsInlineFrame: false } +        MemInfoBlock: +          AllocCount:      1 +          TotalSize:       200 +          TotalLifetime:   0 +          TotalLifetimeAccessDensity: 20000 +    CallSites:       [] +... +;--- memprof_diff_inline.ll +; ModuleID = 'memprof_diff_inline.cc' +source_filename = "memprof_diff_inline.cc" +target datalayout = "e-m:e-p270:32:32-p271:32:32-p272:64:64-i64:64-f80:128-n8:16:32:64-S128" +target triple = "x86_64-unknown-linux-gnu" + +%"struct.std::nothrow_t" = type { i8 } + +@_ZSt7nothrow = external global %"struct.std::nothrow_t", align 1 + +define dso_local noundef ptr @_Z3foov() !dbg !10 { +entry: +  ; MEMPROF: call {{.*}} @_Znwm{{.*}} !memprof ![[M1:[0-9]+]], !callsite ![[C1:[0-9]+]] +  %call = call noalias noundef align 32 ptr @_Znwm(i64 noundef 32) #6, !dbg !13 +  ret ptr %call +} + +declare noundef ptr @_Znwm(i64 noundef) + +attributes #6 = { builtin allocsize(0) } + +; MEMPROF: ![[M1]] = !{![[MIB1:[0-9]+]], ![[MIB2:[0-9]+]]} + +; MEMPROF: ![[MIB1]] = !{![[STACK1:[0-9]+]], !"notcold", ![[CONTEXTSIZE1:[0-9]+]]} +; MEMPROF: ![[STACK1]] = !{i64 2732490490862098848, i64 8467819354083268568, i64 9086428284934609951, i64 2061451396820446691} +;; Full context id 10194276560488437434 == -8252467513221114182 +; MEMPROF: ![[CONTEXTSIZE1]] = !{i64 -8252467513221114182, i64 200} + +; MEMPROF: ![[MIB2]] = !{![[STACK2:[0-9]+]], !"cold", ![[CONTEXTSIZE2:[0-9]+]]} +; MEMPROF: ![[STACK2]] = !{i64 2732490490862098848, i64 8467819354083268568, i64 9086428284934609951, i64 -5747251260480066785} +;; Full context id 16342802530253093571 == -2103941543456458045 +;; We should have kept the large (cold) one. +; MEMPROF: ![[CONTEXTSIZE2]] = !{i64 -2103941543456458045, i64 10000} + +; MEMPROF: ![[C1]] = !{i64 2732490490862098848} + +!llvm.dbg.cu = !{!0} +!llvm.module.flags = !{!2, !3} + +!0 = distinct !DICompileUnit(language: DW_LANG_C_plus_plus_14, file: !1, producer: "clang version 15.0.0 (https://github.com/llvm/llvm-project.git 6cbe6284d1f0a088b5c6482ae27b738f03d82fe7)", isOptimized: false, runtimeVersion: 0, emissionKind: LineTablesOnly, splitDebugInlining: false, debugInfoForProfiling: true, nameTableKind: None) +!1 = !DIFile(filename: "memprof.cc", directory: "/usr/local/google/home/tejohnson/llvm/tmp", checksumkind: CSK_MD5, checksum: "e8c40ebe4b21776b4d60e9632cbc13c2") +!2 = !{i32 7, !"Dwarf Version", i32 5} +!3 = !{i32 2, !"Debug Info Version", i32 3} +!10 = distinct !DISubprogram(name: "foo", linkageName: "_Z3foov", scope: !1, file: !1, line: 4, type: !11, scopeLine: 4, flags: DIFlagPrototyped, spFlags: DISPFlagDefinition, unit: !0, retainedNodes: !12) +!11 = !DISubroutineType(types: !12) +!12 = !{} +!13 = !DILocation(line: 5, column: 10, scope: !10) diff --git a/llvm/test/Transforms/PGOProfile/memprof_loop_unroll.ll b/llvm/test/Transforms/PGOProfile/memprof_loop_unroll.ll index 2461ca3..ba53c57 100644 --- a/llvm/test/Transforms/PGOProfile/memprof_loop_unroll.ll +++ b/llvm/test/Transforms/PGOProfile/memprof_loop_unroll.ll @@ -4,24 +4,50 @@  ;; Avoid failures on big-endian systems that can't read the profile properly  ; REQUIRES: x86_64-linux -;; TODO: Use text profile inputs once that is available for memprof. -;; # To update the Inputs below, run Inputs/update_memprof_inputs.sh. -;; # To generate below LLVM IR for use in matching. -;; $ clang++ -gmlt -fdebug-info-for-profiling -S %S/Inputs/memprof_loop_unroll_b.cc -emit-llvm +; Generate the profile and the IR. +; RUN: split-file %s %t + +;; Generate indexed profile +; RUN: llvm-profdata merge %t/memprof_loop_unroll.yaml -o %t.memprofdata -; RUN: llvm-profdata merge %S/Inputs/memprof_loop_unroll.memprofraw --profiled-binary %S/Inputs/memprof_loop_unroll.exe -o %t.memprofdata  ;; Set the minimum lifetime threshold to 0 to ensure that one context is  ;; considered cold (the other will be notcold). -; RUN: opt < %s -passes='memprof-use<profile-filename=%t.memprofdata>' -S -memprof-report-hinted-sizes -memprof-ave-lifetime-cold-threshold=0 2>&1 | FileCheck %s +; RUN: opt < %t/memprof_loop_unroll.ll -passes='memprof-use<profile-filename=%t.memprofdata>' -S -memprof-report-hinted-sizes -memprof-ave-lifetime-cold-threshold=0 2>&1 | FileCheck %s -;; Conservatively annotate as not cold. We get two messages as there are two -;; unrolled copies of the allocation. -; CHECK: MemProf hinting: Total size for full allocation context hash {{.*}} and indistinguishable alloc type notcold: 4 -; CHECK: MemProf hinting: Total size for full allocation context hash {{.*}} and indistinguishable alloc type notcold: 4 +;; Conservatively annotate as not cold. +; CHECK: MemProf hinting: Total size for full allocation context hash {{.*}} and single alloc type notcold: 4  ; CHECK: call {{.*}} @_Znam{{.*}} #[[ATTR:[0-9]+]]  ; CHECK: attributes #[[ATTR]] = { builtin allocsize(0) "memprof"="notcold" }  ; CHECK-NOT: stackIds: () +;--- memprof_loop_unroll.yaml +--- +HeapProfileRecords: +  - GUID:            0x7f8d88fcc70a347b +    AllocSites: +      - Callstack: +          - { Function: 0x7f8d88fcc70a347b, LineOffset: 2, Column: 16, IsInlineFrame: false } +          - { Function: 0xdb956436e78dd5fa, LineOffset: 1, Column: 5, IsInlineFrame: false } +        MemInfoBlock: +          AllocCount:      1 +          TotalSize:       4 +          TotalLifetime:   2 +          TotalLifetimeAccessDensity: 12500000000 +      - Callstack: +          - { Function: 0x7f8d88fcc70a347b, LineOffset: 2, Column: 16, IsInlineFrame: false } +          - { Function: 0xdb956436e78dd5fa, LineOffset: 1, Column: 5, IsInlineFrame: false } +        MemInfoBlock: +          AllocCount:      1 +          TotalSize:       4 +          TotalLifetime:   2 +          TotalLifetimeAccessDensity: 0 +  - GUID:            0xdb956436e78dd5fa +    CallSites: +      - Frames: +          - { Function: 0xdb956436e78dd5fa, LineOffset: 1, Column: 5, IsInlineFrame: false } +... + +;--- memprof_loop_unroll.ll  ; ModuleID = 'memprof_loop_unroll_b.cc'  source_filename = "memprof_loop_unroll_b.cc"  target datalayout = "e-m:e-p270:32:32-p271:32:32-p272:64:64-i64:64-i128:128-f80:128-n8:16:32:64-S128" diff --git a/llvm/test/Transforms/SLPVectorizer/X86/alternate-opcode-strict-bitwidth-than-main.ll b/llvm/test/Transforms/SLPVectorizer/X86/alternate-opcode-strict-bitwidth-than-main.ll new file mode 100644 index 0000000..959b235 --- /dev/null +++ b/llvm/test/Transforms/SLPVectorizer/X86/alternate-opcode-strict-bitwidth-than-main.ll @@ -0,0 +1,36 @@ +; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 6 +; RUN: opt -passes=slp-vectorizer -S -slp-threshold=-99999 -mtriple=x86_64-unknown-linux-gnu < %s | FileCheck %s + +define float @test(i8 %0) { +; CHECK-LABEL: define float @test( +; CHECK-SAME: i8 [[TMP0:%.*]]) { +; CHECK-NEXT:  [[ENTRY:.*:]] +; CHECK-NEXT:    [[TMP1:%.*]] = insertelement <2 x i8> <i8 poison, i8 0>, i8 [[TMP0]], i32 0 +; CHECK-NEXT:    [[TMP2:%.*]] = sext <2 x i8> [[TMP1]] to <2 x i32> +; CHECK-NEXT:    [[TMP3:%.*]] = mul <2 x i32> [[TMP2]], <i32 2, i32 27> +; CHECK-NEXT:    [[TMP4:%.*]] = lshr <2 x i32> [[TMP2]], <i32 2, i32 27> +; CHECK-NEXT:    [[TMP5:%.*]] = shufflevector <2 x i32> [[TMP3]], <2 x i32> [[TMP4]], <2 x i32> <i32 0, i32 3> +; CHECK-NEXT:    [[TMP6:%.*]] = extractelement <2 x i32> [[TMP5]], i32 0 +; CHECK-NEXT:    [[TMP7:%.*]] = extractelement <2 x i32> [[TMP5]], i32 1 +; CHECK-NEXT:    [[TMP8:%.*]] = or i32 [[TMP6]], [[TMP7]] +; CHECK-NEXT:    switch i32 [[TMP8]], label %[[EXIT:.*]] [ +; CHECK-NEXT:      i32 0, label %[[EXIT]] +; CHECK-NEXT:      i32 1, label %[[EXIT]] +; CHECK-NEXT:    ] +; CHECK:       [[EXIT]]: +; CHECK-NEXT:    ret float 0.000000e+00 +; +entry: +  %1 = sext i8 0 to i32 +  %2 = lshr i32 %1, 27 +  %3 = sext i8 %0 to i32 +  %reass.add.epil = mul i32 %3, 2 +  %4 = or i32 %reass.add.epil, %2 +  switch i32 %4, label %exit [ +  i32 0, label %exit +  i32 1, label %exit +  ] + +exit: +  ret float 0.000000e+00 +} diff --git a/llvm/test/Transforms/SimplifyCFG/X86/switch-of-powers-of-two.ll b/llvm/test/Transforms/SimplifyCFG/X86/switch-of-powers-of-two.ll index aa95b3f..d818335 100644 --- a/llvm/test/Transforms/SimplifyCFG/X86/switch-of-powers-of-two.ll +++ b/llvm/test/Transforms/SimplifyCFG/X86/switch-of-powers-of-two.ll @@ -1,8 +1,13 @@ -; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 5 +; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --check-globals all --version 5  ; RUN: opt -passes='simplifycfg<switch-to-lookup>' -simplifycfg-require-and-preserve-domtree=1 -S < %s | FileCheck %s  target triple = "x86_64-unknown-linux-gnu" +;. +; CHECK: @switch.table.switch_of_powers_two = private unnamed_addr constant [7 x i32] [i32 3, i32 poison, i32 poison, i32 2, i32 1, i32 0, i32 42], align 4 +; CHECK: @switch.table.switch_of_powers_two_default_reachable = private unnamed_addr constant [7 x i32] [i32 3, i32 5, i32 5, i32 2, i32 1, i32 0, i32 42], align 4 +; CHECK: @switch.table.switch_of_powers_two_default_reachable_multipreds = private unnamed_addr constant [7 x i32] [i32 3, i32 poison, i32 poison, i32 2, i32 1, i32 0, i32 42], align 4 +;.  define i32 @switch_of_powers_two(i32 %arg) {  ; CHECK-LABEL: define i32 @switch_of_powers_two(  ; CHECK-SAME: i32 [[ARG:%.*]]) { @@ -35,17 +40,17 @@ return:    ret i32 %phi  } -define i32 @switch_of_powers_two_default_reachable(i32 %arg) { +define i32 @switch_of_powers_two_default_reachable(i32 %arg) !prof !0 {  ; CHECK-LABEL: define i32 @switch_of_powers_two_default_reachable( -; CHECK-SAME: i32 [[ARG:%.*]]) { +; CHECK-SAME: i32 [[ARG:%.*]]) !prof [[PROF0:![0-9]+]] {  ; CHECK-NEXT:  [[ENTRY:.*]]:  ; CHECK-NEXT:    [[TMP0:%.*]] = call i32 @llvm.ctpop.i32(i32 [[ARG]])  ; CHECK-NEXT:    [[TMP1:%.*]] = icmp eq i32 [[TMP0]], 1 -; CHECK-NEXT:    br i1 [[TMP1]], label %[[ENTRY_SPLIT:.*]], label %[[RETURN:.*]] +; CHECK-NEXT:    br i1 [[TMP1]], label %[[ENTRY_SPLIT:.*]], label %[[RETURN:.*]], !prof [[PROF1:![0-9]+]]  ; CHECK:       [[ENTRY_SPLIT]]:  ; CHECK-NEXT:    [[TMP2:%.*]] = call i32 @llvm.cttz.i32(i32 [[ARG]], i1 true)  ; CHECK-NEXT:    [[TMP3:%.*]] = icmp ult i32 [[TMP2]], 7 -; CHECK-NEXT:    br i1 [[TMP3]], label %[[SWITCH_LOOKUP:.*]], label %[[RETURN]] +; CHECK-NEXT:    br i1 [[TMP3]], label %[[SWITCH_LOOKUP:.*]], label %[[RETURN]], !prof [[PROF2:![0-9]+]]  ; CHECK:       [[SWITCH_LOOKUP]]:  ; CHECK-NEXT:    [[TMP4:%.*]] = zext nneg i32 [[TMP2]] to i64  ; CHECK-NEXT:    [[SWITCH_GEP:%.*]] = getelementptr inbounds [7 x i32], ptr @switch.table.switch_of_powers_two_default_reachable, i64 0, i64 [[TMP4]] @@ -62,7 +67,7 @@ entry:    i32 16, label %bb3    i32 32, label %bb4    i32 64, label %bb5 -  ] +  ], !prof !1  default_case: br label %return  bb1: br label %return @@ -128,3 +133,13 @@ return:    %phi = phi i32 [ 3, %bb1 ], [ 2, %bb2 ], [ 1, %bb3 ], [ 0, %bb4 ], [ 42, %bb5 ], [ %pn, %default_case ]    ret i32 %phi  } + +!0 = !{!"function_entry_count", i32 10} +!1 = !{!"branch_weights", i32 10, i32 5, i32 7, i32 11, i32 13, i32 17} +;. +; CHECK: attributes #[[ATTR0:[0-9]+]] = { nocallback nofree nosync nounwind speculatable willreturn memory(none) } +;. +; CHECK: [[PROF0]] = !{!"function_entry_count", i32 10} +; CHECK: [[PROF1]] = !{!"branch_weights", i32 58, i32 5} +; CHECK: [[PROF2]] = !{!"branch_weights", i32 56, i32 5} +;. diff --git a/llvm/test/Transforms/SimplifyCFG/pr165301.ll b/llvm/test/Transforms/SimplifyCFG/pr165301.ll new file mode 100644 index 0000000..4a539d7 --- /dev/null +++ b/llvm/test/Transforms/SimplifyCFG/pr165301.ll @@ -0,0 +1,26 @@ +; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 6 +; RUN: opt -S -passes="simplifycfg<switch-range-to-icmp>" < %s | FileCheck %s + +; Make sure there's no use after free when removing incoming values from PHI nodes + +define i32 @pr165301(i1 %cond) { +; CHECK-LABEL: define i32 @pr165301( +; CHECK-SAME: i1 [[COND:%.*]]) { +; CHECK-NEXT:  [[ENTRY:.*:]] +; CHECK-NEXT:    br label %[[SWITCHBB:.*]] +; CHECK:       [[SWITCHBB]]: +; CHECK-NEXT:    br label %[[SWITCHBB]] +; +entry: +  br label %switchbb + +switchbb: +  switch i1 %cond, label %default [ +  i1 false, label %switchbb +  i1 true, label %switchbb +  ] + +default: +  %phi.lcssa = phi i32 [ 0, %switchbb ] +  ret i32 %phi.lcssa +} diff --git a/llvm/test/Transforms/Util/PredicateInfo/branch-on-same-cond.ll b/llvm/test/Transforms/Util/PredicateInfo/branch-on-same-cond.ll index 0be13ee..f024106 100644 --- a/llvm/test/Transforms/Util/PredicateInfo/branch-on-same-cond.ll +++ b/llvm/test/Transforms/Util/PredicateInfo/branch-on-same-cond.ll @@ -1,4 +1,4 @@ -; NOTE: Assertions have been autogenerated by utils/update_test_checks.py +; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --check-inst-comments  ; RUN: opt -S -passes=print-predicateinfo < %s 2>&1 >/dev/null | FileCheck %s  ; FIXME:  RenamedOp should be %cmp or %x in all cases here, @@ -9,25 +9,25 @@ define i32 @test(i32 %x) {  ; CHECK-NEXT:    br label [[BB1:%.*]]  ; CHECK:       bb1:  ; CHECK-NEXT:    [[CMP:%.*]] = icmp eq i32 [[X:%.*]], 0 -; CHECK: RenamedOp: [[CMP]] -; CHECK:         [[CMP_0:%.*]] = bitcast i1 [[CMP]] to i1 -; CHECK: RenamedOp: [[X]] -; CHECK:         [[X_0:%.*]] = bitcast i32 [[X]] to i32 -; CHECK-NEXT:    br i1 [[CMP]], label [[BB2:%.*]], label [[EXIT1:%.*]] +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[CMP]] = icmp eq i32 [[X]], 0 Edge: [label [[BB1]],label [[BB2:%.*]]], RenamedOp: [[CMP]] } +; CHECK-NEXT:    [[CMP_0:%.*]] = bitcast i1 [[CMP]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[CMP]] = icmp eq i32 [[X]], 0 Edge: [label [[BB1]],label [[BB2]]], RenamedOp: [[X]] } +; CHECK-NEXT:    [[X_0:%.*]] = bitcast i32 [[X]] to i32 +; CHECK-NEXT:    br i1 [[CMP]], label [[BB2]], label [[EXIT1:%.*]]  ; CHECK:       bb2: -; CHECK: RenamedOp: [[CMP_0]] -; CHECK:         [[CMP_0_1:%.*]] = bitcast i1 [[CMP_0]] to i1 -; CHECK: RenamedOp: [[X]] -; CHECK:         [[X_0_1:%.*]] = bitcast i32 [[X_0]] to i32 -; CHECK: RenamedOp: [[X_0]] -; CHECK:         [[X_0_4:%.*]] = bitcast i32 [[X_0]] to i32 -; CHECK-NEXT:    br i1 [[CMP_0]], label [[BB3:%.*]], label [[EXIT2:%.*]] +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[CMP]] = icmp eq i32 [[X]], 0 Edge: [label [[BB2]],label [[BB3:%.*]]], RenamedOp: [[CMP_0]] } +; CHECK-NEXT:    [[CMP_0_1:%.*]] = bitcast i1 [[CMP_0]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[CMP]] = icmp eq i32 [[X]], 0 Edge: [label [[BB2]],label [[BB3]]], RenamedOp: [[X]] } +; CHECK-NEXT:    [[X_0_1:%.*]] = bitcast i32 [[X_0]] to i32 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[CMP]] = icmp eq i32 [[X]], 0 Edge: [label [[BB2]],label [[EXIT2:%.*]]], RenamedOp: [[X_0]] } +; CHECK-NEXT:    [[X_0_4:%.*]] = bitcast i32 [[X_0]] to i32 +; CHECK-NEXT:    br i1 [[CMP_0]], label [[BB3]], label [[EXIT2]]  ; CHECK:       bb3: -; CHECK: RenamedOp: [[X]] -; CHECK:         [[X_0_1_2:%.*]] = bitcast i32 [[X_0_1]] to i32 -; CHECK: RenamedOp: [[X_0_1]] -; CHECK:         [[X_0_1_3:%.*]] = bitcast i32 [[X_0_1]] to i32 -; CHECK-NEXT:    br i1 [[CMP_0_1]], label [[EXIT3:%.*]], label [[EXIT4:%.*]] +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[CMP]] = icmp eq i32 [[X]], 0 Edge: [label [[BB3]],label [[EXIT3:%.*]]], RenamedOp: [[X]] } +; CHECK-NEXT:    [[X_0_1_2:%.*]] = bitcast i32 [[X_0_1]] to i32 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[CMP]] = icmp eq i32 [[X]], 0 Edge: [label [[BB3]],label [[EXIT4:%.*]]], RenamedOp: [[X_0_1]] } +; CHECK-NEXT:    [[X_0_1_3:%.*]] = bitcast i32 [[X_0_1]] to i32 +; CHECK-NEXT:    br i1 [[CMP_0_1]], label [[EXIT3]], label [[EXIT4]]  ; CHECK:       exit1:  ; CHECK-NEXT:    ret i32 0  ; CHECK:       exit2: diff --git a/llvm/test/Transforms/Util/PredicateInfo/condprop.ll b/llvm/test/Transforms/Util/PredicateInfo/condprop.ll index 256d0d9..42e8ccb 100644 --- a/llvm/test/Transforms/Util/PredicateInfo/condprop.ll +++ b/llvm/test/Transforms/Util/PredicateInfo/condprop.ll @@ -1,4 +1,4 @@ -; NOTE: Assertions have been autogenerated by utils/update_test_checks.py +; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --check-inst-comments  ; RUN: opt -passes=print-predicateinfo -disable-output < %s 2>&1 | FileCheck %s  @a = external global i32		; <ptr> [#uses=7] @@ -98,12 +98,17 @@ define void @test3(i32 %x, i32 %y) {  ; CHECK-NEXT:    [[XZ:%.*]] = icmp eq i32 [[X:%.*]], 0  ; CHECK-NEXT:    [[YZ:%.*]] = icmp eq i32 [[Y:%.*]], 0  ; CHECK-NEXT:    [[Z:%.*]] = and i1 [[XZ]], [[YZ]] -; CHECK:         [[Z_0:%.*]] = bitcast i1 [[Z]] to i1 -; CHECK:         [[XZ_0:%.*]] = bitcast i1 [[XZ]] to i1 -; CHECK:         [[X_0:%.*]] = bitcast i32 [[X]] to i32 -; CHECK:         [[YZ_0:%.*]] = bitcast i1 [[YZ]] to i1 -; CHECK:         [[Y_0:%.*]] = bitcast i32 [[Y]] to i32 -; CHECK-NEXT:    br i1 [[Z]], label [[BOTH_ZERO:%.*]], label [[NOPE:%.*]] +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[Z]] = and i1 [[XZ]], [[YZ]] Edge: [label [[TMP0:%.*]],label [[NOPE:%.*]]], RenamedOp: [[Z]] } +; CHECK-NEXT:    [[Z_0:%.*]] = bitcast i1 [[Z]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[XZ]] = icmp eq i32 [[X]], 0 Edge: [label [[TMP0]],label [[BOTH_ZERO:%.*]]], RenamedOp: [[XZ]] } +; CHECK-NEXT:    [[XZ_0:%.*]] = bitcast i1 [[XZ]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[XZ]] = icmp eq i32 [[X]], 0 Edge: [label [[TMP0]],label [[BOTH_ZERO]]], RenamedOp: [[X]] } +; CHECK-NEXT:    [[X_0:%.*]] = bitcast i32 [[X]] to i32 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[YZ]] = icmp eq i32 [[Y]], 0 Edge: [label [[TMP0]],label [[BOTH_ZERO]]], RenamedOp: [[YZ]] } +; CHECK-NEXT:    [[YZ_0:%.*]] = bitcast i1 [[YZ]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[YZ]] = icmp eq i32 [[Y]], 0 Edge: [label [[TMP0]],label [[BOTH_ZERO]]], RenamedOp: [[Y]] } +; CHECK-NEXT:    [[Y_0:%.*]] = bitcast i32 [[Y]] to i32 +; CHECK-NEXT:    br i1 [[Z]], label [[BOTH_ZERO]], label [[NOPE]]  ; CHECK:       both_zero:  ; CHECK-NEXT:    call void @foo(i1 [[XZ_0]])  ; CHECK-NEXT:    call void @foo(i1 [[YZ_0]]) @@ -133,10 +138,11 @@ define void @test4(i1 %b, i32 %x) {  ; CHECK-LABEL: @test4(  ; CHECK-NEXT:    br i1 [[B:%.*]], label [[SW:%.*]], label [[CASE3:%.*]]  ; CHECK:       sw: -; CHECK:         [[X_0:%.*]] = bitcast i32 [[X:%.*]] to i32 +; CHECK-NEXT:  ; switch predicate info { CaseValue: i32 1 Edge: [label [[SW]],label [[CASE1:%.*]]], RenamedOp: [[X:%.*]] } +; CHECK-NEXT:    [[X_0:%.*]] = bitcast i32 [[X]] to i32  ; CHECK-NEXT:    switch i32 [[X]], label [[DEFAULT:%.*]] [  ; CHECK-NEXT:      i32 0, label [[CASE0:%.*]] -; CHECK-NEXT:      i32 1, label [[CASE1:%.*]] +; CHECK-NEXT:      i32 1, label [[CASE1]]  ; CHECK-NEXT:      i32 2, label [[CASE0]]  ; CHECK-NEXT:      i32 3, label [[CASE3]]  ; CHECK-NEXT:      i32 4, label [[DEFAULT]] @@ -180,11 +186,15 @@ case3:  define i1 @test5(i32 %x, i32 %y) {  ; CHECK-LABEL: @test5(  ; CHECK-NEXT:    [[CMP:%.*]] = icmp eq i32 [[X:%.*]], [[Y:%.*]] -; CHECK:         [[X_0:%.*]] = bitcast i32 [[X]] to i32 -; CHECK:         [[X_1:%.*]] = bitcast i32 [[X]] to i32 -; CHECK:         [[Y_0:%.*]] = bitcast i32 [[Y]] to i32 -; CHECK:         [[Y_1:%.*]] = bitcast i32 [[Y]] to i32 -; CHECK-NEXT:    br i1 [[CMP]], label [[SAME:%.*]], label [[DIFFERENT:%.*]] +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[CMP]] = icmp eq i32 [[X]], [[Y]] Edge: [label [[TMP0:%.*]],label [[SAME:%.*]]], RenamedOp: [[X]] } +; CHECK-NEXT:    [[X_0:%.*]] = bitcast i32 [[X]] to i32 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[CMP]] = icmp eq i32 [[X]], [[Y]] Edge: [label [[TMP0]],label [[DIFFERENT:%.*]]], RenamedOp: [[X]] } +; CHECK-NEXT:    [[X_1:%.*]] = bitcast i32 [[X]] to i32 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[CMP]] = icmp eq i32 [[X]], [[Y]] Edge: [label [[TMP0]],label [[SAME]]], RenamedOp: [[Y]] } +; CHECK-NEXT:    [[Y_0:%.*]] = bitcast i32 [[Y]] to i32 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[CMP]] = icmp eq i32 [[X]], [[Y]] Edge: [label [[TMP0]],label [[DIFFERENT]]], RenamedOp: [[Y]] } +; CHECK-NEXT:    [[Y_1:%.*]] = bitcast i32 [[Y]] to i32 +; CHECK-NEXT:    br i1 [[CMP]], label [[SAME]], label [[DIFFERENT]]  ; CHECK:       same:  ; CHECK-NEXT:    [[CMP2:%.*]] = icmp ne i32 [[X_0]], [[Y_0]]  ; CHECK-NEXT:    ret i1 [[CMP2]] @@ -253,11 +263,15 @@ different:  define i1 @test7(i32 %x, i32 %y) {  ; CHECK-LABEL: @test7(  ; CHECK-NEXT:    [[CMP:%.*]] = icmp sgt i32 [[X:%.*]], [[Y:%.*]] -; CHECK:         [[X_0:%.*]] = bitcast i32 [[X]] to i32 -; CHECK:         [[X_1:%.*]] = bitcast i32 [[X]] to i32 -; CHECK:         [[Y_0:%.*]] = bitcast i32 [[Y]] to i32 -; CHECK:         [[Y_1:%.*]] = bitcast i32 [[Y]] to i32 -; CHECK-NEXT:    br i1 [[CMP]], label [[SAME:%.*]], label [[DIFFERENT:%.*]] +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[CMP]] = icmp sgt i32 [[X]], [[Y]] Edge: [label [[TMP0:%.*]],label [[SAME:%.*]]], RenamedOp: [[X]] } +; CHECK-NEXT:    [[X_0:%.*]] = bitcast i32 [[X]] to i32 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[CMP]] = icmp sgt i32 [[X]], [[Y]] Edge: [label [[TMP0]],label [[DIFFERENT:%.*]]], RenamedOp: [[X]] } +; CHECK-NEXT:    [[X_1:%.*]] = bitcast i32 [[X]] to i32 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[CMP]] = icmp sgt i32 [[X]], [[Y]] Edge: [label [[TMP0]],label [[SAME]]], RenamedOp: [[Y]] } +; CHECK-NEXT:    [[Y_0:%.*]] = bitcast i32 [[Y]] to i32 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[CMP]] = icmp sgt i32 [[X]], [[Y]] Edge: [label [[TMP0]],label [[DIFFERENT]]], RenamedOp: [[Y]] } +; CHECK-NEXT:    [[Y_1:%.*]] = bitcast i32 [[Y]] to i32 +; CHECK-NEXT:    br i1 [[CMP]], label [[SAME]], label [[DIFFERENT]]  ; CHECK:       same:  ; CHECK-NEXT:    [[CMP2:%.*]] = icmp sle i32 [[X_0]], [[Y_0]]  ; CHECK-NEXT:    ret i1 [[CMP2]] @@ -280,11 +294,15 @@ different:  define i1 @test7_fp(float %x, float %y) {  ; CHECK-LABEL: @test7_fp(  ; CHECK-NEXT:    [[CMP:%.*]] = fcmp ogt float [[X:%.*]], [[Y:%.*]] -; CHECK:         [[X_0:%.*]] = bitcast float [[X]] to float -; CHECK:         [[X_1:%.*]] = bitcast float [[X]] to float -; CHECK:         [[Y_0:%.*]] = bitcast float [[Y]] to float -; CHECK:         [[Y_1:%.*]] = bitcast float [[Y]] to float -; CHECK-NEXT:    br i1 [[CMP]], label [[SAME:%.*]], label [[DIFFERENT:%.*]] +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[CMP]] = fcmp ogt float [[X]], [[Y]] Edge: [label [[TMP0:%.*]],label [[SAME:%.*]]], RenamedOp: [[X]] } +; CHECK-NEXT:    [[X_0:%.*]] = bitcast float [[X]] to float +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[CMP]] = fcmp ogt float [[X]], [[Y]] Edge: [label [[TMP0]],label [[DIFFERENT:%.*]]], RenamedOp: [[X]] } +; CHECK-NEXT:    [[X_1:%.*]] = bitcast float [[X]] to float +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[CMP]] = fcmp ogt float [[X]], [[Y]] Edge: [label [[TMP0]],label [[SAME]]], RenamedOp: [[Y]] } +; CHECK-NEXT:    [[Y_0:%.*]] = bitcast float [[Y]] to float +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[CMP]] = fcmp ogt float [[X]], [[Y]] Edge: [label [[TMP0]],label [[DIFFERENT]]], RenamedOp: [[Y]] } +; CHECK-NEXT:    [[Y_1:%.*]] = bitcast float [[Y]] to float +; CHECK-NEXT:    br i1 [[CMP]], label [[SAME]], label [[DIFFERENT]]  ; CHECK:       same:  ; CHECK-NEXT:    [[CMP2:%.*]] = fcmp ule float [[X_0]], [[Y_0]]  ; CHECK-NEXT:    ret i1 [[CMP2]] @@ -353,9 +371,11 @@ different:  define i32 @test9(i32 %i, i32 %j) {  ; CHECK-LABEL: @test9(  ; CHECK-NEXT:    [[CMP:%.*]] = icmp eq i32 [[I:%.*]], [[J:%.*]] -; CHECK:         [[I_0:%.*]] = bitcast i32 [[I]] to i32 -; CHECK:         [[J_0:%.*]] = bitcast i32 [[J]] to i32 -; CHECK-NEXT:    br i1 [[CMP]], label [[COND_TRUE:%.*]], label [[RET:%.*]] +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[CMP]] = icmp eq i32 [[I]], [[J]] Edge: [label [[TMP0:%.*]],label [[COND_TRUE:%.*]]], RenamedOp: [[I]] } +; CHECK-NEXT:    [[I_0:%.*]] = bitcast i32 [[I]] to i32 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[CMP]] = icmp eq i32 [[I]], [[J]] Edge: [label [[TMP0]],label [[COND_TRUE]]], RenamedOp: [[J]] } +; CHECK-NEXT:    [[J_0:%.*]] = bitcast i32 [[J]] to i32 +; CHECK-NEXT:    br i1 [[CMP]], label [[COND_TRUE]], label [[RET:%.*]]  ; CHECK:       cond_true:  ; CHECK-NEXT:    [[DIFF:%.*]] = sub i32 [[I_0]], [[J_0]]  ; CHECK-NEXT:    ret i32 [[DIFF]] @@ -376,9 +396,11 @@ ret:  define i32 @test10(i32 %j, i32 %i) {  ; CHECK-LABEL: @test10(  ; CHECK-NEXT:    [[CMP:%.*]] = icmp eq i32 [[I:%.*]], [[J:%.*]] -; CHECK:         [[I_0:%.*]] = bitcast i32 [[I]] to i32 -; CHECK:         [[J_0:%.*]] = bitcast i32 [[J]] to i32 -; CHECK-NEXT:    br i1 [[CMP]], label [[COND_TRUE:%.*]], label [[RET:%.*]] +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[CMP]] = icmp eq i32 [[I]], [[J]] Edge: [label [[TMP0:%.*]],label [[COND_TRUE:%.*]]], RenamedOp: [[I]] } +; CHECK-NEXT:    [[I_0:%.*]] = bitcast i32 [[I]] to i32 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[CMP]] = icmp eq i32 [[I]], [[J]] Edge: [label [[TMP0]],label [[COND_TRUE]]], RenamedOp: [[J]] } +; CHECK-NEXT:    [[J_0:%.*]] = bitcast i32 [[J]] to i32 +; CHECK-NEXT:    br i1 [[CMP]], label [[COND_TRUE]], label [[RET:%.*]]  ; CHECK:       cond_true:  ; CHECK-NEXT:    [[DIFF:%.*]] = sub i32 [[I_0]], [[J_0]]  ; CHECK-NEXT:    ret i32 [[DIFF]] @@ -403,15 +425,18 @@ define i32 @test11(i32 %x) {  ; CHECK-NEXT:    [[V0:%.*]] = call i32 @yogibar()  ; CHECK-NEXT:    [[V1:%.*]] = call i32 @yogibar()  ; CHECK-NEXT:    [[CMP:%.*]] = icmp eq i32 [[V0]], [[V1]] -; CHECK:         [[V0_0:%.*]] = bitcast i32 [[V0]] to i32 -; CHECK:         [[V1_0:%.*]] = bitcast i32 [[V1]] to i32 -; CHECK-NEXT:    br i1 [[CMP]], label [[COND_TRUE:%.*]], label [[NEXT:%.*]] +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[CMP]] = icmp eq i32 [[V0]], [[V1]] Edge: [label [[TMP0:%.*]],label [[NEXT:%.*]]], RenamedOp: [[V0]] } +; CHECK-NEXT:    [[V0_0:%.*]] = bitcast i32 [[V0]] to i32 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[CMP]] = icmp eq i32 [[V0]], [[V1]] Edge: [label [[TMP0]],label [[COND_TRUE:%.*]]], RenamedOp: [[V1]] } +; CHECK-NEXT:    [[V1_0:%.*]] = bitcast i32 [[V1]] to i32 +; CHECK-NEXT:    br i1 [[CMP]], label [[COND_TRUE]], label [[NEXT]]  ; CHECK:       cond_true:  ; CHECK-NEXT:    ret i32 [[V1_0]]  ; CHECK:       next:  ; CHECK-NEXT:    [[CMP2:%.*]] = icmp eq i32 [[X:%.*]], [[V0_0]] -; CHECK:         [[V0_0_1:%.*]] = bitcast i32 [[V0_0]] to i32 -; CHECK-NEXT:    br i1 [[CMP2]], label [[COND_TRUE2:%.*]], label [[NEXT2:%.*]] +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[CMP2]] = icmp eq i32 [[X]], [[V0_0]] Edge: [label [[NEXT]],label [[COND_TRUE2:%.*]]], RenamedOp: [[V0_0]] } +; CHECK-NEXT:    [[V0_0_1:%.*]] = bitcast i32 [[V0_0]] to i32 +; CHECK-NEXT:    br i1 [[CMP2]], label [[COND_TRUE2]], label [[NEXT2:%.*]]  ; CHECK:       cond_true2:  ; CHECK-NEXT:    ret i32 [[V0_0_1]]  ; CHECK:       next2: @@ -439,9 +464,11 @@ next2:  define i32 @test12(i32 %x) {  ; CHECK-LABEL: @test12(  ; CHECK-NEXT:    [[CMP:%.*]] = icmp eq i32 [[X:%.*]], 0 -; CHECK:         [[X_0:%.*]] = bitcast i32 [[X]] to i32 -; CHECK:         [[X_1:%.*]] = bitcast i32 [[X]] to i32 -; CHECK-NEXT:    br i1 [[CMP]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[CMP]] = icmp eq i32 [[X]], 0 Edge: [label [[TMP0:%.*]],label [[COND_TRUE:%.*]]], RenamedOp: [[X]] } +; CHECK-NEXT:    [[X_0:%.*]] = bitcast i32 [[X]] to i32 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[CMP]] = icmp eq i32 [[X]], 0 Edge: [label [[TMP0]],label [[COND_FALSE:%.*]]], RenamedOp: [[X]] } +; CHECK-NEXT:    [[X_1:%.*]] = bitcast i32 [[X]] to i32 +; CHECK-NEXT:    br i1 [[CMP]], label [[COND_TRUE]], label [[COND_FALSE]]  ; CHECK:       cond_true:  ; CHECK-NEXT:    br label [[RET:%.*]]  ; CHECK:       cond_false: diff --git a/llvm/test/Transforms/Util/PredicateInfo/diamond.ll b/llvm/test/Transforms/Util/PredicateInfo/diamond.ll index ac2c9a1..06c02d6 100644 --- a/llvm/test/Transforms/Util/PredicateInfo/diamond.ll +++ b/llvm/test/Transforms/Util/PredicateInfo/diamond.ll @@ -1,16 +1,18 @@ -; NOTE: Assertions have been autogenerated by utils/update_test_checks.py -; RUN: opt -passes=print-predicateinfo < %s 2>&1 | FileCheck %s +; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --check-inst-comments +; RUN: opt -passes=print-predicateinfo -disable-output < %s 2>&1 | FileCheck %s  define i1 @f(i32 %x, i1 %y) {  ; CHECK-LABEL: @f(  ; CHECK-NEXT:    br i1 [[Y:%.*]], label [[BB0:%.*]], label [[BB1:%.*]]  ; CHECK:       bb0:  ; CHECK-NEXT:    [[CMP:%.*]] = icmp sge i32 [[X:%.*]], 0 -; CHECK:         [[X_0:%.*]] = bitcast i32 [[X]] to i32 -; CHECK-NEXT:    br i1 [[CMP]], label [[BB2:%.*]], label [[BB3:%.*]] +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[CMP]] = icmp sge i32 [[X]], 0 Edge: [label [[BB0]],label [[BB2:%.*]]], RenamedOp: [[X]] } +; CHECK-NEXT:    [[X_0:%.*]] = bitcast i32 [[X]] to i32 +; CHECK-NEXT:    br i1 [[CMP]], label [[BB2]], label [[BB3:%.*]]  ; CHECK:       bb1:  ; CHECK-NEXT:    [[X2:%.*]] = add nuw nsw i32 [[X]], 1  ; CHECK-NEXT:    [[CMP2:%.*]] = icmp sge i32 [[X2]], 2 -; CHECK:         [[X2_0:%.*]] = bitcast i32 [[X2]] to i32 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[CMP2]] = icmp sge i32 [[X2]], 2 Edge: [label [[BB1]],label [[BB2]]], RenamedOp: [[X2]] } +; CHECK-NEXT:    [[X2_0:%.*]] = bitcast i32 [[X2]] to i32  ; CHECK-NEXT:    br i1 [[CMP2]], label [[BB2]], label [[BB3]]  ; CHECK:       bb2:  ; CHECK-NEXT:    [[X3:%.*]] = phi i32 [ [[X_0]], [[BB0]] ], [ [[X2_0]], [[BB1]] ] @@ -38,12 +40,14 @@ define i1 @g(i32 %x, i1 %y) {  ; CHECK-NEXT:    br i1 [[Y:%.*]], label [[BB0:%.*]], label [[BB1:%.*]]  ; CHECK:       bb0:  ; CHECK-NEXT:    [[CMP:%.*]] = icmp sge i32 [[X:%.*]], 0 -; CHECK:         [[X_0:%.*]] = bitcast i32 [[X]] to i32 -; CHECK-NEXT:    br i1 [[CMP]], label [[BB3:%.*]], label [[BB2:%.*]] +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[CMP]] = icmp sge i32 [[X]], 0 Edge: [label [[BB0]],label [[BB2:%.*]]], RenamedOp: [[X]] } +; CHECK-NEXT:    [[X_0:%.*]] = bitcast i32 [[X]] to i32 +; CHECK-NEXT:    br i1 [[CMP]], label [[BB3:%.*]], label [[BB2]]  ; CHECK:       bb1:  ; CHECK-NEXT:    [[X2:%.*]] = add nuw nsw i32 [[X]], 1  ; CHECK-NEXT:    [[CMP2:%.*]] = icmp sge i32 [[X2]], 2 -; CHECK:         [[X2_0:%.*]] = bitcast i32 [[X2]] to i32 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[CMP2]] = icmp sge i32 [[X2]], 2 Edge: [label [[BB1]],label [[BB2]]], RenamedOp: [[X2]] } +; CHECK-NEXT:    [[X2_0:%.*]] = bitcast i32 [[X2]] to i32  ; CHECK-NEXT:    br i1 [[CMP2]], label [[BB3]], label [[BB2]]  ; CHECK:       bb2:  ; CHECK-NEXT:    [[X3:%.*]] = phi i32 [ [[X_0]], [[BB0]] ], [ [[X2_0]], [[BB1]] ] diff --git a/llvm/test/Transforms/Util/PredicateInfo/edge.ll b/llvm/test/Transforms/Util/PredicateInfo/edge.ll index ef757f3..9138326 100644 --- a/llvm/test/Transforms/Util/PredicateInfo/edge.ll +++ b/llvm/test/Transforms/Util/PredicateInfo/edge.ll @@ -1,16 +1,17 @@ -; NOTE: Assertions have been autogenerated by utils/update_test_checks.py -; RUN: opt -passes=print-predicateinfo < %s 2>&1 | FileCheck %s +; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --check-inst-comments +; RUN: opt -passes=print-predicateinfo -disable-output < %s 2>&1 | FileCheck %s  define i32 @f1(i32 %x) {  ; CHECK-LABEL: @f1(  ; CHECK-NEXT:  bb0:  ; CHECK-NEXT:    [[CMP:%.*]] = icmp eq i32 [[X:%.*]], 0 -; CHECK:         [[X_0:%.*]] = bitcast i32 [[X]] to i32 -; CHECK-NEXT:    br i1 [[CMP]], label [[BB2:%.*]], label [[BB1:%.*]] +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[CMP]] = icmp eq i32 [[X]], 0 Edge: [label [[BB0:%.*]],label [[BB2:%.*]]], RenamedOp: [[X]] } +; CHECK-NEXT:    [[X_0:%.*]] = bitcast i32 [[X]] to i32 +; CHECK-NEXT:    br i1 [[CMP]], label [[BB2]], label [[BB1:%.*]]  ; CHECK:       bb1:  ; CHECK-NEXT:    br label [[BB2]]  ; CHECK:       bb2: -; CHECK-NEXT:    [[COND:%.*]] = phi i32 [ [[X_0]], [[BB0:%.*]] ], [ 0, [[BB1]] ] +; CHECK-NEXT:    [[COND:%.*]] = phi i32 [ [[X_0]], [[BB0]] ], [ 0, [[BB1]] ]  ; CHECK-NEXT:    [[FOO:%.*]] = add i32 [[COND]], [[X]]  ; CHECK-NEXT:    ret i32 [[FOO]]  ; @@ -29,12 +30,13 @@ define i32 @f2(i32 %x) {  ; CHECK-LABEL: @f2(  ; CHECK-NEXT:  bb0:  ; CHECK-NEXT:    [[CMP:%.*]] = icmp ne i32 [[X:%.*]], 0 -; CHECK:         [[X_0:%.*]] = bitcast i32 [[X]] to i32 -; CHECK-NEXT:    br i1 [[CMP]], label [[BB1:%.*]], label [[BB2:%.*]] +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[CMP]] = icmp ne i32 [[X]], 0 Edge: [label [[BB0:%.*]],label [[BB2:%.*]]], RenamedOp: [[X]] } +; CHECK-NEXT:    [[X_0:%.*]] = bitcast i32 [[X]] to i32 +; CHECK-NEXT:    br i1 [[CMP]], label [[BB1:%.*]], label [[BB2]]  ; CHECK:       bb1:  ; CHECK-NEXT:    br label [[BB2]]  ; CHECK:       bb2: -; CHECK-NEXT:    [[COND:%.*]] = phi i32 [ [[X_0]], [[BB0:%.*]] ], [ 0, [[BB1]] ] +; CHECK-NEXT:    [[COND:%.*]] = phi i32 [ [[X_0]], [[BB0]] ], [ 0, [[BB1]] ]  ; CHECK-NEXT:    [[FOO:%.*]] = add i32 [[COND]], [[X]]  ; CHECK-NEXT:    ret i32 [[FOO]]  ; @@ -52,14 +54,15 @@ bb2:  define i32 @f3(i32 %x) {  ; CHECK-LABEL: @f3(  ; CHECK-NEXT:  bb0: -; CHECK:         [[X_0:%.*]] = bitcast i32 [[X:%.*]] to i32 +; CHECK-NEXT:  ; switch predicate info { CaseValue: i32 0 Edge: [label [[BB0:%.*]],label [[BB2:%.*]]], RenamedOp: [[X:%.*]] } +; CHECK-NEXT:    [[X_0:%.*]] = bitcast i32 [[X]] to i32  ; CHECK-NEXT:    switch i32 [[X]], label [[BB1:%.*]] [ -; CHECK-NEXT:    i32 0, label [[BB2:%.*]] +; CHECK-NEXT:      i32 0, label [[BB2]]  ; CHECK-NEXT:    ]  ; CHECK:       bb1:  ; CHECK-NEXT:    br label [[BB2]]  ; CHECK:       bb2: -; CHECK-NEXT:    [[COND:%.*]] = phi i32 [ [[X_0]], [[BB0:%.*]] ], [ 0, [[BB1]] ] +; CHECK-NEXT:    [[COND:%.*]] = phi i32 [ [[X_0]], [[BB0]] ], [ 0, [[BB1]] ]  ; CHECK-NEXT:    [[FOO:%.*]] = add i32 [[COND]], [[X]]  ; CHECK-NEXT:    ret i32 [[FOO]]  ; @@ -78,13 +81,14 @@ define double @fcmp_oeq_not_zero(double %x, double %y) {  ; CHECK-LABEL: @fcmp_oeq_not_zero(  ; CHECK-NEXT:  entry:  ; CHECK-NEXT:    [[CMP:%.*]] = fcmp oeq double [[Y:%.*]], 2.000000e+00 -; CHECK:         [[Y_0:%.*]] = bitcast double [[Y]] to double -; CHECK-NEXT:    br i1 [[CMP]], label [[IF:%.*]], label [[RETURN:%.*]] +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[CMP]] = fcmp oeq double [[Y]], 2.000000e+00 Edge: [label [[ENTRY:%.*]],label [[IF:%.*]]], RenamedOp: [[Y]] } +; CHECK-NEXT:    [[Y_0:%.*]] = bitcast double [[Y]] to double +; CHECK-NEXT:    br i1 [[CMP]], label [[IF]], label [[RETURN:%.*]]  ; CHECK:       if:  ; CHECK-NEXT:    [[DIV:%.*]] = fdiv double [[X:%.*]], [[Y_0]]  ; CHECK-NEXT:    br label [[RETURN]]  ; CHECK:       return: -; CHECK-NEXT:    [[RETVAL:%.*]] = phi double [ [[DIV]], [[IF]] ], [ [[X]], [[ENTRY:%.*]] ] +; CHECK-NEXT:    [[RETVAL:%.*]] = phi double [ [[DIV]], [[IF]] ], [ [[X]], [[ENTRY]] ]  ; CHECK-NEXT:    ret double [[RETVAL]]  ;  entry: @@ -105,13 +109,14 @@ define double @fcmp_une_not_zero(double %x, double %y) {  ; CHECK-LABEL: @fcmp_une_not_zero(  ; CHECK-NEXT:  entry:  ; CHECK-NEXT:    [[CMP:%.*]] = fcmp une double [[Y:%.*]], 2.000000e+00 -; CHECK:         [[Y_0:%.*]] = bitcast double [[Y]] to double -; CHECK-NEXT:    br i1 [[CMP]], label [[RETURN:%.*]], label [[ELSE:%.*]] +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[CMP]] = fcmp une double [[Y]], 2.000000e+00 Edge: [label [[ENTRY:%.*]],label [[ELSE:%.*]]], RenamedOp: [[Y]] } +; CHECK-NEXT:    [[Y_0:%.*]] = bitcast double [[Y]] to double +; CHECK-NEXT:    br i1 [[CMP]], label [[RETURN:%.*]], label [[ELSE]]  ; CHECK:       else:  ; CHECK-NEXT:    [[DIV:%.*]] = fdiv double [[X:%.*]], [[Y_0]]  ; CHECK-NEXT:    br label [[RETURN]]  ; CHECK:       return: -; CHECK-NEXT:    [[RETVAL:%.*]] = phi double [ [[DIV]], [[ELSE]] ], [ [[X]], [[ENTRY:%.*]] ] +; CHECK-NEXT:    [[RETVAL:%.*]] = phi double [ [[DIV]], [[ELSE]] ], [ [[X]], [[ENTRY]] ]  ; CHECK-NEXT:    ret double [[RETVAL]]  ;  entry: @@ -132,13 +137,14 @@ define double @fcmp_oeq_zero(double %x, double %y) {  ; CHECK-LABEL: @fcmp_oeq_zero(  ; CHECK-NEXT:  entry:  ; CHECK-NEXT:    [[CMP:%.*]] = fcmp oeq double [[Y:%.*]], 0.000000e+00 -; CHECK:         [[Y_0:%.*]] = bitcast double [[Y]] to double -; CHECK-NEXT:    br i1 [[CMP]], label [[IF:%.*]], label [[RETURN:%.*]] +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[CMP]] = fcmp oeq double [[Y]], 0.000000e+00 Edge: [label [[ENTRY:%.*]],label [[IF:%.*]]], RenamedOp: [[Y]] } +; CHECK-NEXT:    [[Y_0:%.*]] = bitcast double [[Y]] to double +; CHECK-NEXT:    br i1 [[CMP]], label [[IF]], label [[RETURN:%.*]]  ; CHECK:       if:  ; CHECK-NEXT:    [[DIV:%.*]] = fdiv double [[X:%.*]], [[Y_0]]  ; CHECK-NEXT:    br label [[RETURN]]  ; CHECK:       return: -; CHECK-NEXT:    [[RETVAL:%.*]] = phi double [ [[DIV]], [[IF]] ], [ [[X]], [[ENTRY:%.*]] ] +; CHECK-NEXT:    [[RETVAL:%.*]] = phi double [ [[DIV]], [[IF]] ], [ [[X]], [[ENTRY]] ]  ; CHECK-NEXT:    ret double [[RETVAL]]  ;  entry: @@ -159,13 +165,14 @@ define double @fcmp_une_zero(double %x, double %y) {  ; CHECK-LABEL: @fcmp_une_zero(  ; CHECK-NEXT:  entry:  ; CHECK-NEXT:    [[CMP:%.*]] = fcmp une double [[Y:%.*]], -0.000000e+00 -; CHECK:         [[Y_0:%.*]] = bitcast double [[Y]] to double -; CHECK-NEXT:    br i1 [[CMP]], label [[RETURN:%.*]], label [[ELSE:%.*]] +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[CMP]] = fcmp une double [[Y]], -0.000000e+00 Edge: [label [[ENTRY:%.*]],label [[ELSE:%.*]]], RenamedOp: [[Y]] } +; CHECK-NEXT:    [[Y_0:%.*]] = bitcast double [[Y]] to double +; CHECK-NEXT:    br i1 [[CMP]], label [[RETURN:%.*]], label [[ELSE]]  ; CHECK:       else:  ; CHECK-NEXT:    [[DIV:%.*]] = fdiv double [[X:%.*]], [[Y_0]]  ; CHECK-NEXT:    br label [[RETURN]]  ; CHECK:       return: -; CHECK-NEXT:    [[RETVAL:%.*]] = phi double [ [[DIV]], [[ELSE]] ], [ [[X]], [[ENTRY:%.*]] ] +; CHECK-NEXT:    [[RETVAL:%.*]] = phi double [ [[DIV]], [[ELSE]] ], [ [[X]], [[ENTRY]] ]  ; CHECK-NEXT:    ret double [[RETVAL]]  ;  entry: @@ -188,13 +195,14 @@ define double @fcmp_oeq_maybe_zero(double %x, double %y, double %z1, double %z2)  ; CHECK-NEXT:  entry:  ; CHECK-NEXT:    [[Z:%.*]] = fadd double [[Z1:%.*]], [[Z2:%.*]]  ; CHECK-NEXT:    [[CMP:%.*]] = fcmp oeq double [[Y:%.*]], [[Z]] -; CHECK:         [[Z_0:%.*]] = bitcast double [[Z]] to double -; CHECK-NEXT:    br i1 [[CMP]], label [[IF:%.*]], label [[RETURN:%.*]] +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[CMP]] = fcmp oeq double [[Y]], [[Z]] Edge: [label [[ENTRY:%.*]],label [[IF:%.*]]], RenamedOp: [[Z]] } +; CHECK-NEXT:    [[Z_0:%.*]] = bitcast double [[Z]] to double +; CHECK-NEXT:    br i1 [[CMP]], label [[IF]], label [[RETURN:%.*]]  ; CHECK:       if:  ; CHECK-NEXT:    [[DIV:%.*]] = fdiv double [[X:%.*]], [[Z_0]]  ; CHECK-NEXT:    br label [[RETURN]]  ; CHECK:       return: -; CHECK-NEXT:    [[RETVAL:%.*]] = phi double [ [[DIV]], [[IF]] ], [ [[X]], [[ENTRY:%.*]] ] +; CHECK-NEXT:    [[RETVAL:%.*]] = phi double [ [[DIV]], [[IF]] ], [ [[X]], [[ENTRY]] ]  ; CHECK-NEXT:    ret double [[RETVAL]]  ;  entry: @@ -217,13 +225,14 @@ define double @fcmp_une_maybe_zero(double %x, double %y, double %z1, double %z2)  ; CHECK-NEXT:  entry:  ; CHECK-NEXT:    [[Z:%.*]] = fadd double [[Z1:%.*]], [[Z2:%.*]]  ; CHECK-NEXT:    [[CMP:%.*]] = fcmp une double [[Y:%.*]], [[Z]] -; CHECK:         [[Z_0:%.*]] = bitcast double [[Z]] to double -; CHECK-NEXT:    br i1 [[CMP]], label [[RETURN:%.*]], label [[ELSE:%.*]] +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[CMP]] = fcmp une double [[Y]], [[Z]] Edge: [label [[ENTRY:%.*]],label [[ELSE:%.*]]], RenamedOp: [[Z]] } +; CHECK-NEXT:    [[Z_0:%.*]] = bitcast double [[Z]] to double +; CHECK-NEXT:    br i1 [[CMP]], label [[RETURN:%.*]], label [[ELSE]]  ; CHECK:       else:  ; CHECK-NEXT:    [[DIV:%.*]] = fdiv double [[X:%.*]], [[Z_0]]  ; CHECK-NEXT:    br label [[RETURN]]  ; CHECK:       return: -; CHECK-NEXT:    [[RETVAL:%.*]] = phi double [ [[DIV]], [[ELSE]] ], [ [[X]], [[ENTRY:%.*]] ] +; CHECK-NEXT:    [[RETVAL:%.*]] = phi double [ [[DIV]], [[ELSE]] ], [ [[X]], [[ENTRY]] ]  ; CHECK-NEXT:    ret double [[RETVAL]]  ;  entry: diff --git a/llvm/test/Transforms/Util/PredicateInfo/pr33456.ll b/llvm/test/Transforms/Util/PredicateInfo/pr33456.ll index 36eaf6e..4762d37 100644 --- a/llvm/test/Transforms/Util/PredicateInfo/pr33456.ll +++ b/llvm/test/Transforms/Util/PredicateInfo/pr33456.ll @@ -1,5 +1,5 @@ -; NOTE: Assertions have been autogenerated by utils/update_test_checks.py -; RUN: opt -passes=print-predicateinfo < %s 2>&1 | FileCheck %s +; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --check-inst-comments +; RUN: opt -passes=print-predicateinfo -disable-output < %s 2>&1 | FileCheck %s  ; Don't insert predicate info for conditions with a single target.  @a = global i32 1, align 4  @d = common global i32 0, align 4 @@ -12,22 +12,27 @@ define i32 @main() {  ; CHECK-NEXT:    [[TMP1:%.*]] = load i32, ptr @d, align 4  ; CHECK-NEXT:    [[TMP2:%.*]] = icmp eq i32 [[TMP1]], 0  ; CHECK-NEXT:    br i1 [[TMP2]], label [[TMP3:%.*]], label [[TMP13:%.*]] -; CHECK:         [[TMP4:%.*]] = load i32, ptr @a, align 4 +; CHECK:       3: +; CHECK-NEXT:    [[TMP4:%.*]] = load i32, ptr @a, align 4  ; CHECK-NEXT:    [[TMP5:%.*]] = load i32, ptr @c, align 4  ; CHECK-NEXT:    [[TMP6:%.*]] = icmp slt i32 [[TMP5]], 1  ; CHECK-NEXT:    br i1 [[TMP6]], label [[TMP7:%.*]], label [[TMP9:%.*]] -; CHECK:         [[TMP8:%.*]] = icmp eq i32 [[TMP4]], 0 +; CHECK:       7: +; CHECK-NEXT:    [[TMP8:%.*]] = icmp eq i32 [[TMP4]], 0  ; CHECK-NEXT:    br i1 [[TMP8]], label [[TMP9]], label [[TMP9]] -; CHECK:         [[DOT0:%.*]] = phi i32 [ [[TMP4]], [[TMP7]] ], [ [[TMP4]], [[TMP7]] ], [ [[DOT1:%.*]], [[TMP13]] ], [ [[TMP4]], [[TMP3]] ] +; CHECK:       9: +; CHECK-NEXT:    [[DOT0:%.*]] = phi i32 [ [[TMP4]], [[TMP7]] ], [ [[TMP4]], [[TMP7]] ], [ [[DOT1:%.*]], [[TMP13]] ], [ [[TMP4]], [[TMP3]] ]  ; CHECK-NEXT:    [[TMP10:%.*]] = load i32, ptr @b, align 4  ; CHECK-NEXT:    [[TMP11:%.*]] = sdiv i32 [[TMP10]], [[DOT0]]  ; CHECK-NEXT:    [[TMP12:%.*]] = icmp eq i32 [[TMP11]], 0  ; CHECK-NEXT:    br i1 [[TMP12]], label [[TMP13]], label [[TMP13]] -; CHECK:         [[DOT1]] = phi i32 [ [[DOT0]], [[TMP9]] ], [ [[DOT0]], [[TMP9]] ], [ undef, [[TMP0:%.*]] ] +; CHECK:       13: +; CHECK-NEXT:    [[DOT1]] = phi i32 [ [[DOT0]], [[TMP9]] ], [ [[DOT0]], [[TMP9]] ], [ undef, [[TMP0:%.*]] ]  ; CHECK-NEXT:    [[TMP14:%.*]] = load i32, ptr @e, align 4  ; CHECK-NEXT:    [[TMP15:%.*]] = icmp eq i32 [[TMP14]], 0  ; CHECK-NEXT:    br i1 [[TMP15]], label [[TMP16:%.*]], label [[TMP9]] -; CHECK:         ret i32 0 +; CHECK:       16: +; CHECK-NEXT:    ret i32 0  ;    %1 = load i32, ptr @d, align 4    %2 = icmp eq i32 %1, 0 diff --git a/llvm/test/Transforms/Util/PredicateInfo/pr33457.ll b/llvm/test/Transforms/Util/PredicateInfo/pr33457.ll index bc1d39f..e4fd4cc 100644 --- a/llvm/test/Transforms/Util/PredicateInfo/pr33457.ll +++ b/llvm/test/Transforms/Util/PredicateInfo/pr33457.ll @@ -1,5 +1,5 @@ -; NOTE: Assertions have been autogenerated by utils/update_test_checks.py -; RUN: opt -passes=print-predicateinfo < %s 2>&1 | FileCheck %s +; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --check-inst-comments +; RUN: opt -passes=print-predicateinfo -disable-output < %s 2>&1 | FileCheck %s  ; Don't insert predicate info for conditions with a single target.  @a = global i32 6, align 4  @c = global i32 -1, align 4 @@ -13,26 +13,32 @@ define i32 @main() {  ; CHECK-LABEL: @main(  ; CHECK-NEXT:    store i32 6, ptr @e, align 4  ; CHECK-NEXT:    br label [[TMP1:%.*]] -; CHECK:         [[TMP2:%.*]] = load i32, ptr @d, align 4 +; CHECK:       1: +; CHECK-NEXT:    [[TMP2:%.*]] = load i32, ptr @d, align 4  ; CHECK-NEXT:    [[TMP3:%.*]] = sext i32 [[TMP2]] to i64  ; CHECK-NEXT:    [[TMP4:%.*]] = getelementptr inbounds [6 x i32], ptr @b, i64 0, i64 [[TMP3]]  ; CHECK-NEXT:    [[TMP5:%.*]] = load i32, ptr [[TMP4]], align 4  ; CHECK-NEXT:    [[TMP6:%.*]] = call i32 (ptr, ...) @printf(ptr @.str, i32 [[TMP5]])  ; CHECK-NEXT:    [[TMP7:%.*]] = load i32, ptr @a, align 4  ; CHECK-NEXT:    [[TMP8:%.*]] = icmp eq i32 [[TMP7]], 0 -; CHECK-NEXT:    br i1 [[TMP8]], label %thread-pre-split, label [[TMP9:%.*]] -; CHECK:         [[TMP10:%.*]] = load i32, ptr @e, align 4 +; CHECK-NEXT:    br i1 [[TMP8]], label [[THREAD_PRE_SPLIT:%.*]], label [[TMP9:%.*]] +; CHECK:       9: +; CHECK-NEXT:    [[TMP10:%.*]] = load i32, ptr @e, align 4  ; CHECK-NEXT:    [[TMP11:%.*]] = icmp eq i32 [[TMP10]], 0  ; CHECK-NEXT:    br i1 [[TMP11]], label [[TMP12:%.*]], label [[TMP12]]  ; CHECK:       thread-pre-split:  ; CHECK-NEXT:    [[DOTPR:%.*]] = load i32, ptr @e, align 4  ; CHECK-NEXT:    br label [[TMP12]] -; CHECK:         [[TMP13:%.*]] = phi i32 [ [[DOTPR]], %thread-pre-split ], [ [[TMP10]], [[TMP9]] ], [ [[TMP10]], [[TMP9]] ] +; CHECK:       12: +; CHECK-NEXT:    [[TMP13:%.*]] = phi i32 [ [[DOTPR]], [[THREAD_PRE_SPLIT]] ], [ [[TMP10]], [[TMP9]] ], [ [[TMP10]], [[TMP9]] ]  ; CHECK-NEXT:    [[TMP14:%.*]] = icmp ne i32 [[TMP13]], 0  ; CHECK-NEXT:    br i1 [[TMP14]], label [[TMP15:%.*]], label [[TMP15]] -; CHECK:         br i1 [[TMP14]], label [[TMP16:%.*]], label [[TMP17:%.*]] -; CHECK:         br label [[TMP17]] -; CHECK:         [[DOT0:%.*]] = phi i32 [ 1, [[TMP16]] ], [ -1, [[TMP15]] ] +; CHECK:       15: +; CHECK-NEXT:    br i1 [[TMP14]], label [[TMP16:%.*]], label [[TMP17:%.*]] +; CHECK:       16: +; CHECK-NEXT:    br label [[TMP17]] +; CHECK:       17: +; CHECK-NEXT:    [[DOT0:%.*]] = phi i32 [ 1, [[TMP16]] ], [ -1, [[TMP15]] ]  ; CHECK-NEXT:    [[TMP18:%.*]] = and i32 [[DOT0]], 8693  ; CHECK-NEXT:    [[TMP19:%.*]] = load i32, ptr @c, align 4  ; CHECK-NEXT:    [[TMP20:%.*]] = xor i32 [[TMP18]], [[TMP19]] @@ -40,7 +46,8 @@ define i32 @main() {  ; CHECK-NEXT:    store i32 [[TMP21]], ptr @d, align 4  ; CHECK-NEXT:    [[TMP22:%.*]] = icmp slt i32 [[TMP20]], -2  ; CHECK-NEXT:    br i1 [[TMP22]], label [[TMP1]], label [[TMP23:%.*]] -; CHECK:         ret i32 0 +; CHECK:       23: +; CHECK-NEXT:    ret i32 0  ;    store i32 6, ptr @e, align 4    br label %1 diff --git a/llvm/test/Transforms/Util/PredicateInfo/testandor.ll b/llvm/test/Transforms/Util/PredicateInfo/testandor.ll index cc1dc4e..d29aadd 100644 --- a/llvm/test/Transforms/Util/PredicateInfo/testandor.ll +++ b/llvm/test/Transforms/Util/PredicateInfo/testandor.ll @@ -1,4 +1,4 @@ -; NOTE: Assertions have been autogenerated by utils/update_test_checks.py +; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --check-inst-comments  ; RUN: opt -passes=print-predicateinfo -disable-output < %s 2>&1 | FileCheck %s  declare void @foo(i1) @@ -10,12 +10,17 @@ define void @test_or(i32 %x, i32 %y) {  ; CHECK-NEXT:    [[XZ:%.*]] = icmp eq i32 [[X:%.*]], 0  ; CHECK-NEXT:    [[YZ:%.*]] = icmp eq i32 [[Y:%.*]], 0  ; CHECK-NEXT:    [[Z:%.*]] = or i1 [[XZ]], [[YZ]] -; CHECK:         [[Z_0:%.*]] = bitcast i1 [[Z]] to i1 -; CHECK:         [[XZ_0:%.*]] = bitcast i1 [[XZ]] to i1 -; CHECK:         [[X_0:%.*]] = bitcast i32 [[X]] to i32 -; CHECK:         [[YZ_0:%.*]] = bitcast i1 [[YZ]] to i1 -; CHECK:         [[Y_0:%.*]] = bitcast i32 [[Y]] to i32 -; CHECK-NEXT:    br i1 [[Z]], label [[ONEOF:%.*]], label [[NEITHER:%.*]] +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[Z]] = or i1 [[XZ]], [[YZ]] Edge: [label [[TMP0:%.*]],label [[NEITHER:%.*]]], RenamedOp: [[Z]] } +; CHECK-NEXT:    [[Z_0:%.*]] = bitcast i1 [[Z]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[XZ]] = icmp eq i32 [[X]], 0 Edge: [label [[TMP0]],label [[NEITHER]]], RenamedOp: [[XZ]] } +; CHECK-NEXT:    [[XZ_0:%.*]] = bitcast i1 [[XZ]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[XZ]] = icmp eq i32 [[X]], 0 Edge: [label [[TMP0]],label [[NEITHER]]], RenamedOp: [[X]] } +; CHECK-NEXT:    [[X_0:%.*]] = bitcast i32 [[X]] to i32 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[YZ]] = icmp eq i32 [[Y]], 0 Edge: [label [[TMP0]],label [[NEITHER]]], RenamedOp: [[YZ]] } +; CHECK-NEXT:    [[YZ_0:%.*]] = bitcast i1 [[YZ]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[YZ]] = icmp eq i32 [[Y]], 0 Edge: [label [[TMP0]],label [[NEITHER]]], RenamedOp: [[Y]] } +; CHECK-NEXT:    [[Y_0:%.*]] = bitcast i32 [[Y]] to i32 +; CHECK-NEXT:    br i1 [[Z]], label [[ONEOF:%.*]], label [[NEITHER]]  ; CHECK:       oneof:  ; CHECK-NEXT:    call void @foo(i1 [[XZ]])  ; CHECK-NEXT:    call void @foo(i1 [[YZ]]) @@ -55,12 +60,17 @@ define void @test_or_logical(i32 %x, i32 %y) {  ; CHECK-NEXT:    [[XZ:%.*]] = icmp eq i32 [[X:%.*]], 0  ; CHECK-NEXT:    [[YZ:%.*]] = icmp eq i32 [[Y:%.*]], 0  ; CHECK-NEXT:    [[Z:%.*]] = select i1 [[XZ]], i1 true, i1 [[YZ]] -; CHECK:         [[Z_0:%.*]] = bitcast i1 [[Z]] to i1 -; CHECK:         [[XZ_0:%.*]] = bitcast i1 [[XZ]] to i1 -; CHECK:         [[X_0:%.*]] = bitcast i32 [[X]] to i32 -; CHECK:         [[YZ_0:%.*]] = bitcast i1 [[YZ]] to i1 -; CHECK:         [[Y_0:%.*]] = bitcast i32 [[Y]] to i32 -; CHECK-NEXT:    br i1 [[Z]], label [[ONEOF:%.*]], label [[NEITHER:%.*]] +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[Z]] = select i1 [[XZ]], i1 true, i1 [[YZ]] Edge: [label [[TMP0:%.*]],label [[NEITHER:%.*]]], RenamedOp: [[Z]] } +; CHECK-NEXT:    [[Z_0:%.*]] = bitcast i1 [[Z]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[XZ]] = icmp eq i32 [[X]], 0 Edge: [label [[TMP0]],label [[NEITHER]]], RenamedOp: [[XZ]] } +; CHECK-NEXT:    [[XZ_0:%.*]] = bitcast i1 [[XZ]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[XZ]] = icmp eq i32 [[X]], 0 Edge: [label [[TMP0]],label [[NEITHER]]], RenamedOp: [[X]] } +; CHECK-NEXT:    [[X_0:%.*]] = bitcast i32 [[X]] to i32 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[YZ]] = icmp eq i32 [[Y]], 0 Edge: [label [[TMP0]],label [[NEITHER]]], RenamedOp: [[YZ]] } +; CHECK-NEXT:    [[YZ_0:%.*]] = bitcast i1 [[YZ]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[YZ]] = icmp eq i32 [[Y]], 0 Edge: [label [[TMP0]],label [[NEITHER]]], RenamedOp: [[Y]] } +; CHECK-NEXT:    [[Y_0:%.*]] = bitcast i32 [[Y]] to i32 +; CHECK-NEXT:    br i1 [[Z]], label [[ONEOF:%.*]], label [[NEITHER]]  ; CHECK:       oneof:  ; CHECK-NEXT:    call void @foo(i1 [[XZ]])  ; CHECK-NEXT:    call void @foo(i1 [[YZ]]) @@ -100,12 +110,17 @@ define void @test_and(i32 %x, i32 %y) {  ; CHECK-NEXT:    [[XZ:%.*]] = icmp eq i32 [[X:%.*]], 0  ; CHECK-NEXT:    [[YZ:%.*]] = icmp eq i32 [[Y:%.*]], 0  ; CHECK-NEXT:    [[Z:%.*]] = and i1 [[XZ]], [[YZ]] -; CHECK:         [[Z_0:%.*]] = bitcast i1 [[Z]] to i1 -; CHECK:         [[XZ_0:%.*]] = bitcast i1 [[XZ]] to i1 -; CHECK:         [[X_0:%.*]] = bitcast i32 [[X]] to i32 -; CHECK:         [[YZ_0:%.*]] = bitcast i1 [[YZ]] to i1 -; CHECK:         [[Y_0:%.*]] = bitcast i32 [[Y]] to i32 -; CHECK-NEXT:    br i1 [[Z]], label [[BOTH:%.*]], label [[NOPE:%.*]] +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[Z]] = and i1 [[XZ]], [[YZ]] Edge: [label [[TMP0:%.*]],label [[NOPE:%.*]]], RenamedOp: [[Z]] } +; CHECK-NEXT:    [[Z_0:%.*]] = bitcast i1 [[Z]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[XZ]] = icmp eq i32 [[X]], 0 Edge: [label [[TMP0]],label [[BOTH:%.*]]], RenamedOp: [[XZ]] } +; CHECK-NEXT:    [[XZ_0:%.*]] = bitcast i1 [[XZ]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[XZ]] = icmp eq i32 [[X]], 0 Edge: [label [[TMP0]],label [[BOTH]]], RenamedOp: [[X]] } +; CHECK-NEXT:    [[X_0:%.*]] = bitcast i32 [[X]] to i32 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[YZ]] = icmp eq i32 [[Y]], 0 Edge: [label [[TMP0]],label [[BOTH]]], RenamedOp: [[YZ]] } +; CHECK-NEXT:    [[YZ_0:%.*]] = bitcast i1 [[YZ]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[YZ]] = icmp eq i32 [[Y]], 0 Edge: [label [[TMP0]],label [[BOTH]]], RenamedOp: [[Y]] } +; CHECK-NEXT:    [[Y_0:%.*]] = bitcast i32 [[Y]] to i32 +; CHECK-NEXT:    br i1 [[Z]], label [[BOTH]], label [[NOPE]]  ; CHECK:       both:  ; CHECK-NEXT:    call void @foo(i1 [[XZ_0]])  ; CHECK-NEXT:    call void @foo(i1 [[YZ_0]]) @@ -145,12 +160,17 @@ define void @test_and_logical(i32 %x, i32 %y) {  ; CHECK-NEXT:    [[XZ:%.*]] = icmp eq i32 [[X:%.*]], 0  ; CHECK-NEXT:    [[YZ:%.*]] = icmp eq i32 [[Y:%.*]], 0  ; CHECK-NEXT:    [[Z:%.*]] = select i1 [[XZ]], i1 [[YZ]], i1 false -; CHECK:         [[Z_0:%.*]] = bitcast i1 [[Z]] to i1 -; CHECK:         [[XZ_0:%.*]] = bitcast i1 [[XZ]] to i1 -; CHECK:         [[X_0:%.*]] = bitcast i32 [[X]] to i32 -; CHECK:         [[YZ_0:%.*]] = bitcast i1 [[YZ]] to i1 -; CHECK:         [[Y_0:%.*]] = bitcast i32 [[Y]] to i32 -; CHECK-NEXT:    br i1 [[Z]], label [[BOTH:%.*]], label [[NOPE:%.*]] +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[Z]] = select i1 [[XZ]], i1 [[YZ]], i1 false Edge: [label [[TMP0:%.*]],label [[NOPE:%.*]]], RenamedOp: [[Z]] } +; CHECK-NEXT:    [[Z_0:%.*]] = bitcast i1 [[Z]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[XZ]] = icmp eq i32 [[X]], 0 Edge: [label [[TMP0]],label [[BOTH:%.*]]], RenamedOp: [[XZ]] } +; CHECK-NEXT:    [[XZ_0:%.*]] = bitcast i1 [[XZ]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[XZ]] = icmp eq i32 [[X]], 0 Edge: [label [[TMP0]],label [[BOTH]]], RenamedOp: [[X]] } +; CHECK-NEXT:    [[X_0:%.*]] = bitcast i32 [[X]] to i32 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[YZ]] = icmp eq i32 [[Y]], 0 Edge: [label [[TMP0]],label [[BOTH]]], RenamedOp: [[YZ]] } +; CHECK-NEXT:    [[YZ_0:%.*]] = bitcast i1 [[YZ]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[YZ]] = icmp eq i32 [[Y]], 0 Edge: [label [[TMP0]],label [[BOTH]]], RenamedOp: [[Y]] } +; CHECK-NEXT:    [[Y_0:%.*]] = bitcast i32 [[Y]] to i32 +; CHECK-NEXT:    br i1 [[Z]], label [[BOTH]], label [[NOPE]]  ; CHECK:       both:  ; CHECK-NEXT:    call void @foo(i1 [[XZ_0]])  ; CHECK-NEXT:    call void @foo(i1 [[YZ_0]]) @@ -190,12 +210,17 @@ define void @testandsame(i32 %x, i32 %y) {  ; CHECK-NEXT:    [[XGT:%.*]] = icmp sgt i32 [[X:%.*]], 0  ; CHECK-NEXT:    [[XLT:%.*]] = icmp slt i32 [[X]], 100  ; CHECK-NEXT:    [[Z:%.*]] = and i1 [[XGT]], [[XLT]] -; CHECK:         [[Z_0:%.*]] = bitcast i1 [[Z]] to i1 -; CHECK:         [[XGT_0:%.*]] = bitcast i1 [[XGT]] to i1 -; CHECK:         [[X_0:%.*]] = bitcast i32 [[X]] to i32 -; CHECK:         [[X_0_1:%.*]] = bitcast i32 [[X_0]] to i32 -; CHECK:         [[XLT_0:%.*]] = bitcast i1 [[XLT]] to i1 -; CHECK-NEXT:    br i1 [[Z]], label [[BOTH:%.*]], label [[NOPE:%.*]] +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[Z]] = and i1 [[XGT]], [[XLT]] Edge: [label [[TMP0:%.*]],label [[NOPE:%.*]]], RenamedOp: [[Z]] } +; CHECK-NEXT:    [[Z_0:%.*]] = bitcast i1 [[Z]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[XGT]] = icmp sgt i32 [[X]], 0 Edge: [label [[TMP0]],label [[BOTH:%.*]]], RenamedOp: [[XGT]] } +; CHECK-NEXT:    [[XGT_0:%.*]] = bitcast i1 [[XGT]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[XGT]] = icmp sgt i32 [[X]], 0 Edge: [label [[TMP0]],label [[BOTH]]], RenamedOp: [[X]] } +; CHECK-NEXT:    [[X_0:%.*]] = bitcast i32 [[X]] to i32 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[XLT]] = icmp slt i32 [[X]], 100 Edge: [label [[TMP0]],label [[BOTH]]], RenamedOp: [[X]] } +; CHECK-NEXT:    [[X_0_1:%.*]] = bitcast i32 [[X_0]] to i32 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[XLT]] = icmp slt i32 [[X]], 100 Edge: [label [[TMP0]],label [[BOTH]]], RenamedOp: [[XLT]] } +; CHECK-NEXT:    [[XLT_0:%.*]] = bitcast i1 [[XLT]] to i1 +; CHECK-NEXT:    br i1 [[Z]], label [[BOTH]], label [[NOPE]]  ; CHECK:       both:  ; CHECK-NEXT:    call void @foo(i1 [[XGT_0]])  ; CHECK-NEXT:    call void @foo(i1 [[XLT_0]]) @@ -229,17 +254,27 @@ define void @testandassume(i32 %x, i32 %y) {  ; CHECK-NEXT:    [[YZ:%.*]] = icmp eq i32 [[Y:%.*]], 0  ; CHECK-NEXT:    [[Z:%.*]] = and i1 [[XZ]], [[YZ]]  ; CHECK-NEXT:    call void @llvm.assume(i1 [[Z]]) -; CHECK:         [[TMP1:%.*]] = bitcast i32 [[Y]] to i32 -; CHECK:         [[TMP2:%.*]] = bitcast i1 [[YZ]] to i1 -; CHECK:         [[TMP3:%.*]] = bitcast i32 [[X]] to i32 -; CHECK:         [[TMP4:%.*]] = bitcast i1 [[XZ]] to i1 -; CHECK:         [[TMP5:%.*]] = bitcast i1 [[Z]] to i1 -; CHECK:         [[DOT0:%.*]] = bitcast i1 [[TMP5]] to i1 -; CHECK:         [[DOT01:%.*]] = bitcast i1 [[TMP4]] to i1 -; CHECK:         [[DOT02:%.*]] = bitcast i32 [[TMP3]] to i32 -; CHECK:         [[DOT03:%.*]] = bitcast i1 [[TMP2]] to i1 -; CHECK:         [[DOT04:%.*]] = bitcast i32 [[TMP1]] to i32 -; CHECK-NEXT:    br i1 [[TMP5]], label [[BOTH:%.*]], label [[NOPE:%.*]] +; CHECK-NEXT:  ; assume predicate info { Comparison: [[YZ]] = icmp eq i32 [[Y]], 0, RenamedOp: [[Y]] } +; CHECK-NEXT:    [[TMP1:%.*]] = bitcast i32 [[Y]] to i32 +; CHECK-NEXT:  ; assume predicate info { Comparison: [[YZ]] = icmp eq i32 [[Y]], 0, RenamedOp: [[YZ]] } +; CHECK-NEXT:    [[TMP2:%.*]] = bitcast i1 [[YZ]] to i1 +; CHECK-NEXT:  ; assume predicate info { Comparison: [[XZ]] = icmp eq i32 [[X]], 0, RenamedOp: [[X]] } +; CHECK-NEXT:    [[TMP3:%.*]] = bitcast i32 [[X]] to i32 +; CHECK-NEXT:  ; assume predicate info { Comparison: [[XZ]] = icmp eq i32 [[X]], 0, RenamedOp: [[XZ]] } +; CHECK-NEXT:    [[TMP4:%.*]] = bitcast i1 [[XZ]] to i1 +; CHECK-NEXT:  ; assume predicate info { Comparison: [[Z]] = and i1 [[XZ]], [[YZ]], RenamedOp: [[Z]] } +; CHECK-NEXT:    [[TMP5:%.*]] = bitcast i1 [[Z]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[Z]] = and i1 [[XZ]], [[YZ]] Edge: [label [[TMP0:%.*]],label [[NOPE:%.*]]], RenamedOp: [[TMP5]] } +; CHECK-NEXT:    [[DOT0:%.*]] = bitcast i1 [[TMP5]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[XZ]] = icmp eq i32 [[X]], 0 Edge: [label [[TMP0]],label [[BOTH:%.*]]], RenamedOp: [[XZ]] } +; CHECK-NEXT:    [[DOT01:%.*]] = bitcast i1 [[TMP4]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[XZ]] = icmp eq i32 [[X]], 0 Edge: [label [[TMP0]],label [[BOTH]]], RenamedOp: [[X]] } +; CHECK-NEXT:    [[DOT02:%.*]] = bitcast i32 [[TMP3]] to i32 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[YZ]] = icmp eq i32 [[Y]], 0 Edge: [label [[TMP0]],label [[BOTH]]], RenamedOp: [[YZ]] } +; CHECK-NEXT:    [[DOT03:%.*]] = bitcast i1 [[TMP2]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[YZ]] = icmp eq i32 [[Y]], 0 Edge: [label [[TMP0]],label [[BOTH]]], RenamedOp: [[Y]] } +; CHECK-NEXT:    [[DOT04:%.*]] = bitcast i32 [[TMP1]] to i32 +; CHECK-NEXT:    br i1 [[TMP5]], label [[BOTH]], label [[NOPE]]  ; CHECK:       both:  ; CHECK-NEXT:    call void @foo(i1 [[DOT01]])  ; CHECK-NEXT:    call void @foo(i1 [[DOT03]]) @@ -274,9 +309,11 @@ define void @testorassume(i32 %x, i32 %y) {  ; CHECK-NEXT:    [[YZ:%.*]] = icmp eq i32 [[Y:%.*]], 0  ; CHECK-NEXT:    [[Z:%.*]] = or i1 [[XZ]], [[YZ]]  ; CHECK-NEXT:    call void @llvm.assume(i1 [[Z]]) -; CHECK:         [[TMP1:%.*]] = bitcast i1 [[Z]] to i1 -; CHECK:         [[DOT0:%.*]] = bitcast i1 [[TMP1]] to i1 -; CHECK-NEXT:    br i1 [[TMP1]], label [[BOTH:%.*]], label [[NOPE:%.*]] +; CHECK-NEXT:  ; assume predicate info { Comparison: [[Z]] = or i1 [[XZ]], [[YZ]], RenamedOp: [[Z]] } +; CHECK-NEXT:    [[TMP1:%.*]] = bitcast i1 [[Z]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[Z]] = or i1 [[XZ]], [[YZ]] Edge: [label [[TMP0:%.*]],label [[NOPE:%.*]]], RenamedOp: [[TMP1]] } +; CHECK-NEXT:    [[DOT0:%.*]] = bitcast i1 [[TMP1]] to i1 +; CHECK-NEXT:    br i1 [[TMP1]], label [[BOTH:%.*]], label [[NOPE]]  ; CHECK:       both:  ; CHECK-NEXT:    call void @foo(i1 [[XZ]])  ; CHECK-NEXT:    call void @foo(i1 [[YZ]]) @@ -307,12 +344,17 @@ define void @test_and_one_unknown_cond(i32 %x, i1 %c1) {  ; CHECK-LABEL: @test_and_one_unknown_cond(  ; CHECK-NEXT:    [[C2:%.*]] = icmp eq i32 [[X:%.*]], 0  ; CHECK-NEXT:    [[A:%.*]] = and i1 [[C1:%.*]], [[C2]] -; CHECK:         [[A_0:%.*]] = bitcast i1 [[A]] to i1 -; CHECK:         [[A_1:%.*]] = bitcast i1 [[A]] to i1 -; CHECK:         [[C1_0:%.*]] = bitcast i1 [[C1]] to i1 -; CHECK:         [[C2_0:%.*]] = bitcast i1 [[C2]] to i1 -; CHECK:         [[X_0:%.*]] = bitcast i32 [[X]] to i32 -; CHECK-NEXT:    br i1 [[A]], label [[BOTH:%.*]], label [[NOPE:%.*]] +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[A]] = and i1 [[C1]], [[C2]] Edge: [label [[TMP0:%.*]],label [[BOTH:%.*]]], RenamedOp: [[A]] } +; CHECK-NEXT:    [[A_0:%.*]] = bitcast i1 [[A]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[A]] = and i1 [[C1]], [[C2]] Edge: [label [[TMP0]],label [[NOPE:%.*]]], RenamedOp: [[A]] } +; CHECK-NEXT:    [[A_1:%.*]] = bitcast i1 [[A]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison:i1 [[C1]] Edge: [label [[TMP0]],label [[BOTH]]], RenamedOp: [[C1]] } +; CHECK-NEXT:    [[C1_0:%.*]] = bitcast i1 [[C1]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[C2]] = icmp eq i32 [[X]], 0 Edge: [label [[TMP0]],label [[BOTH]]], RenamedOp: [[C2]] } +; CHECK-NEXT:    [[C2_0:%.*]] = bitcast i1 [[C2]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[C2]] = icmp eq i32 [[X]], 0 Edge: [label [[TMP0]],label [[BOTH]]], RenamedOp: [[X]] } +; CHECK-NEXT:    [[X_0:%.*]] = bitcast i32 [[X]] to i32 +; CHECK-NEXT:    br i1 [[A]], label [[BOTH]], label [[NOPE]]  ; CHECK:       both:  ; CHECK-NEXT:    call void @bar(i32 [[X_0]])  ; CHECK-NEXT:    call void @foo(i1 [[C1_0]]) @@ -349,12 +391,17 @@ define void @test_or_one_unknown_cond(i32 %x, i1 %c1) {  ; CHECK-LABEL: @test_or_one_unknown_cond(  ; CHECK-NEXT:    [[C2:%.*]] = icmp eq i32 [[X:%.*]], 0  ; CHECK-NEXT:    [[A:%.*]] = or i1 [[C1:%.*]], [[C2]] -; CHECK:         [[A_0:%.*]] = bitcast i1 [[A]] to i1 -; CHECK:         [[A_1:%.*]] = bitcast i1 [[A]] to i1 -; CHECK:         [[C1_0:%.*]] = bitcast i1 [[C1]] to i1 -; CHECK:         [[C2_0:%.*]] = bitcast i1 [[C2]] to i1 -; CHECK:         [[X_0:%.*]] = bitcast i32 [[X]] to i32 -; CHECK-NEXT:    br i1 [[A]], label [[NOPE:%.*]], label [[BOTH_INVERTED:%.*]] +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[A]] = or i1 [[C1]], [[C2]] Edge: [label [[TMP0:%.*]],label [[NOPE:%.*]]], RenamedOp: [[A]] } +; CHECK-NEXT:    [[A_0:%.*]] = bitcast i1 [[A]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[A]] = or i1 [[C1]], [[C2]] Edge: [label [[TMP0]],label [[BOTH_INVERTED:%.*]]], RenamedOp: [[A]] } +; CHECK-NEXT:    [[A_1:%.*]] = bitcast i1 [[A]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison:i1 [[C1]] Edge: [label [[TMP0]],label [[BOTH_INVERTED]]], RenamedOp: [[C1]] } +; CHECK-NEXT:    [[C1_0:%.*]] = bitcast i1 [[C1]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[C2]] = icmp eq i32 [[X]], 0 Edge: [label [[TMP0]],label [[BOTH_INVERTED]]], RenamedOp: [[C2]] } +; CHECK-NEXT:    [[C2_0:%.*]] = bitcast i1 [[C2]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[C2]] = icmp eq i32 [[X]], 0 Edge: [label [[TMP0]],label [[BOTH_INVERTED]]], RenamedOp: [[X]] } +; CHECK-NEXT:    [[X_0:%.*]] = bitcast i32 [[X]] to i32 +; CHECK-NEXT:    br i1 [[A]], label [[NOPE]], label [[BOTH_INVERTED]]  ; CHECK:       both_inverted:  ; CHECK-NEXT:    call void @bar(i32 [[X_0]])  ; CHECK-NEXT:    call void @foo(i1 [[C1_0]]) @@ -391,13 +438,19 @@ define void @test_and_chain(i1 %a, i1 %b, i1 %c) {  ; CHECK-LABEL: @test_and_chain(  ; CHECK-NEXT:    [[AND1:%.*]] = and i1 [[A:%.*]], [[B:%.*]]  ; CHECK-NEXT:    [[AND2:%.*]] = and i1 [[AND1]], [[C:%.*]] -; CHECK:         [[AND2_0:%.*]] = bitcast i1 [[AND2]] to i1 -; CHECK:         [[AND2_1:%.*]] = bitcast i1 [[AND2]] to i1 -; CHECK:         [[AND1_0:%.*]] = bitcast i1 [[AND1]] to i1 -; CHECK:         [[A_0:%.*]] = bitcast i1 [[A]] to i1 -; CHECK:         [[B_0:%.*]] = bitcast i1 [[B]] to i1 -; CHECK:         [[C_0:%.*]] = bitcast i1 [[C]] to i1 -; CHECK-NEXT:    br i1 [[AND2]], label [[IF:%.*]], label [[ELSE:%.*]] +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[AND2]] = and i1 [[AND1]], [[C]] Edge: [label [[TMP0:%.*]],label [[IF:%.*]]], RenamedOp: [[AND2]] } +; CHECK-NEXT:    [[AND2_0:%.*]] = bitcast i1 [[AND2]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[AND2]] = and i1 [[AND1]], [[C]] Edge: [label [[TMP0]],label [[ELSE:%.*]]], RenamedOp: [[AND2]] } +; CHECK-NEXT:    [[AND2_1:%.*]] = bitcast i1 [[AND2]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[AND1]] = and i1 [[A]], [[B]] Edge: [label [[TMP0]],label [[IF]]], RenamedOp: [[AND1]] } +; CHECK-NEXT:    [[AND1_0:%.*]] = bitcast i1 [[AND1]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison:i1 [[A]] Edge: [label [[TMP0]],label [[IF]]], RenamedOp: [[A]] } +; CHECK-NEXT:    [[A_0:%.*]] = bitcast i1 [[A]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison:i1 [[B]] Edge: [label [[TMP0]],label [[IF]]], RenamedOp: [[B]] } +; CHECK-NEXT:    [[B_0:%.*]] = bitcast i1 [[B]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison:i1 [[C]] Edge: [label [[TMP0]],label [[IF]]], RenamedOp: [[C]] } +; CHECK-NEXT:    [[C_0:%.*]] = bitcast i1 [[C]] to i1 +; CHECK-NEXT:    br i1 [[AND2]], label [[IF]], label [[ELSE]]  ; CHECK:       if:  ; CHECK-NEXT:    call void @foo(i1 [[A_0]])  ; CHECK-NEXT:    call void @foo(i1 [[B_0]]) @@ -438,13 +491,19 @@ define void @test_or_chain(i1 %a, i1 %b, i1 %c) {  ; CHECK-LABEL: @test_or_chain(  ; CHECK-NEXT:    [[OR1:%.*]] = or i1 [[A:%.*]], [[B:%.*]]  ; CHECK-NEXT:    [[OR2:%.*]] = or i1 [[OR1]], [[C:%.*]] -; CHECK:         [[OR2_0:%.*]] = bitcast i1 [[OR2]] to i1 -; CHECK:         [[OR2_1:%.*]] = bitcast i1 [[OR2]] to i1 -; CHECK:         [[OR1_0:%.*]] = bitcast i1 [[OR1]] to i1 -; CHECK:         [[A_0:%.*]] = bitcast i1 [[A]] to i1 -; CHECK:         [[B_0:%.*]] = bitcast i1 [[B]] to i1 -; CHECK:         [[C_0:%.*]] = bitcast i1 [[C]] to i1 -; CHECK-NEXT:    br i1 [[OR2]], label [[IF:%.*]], label [[ELSE:%.*]] +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[OR2]] = or i1 [[OR1]], [[C]] Edge: [label [[TMP0:%.*]],label [[IF:%.*]]], RenamedOp: [[OR2]] } +; CHECK-NEXT:    [[OR2_0:%.*]] = bitcast i1 [[OR2]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[OR2]] = or i1 [[OR1]], [[C]] Edge: [label [[TMP0]],label [[ELSE:%.*]]], RenamedOp: [[OR2]] } +; CHECK-NEXT:    [[OR2_1:%.*]] = bitcast i1 [[OR2]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[OR1]] = or i1 [[A]], [[B]] Edge: [label [[TMP0]],label [[ELSE]]], RenamedOp: [[OR1]] } +; CHECK-NEXT:    [[OR1_0:%.*]] = bitcast i1 [[OR1]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison:i1 [[A]] Edge: [label [[TMP0]],label [[ELSE]]], RenamedOp: [[A]] } +; CHECK-NEXT:    [[A_0:%.*]] = bitcast i1 [[A]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison:i1 [[B]] Edge: [label [[TMP0]],label [[ELSE]]], RenamedOp: [[B]] } +; CHECK-NEXT:    [[B_0:%.*]] = bitcast i1 [[B]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison:i1 [[C]] Edge: [label [[TMP0]],label [[ELSE]]], RenamedOp: [[C]] } +; CHECK-NEXT:    [[C_0:%.*]] = bitcast i1 [[C]] to i1 +; CHECK-NEXT:    br i1 [[OR2]], label [[IF]], label [[ELSE]]  ; CHECK:       if:  ; CHECK-NEXT:    call void @foo(i1 [[A]])  ; CHECK-NEXT:    call void @foo(i1 [[B]]) @@ -485,11 +544,15 @@ define void @test_and_or_mixed(i1 %a, i1 %b, i1 %c) {  ; CHECK-LABEL: @test_and_or_mixed(  ; CHECK-NEXT:    [[OR:%.*]] = or i1 [[A:%.*]], [[B:%.*]]  ; CHECK-NEXT:    [[AND:%.*]] = and i1 [[OR]], [[C:%.*]] -; CHECK:         [[AND_0:%.*]] = bitcast i1 [[AND]] to i1 -; CHECK:         [[AND_1:%.*]] = bitcast i1 [[AND]] to i1 -; CHECK:         [[OR_0:%.*]] = bitcast i1 [[OR]] to i1 -; CHECK:         [[C_0:%.*]] = bitcast i1 [[C]] to i1 -; CHECK-NEXT:    br i1 [[AND]], label [[IF:%.*]], label [[ELSE:%.*]] +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[AND]] = and i1 [[OR]], [[C]] Edge: [label [[TMP0:%.*]],label [[IF:%.*]]], RenamedOp: [[AND]] } +; CHECK-NEXT:    [[AND_0:%.*]] = bitcast i1 [[AND]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[AND]] = and i1 [[OR]], [[C]] Edge: [label [[TMP0]],label [[ELSE:%.*]]], RenamedOp: [[AND]] } +; CHECK-NEXT:    [[AND_1:%.*]] = bitcast i1 [[AND]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[OR]] = or i1 [[A]], [[B]] Edge: [label [[TMP0]],label [[IF]]], RenamedOp: [[OR]] } +; CHECK-NEXT:    [[OR_0:%.*]] = bitcast i1 [[OR]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison:i1 [[C]] Edge: [label [[TMP0]],label [[IF]]], RenamedOp: [[C]] } +; CHECK-NEXT:    [[C_0:%.*]] = bitcast i1 [[C]] to i1 +; CHECK-NEXT:    br i1 [[AND]], label [[IF]], label [[ELSE]]  ; CHECK:       if:  ; CHECK-NEXT:    call void @foo(i1 [[A]])  ; CHECK-NEXT:    call void @foo(i1 [[B]]) @@ -542,16 +605,25 @@ define void @test_deep_and_chain(i1 %a1) {  ; CHECK-NEXT:    [[A13:%.*]] = and i1 [[A12]], true  ; CHECK-NEXT:    [[A14:%.*]] = and i1 [[A13]], true  ; CHECK-NEXT:    [[A15:%.*]] = and i1 [[A14]], true -; CHECK:         [[A15_0:%.*]] = bitcast i1 [[A15]] to i1 -; CHECK:         [[A15_1:%.*]] = bitcast i1 [[A15]] to i1 -; CHECK:         [[A14_0:%.*]] = bitcast i1 [[A14]] to i1 -; CHECK:         [[A13_0:%.*]] = bitcast i1 [[A13]] to i1 -; CHECK:         [[A12_0:%.*]] = bitcast i1 [[A12]] to i1 -; CHECK:         [[A11_0:%.*]] = bitcast i1 [[A11]] to i1 -; CHECK:         [[A10_0:%.*]] = bitcast i1 [[A10]] to i1 -; CHECK:         [[A9_0:%.*]] = bitcast i1 [[A9]] to i1 -; CHECK:         [[A8_0:%.*]] = bitcast i1 [[A8]] to i1 -; CHECK-NEXT:    br i1 [[A15]], label [[IF:%.*]], label [[ELSE:%.*]] +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[A15]] = and i1 [[A14]], true Edge: [label [[TMP0:%.*]],label [[IF:%.*]]], RenamedOp: [[A15]] } +; CHECK-NEXT:    [[A15_0:%.*]] = bitcast i1 [[A15]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[A15]] = and i1 [[A14]], true Edge: [label [[TMP0]],label [[ELSE:%.*]]], RenamedOp: [[A15]] } +; CHECK-NEXT:    [[A15_1:%.*]] = bitcast i1 [[A15]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[A14]] = and i1 [[A13]], true Edge: [label [[TMP0]],label [[IF]]], RenamedOp: [[A14]] } +; CHECK-NEXT:    [[A14_0:%.*]] = bitcast i1 [[A14]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[A13]] = and i1 [[A12]], true Edge: [label [[TMP0]],label [[IF]]], RenamedOp: [[A13]] } +; CHECK-NEXT:    [[A13_0:%.*]] = bitcast i1 [[A13]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[A12]] = and i1 [[A11]], true Edge: [label [[TMP0]],label [[IF]]], RenamedOp: [[A12]] } +; CHECK-NEXT:    [[A12_0:%.*]] = bitcast i1 [[A12]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[A11]] = and i1 [[A10]], true Edge: [label [[TMP0]],label [[IF]]], RenamedOp: [[A11]] } +; CHECK-NEXT:    [[A11_0:%.*]] = bitcast i1 [[A11]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[A10]] = and i1 [[A9]], true Edge: [label [[TMP0]],label [[IF]]], RenamedOp: [[A10]] } +; CHECK-NEXT:    [[A10_0:%.*]] = bitcast i1 [[A10]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[A9]] = and i1 [[A8]], true Edge: [label [[TMP0]],label [[IF]]], RenamedOp: [[A9]] } +; CHECK-NEXT:    [[A9_0:%.*]] = bitcast i1 [[A9]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[A8]] = and i1 [[A7]], true Edge: [label [[TMP0]],label [[IF]]], RenamedOp: [[A8]] } +; CHECK-NEXT:    [[A8_0:%.*]] = bitcast i1 [[A8]] to i1 +; CHECK-NEXT:    br i1 [[A15]], label [[IF]], label [[ELSE]]  ; CHECK:       if:  ; CHECK-NEXT:    call void @foo(i1 [[A1]])  ; CHECK-NEXT:    call void @foo(i1 [[A2]]) @@ -656,16 +728,25 @@ define void @test_deep_and_tree(i1 %a1) {  ; CHECK-NEXT:    [[A13:%.*]] = and i1 [[A12]], [[A12]]  ; CHECK-NEXT:    [[A14:%.*]] = and i1 [[A13]], [[A13]]  ; CHECK-NEXT:    [[A15:%.*]] = and i1 [[A14]], [[A14]] -; CHECK:         [[A15_0:%.*]] = bitcast i1 [[A15]] to i1 -; CHECK:         [[A15_1:%.*]] = bitcast i1 [[A15]] to i1 -; CHECK:         [[A14_0:%.*]] = bitcast i1 [[A14]] to i1 -; CHECK:         [[A13_0:%.*]] = bitcast i1 [[A13]] to i1 -; CHECK:         [[A12_0:%.*]] = bitcast i1 [[A12]] to i1 -; CHECK:         [[A11_0:%.*]] = bitcast i1 [[A11]] to i1 -; CHECK:         [[A10_0:%.*]] = bitcast i1 [[A10]] to i1 -; CHECK:         [[A9_0:%.*]] = bitcast i1 [[A9]] to i1 -; CHECK:         [[A8_0:%.*]] = bitcast i1 [[A8]] to i1 -; CHECK-NEXT:    br i1 [[A15]], label [[IF:%.*]], label [[ELSE:%.*]] +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[A15]] = and i1 [[A14]], [[A14]] Edge: [label [[TMP0:%.*]],label [[IF:%.*]]], RenamedOp: [[A15]] } +; CHECK-NEXT:    [[A15_0:%.*]] = bitcast i1 [[A15]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[A15]] = and i1 [[A14]], [[A14]] Edge: [label [[TMP0]],label [[ELSE:%.*]]], RenamedOp: [[A15]] } +; CHECK-NEXT:    [[A15_1:%.*]] = bitcast i1 [[A15]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[A14]] = and i1 [[A13]], [[A13]] Edge: [label [[TMP0]],label [[IF]]], RenamedOp: [[A14]] } +; CHECK-NEXT:    [[A14_0:%.*]] = bitcast i1 [[A14]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[A13]] = and i1 [[A12]], [[A12]] Edge: [label [[TMP0]],label [[IF]]], RenamedOp: [[A13]] } +; CHECK-NEXT:    [[A13_0:%.*]] = bitcast i1 [[A13]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[A12]] = and i1 [[A11]], [[A11]] Edge: [label [[TMP0]],label [[IF]]], RenamedOp: [[A12]] } +; CHECK-NEXT:    [[A12_0:%.*]] = bitcast i1 [[A12]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[A11]] = and i1 [[A10]], [[A10]] Edge: [label [[TMP0]],label [[IF]]], RenamedOp: [[A11]] } +; CHECK-NEXT:    [[A11_0:%.*]] = bitcast i1 [[A11]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[A10]] = and i1 [[A9]], [[A9]] Edge: [label [[TMP0]],label [[IF]]], RenamedOp: [[A10]] } +; CHECK-NEXT:    [[A10_0:%.*]] = bitcast i1 [[A10]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[A9]] = and i1 [[A8]], [[A8]] Edge: [label [[TMP0]],label [[IF]]], RenamedOp: [[A9]] } +; CHECK-NEXT:    [[A9_0:%.*]] = bitcast i1 [[A9]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[A8]] = and i1 [[A7]], [[A7]] Edge: [label [[TMP0]],label [[IF]]], RenamedOp: [[A8]] } +; CHECK-NEXT:    [[A8_0:%.*]] = bitcast i1 [[A8]] to i1 +; CHECK-NEXT:    br i1 [[A15]], label [[IF]], label [[ELSE]]  ; CHECK:       if:  ; CHECK-NEXT:    call void @foo(i1 [[A1]])  ; CHECK-NEXT:    call void @foo(i1 [[A2]]) @@ -770,16 +851,25 @@ define void @test_deep_or_tree(i1 %a1) {  ; CHECK-NEXT:    [[A13:%.*]] = or i1 [[A12]], [[A12]]  ; CHECK-NEXT:    [[A14:%.*]] = or i1 [[A13]], [[A13]]  ; CHECK-NEXT:    [[A15:%.*]] = or i1 [[A14]], [[A14]] -; CHECK:         [[A15_0:%.*]] = bitcast i1 [[A15]] to i1 -; CHECK:         [[A15_1:%.*]] = bitcast i1 [[A15]] to i1 -; CHECK:         [[A14_0:%.*]] = bitcast i1 [[A14]] to i1 -; CHECK:         [[A13_0:%.*]] = bitcast i1 [[A13]] to i1 -; CHECK:         [[A12_0:%.*]] = bitcast i1 [[A12]] to i1 -; CHECK:         [[A11_0:%.*]] = bitcast i1 [[A11]] to i1 -; CHECK:         [[A10_0:%.*]] = bitcast i1 [[A10]] to i1 -; CHECK:         [[A9_0:%.*]] = bitcast i1 [[A9]] to i1 -; CHECK:         [[A8_0:%.*]] = bitcast i1 [[A8]] to i1 -; CHECK-NEXT:    br i1 [[A15]], label [[IF:%.*]], label [[ELSE:%.*]] +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[A15]] = or i1 [[A14]], [[A14]] Edge: [label [[TMP0:%.*]],label [[IF:%.*]]], RenamedOp: [[A15]] } +; CHECK-NEXT:    [[A15_0:%.*]] = bitcast i1 [[A15]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[A15]] = or i1 [[A14]], [[A14]] Edge: [label [[TMP0]],label [[ELSE:%.*]]], RenamedOp: [[A15]] } +; CHECK-NEXT:    [[A15_1:%.*]] = bitcast i1 [[A15]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[A14]] = or i1 [[A13]], [[A13]] Edge: [label [[TMP0]],label [[ELSE]]], RenamedOp: [[A14]] } +; CHECK-NEXT:    [[A14_0:%.*]] = bitcast i1 [[A14]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[A13]] = or i1 [[A12]], [[A12]] Edge: [label [[TMP0]],label [[ELSE]]], RenamedOp: [[A13]] } +; CHECK-NEXT:    [[A13_0:%.*]] = bitcast i1 [[A13]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[A12]] = or i1 [[A11]], [[A11]] Edge: [label [[TMP0]],label [[ELSE]]], RenamedOp: [[A12]] } +; CHECK-NEXT:    [[A12_0:%.*]] = bitcast i1 [[A12]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[A11]] = or i1 [[A10]], [[A10]] Edge: [label [[TMP0]],label [[ELSE]]], RenamedOp: [[A11]] } +; CHECK-NEXT:    [[A11_0:%.*]] = bitcast i1 [[A11]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[A10]] = or i1 [[A9]], [[A9]] Edge: [label [[TMP0]],label [[ELSE]]], RenamedOp: [[A10]] } +; CHECK-NEXT:    [[A10_0:%.*]] = bitcast i1 [[A10]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[A9]] = or i1 [[A8]], [[A8]] Edge: [label [[TMP0]],label [[ELSE]]], RenamedOp: [[A9]] } +; CHECK-NEXT:    [[A9_0:%.*]] = bitcast i1 [[A9]] to i1 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 0 Comparison: [[A8]] = or i1 [[A7]], [[A7]] Edge: [label [[TMP0]],label [[ELSE]]], RenamedOp: [[A8]] } +; CHECK-NEXT:    [[A8_0:%.*]] = bitcast i1 [[A8]] to i1 +; CHECK-NEXT:    br i1 [[A15]], label [[IF]], label [[ELSE]]  ; CHECK:       if:  ; CHECK-NEXT:    call void @foo(i1 [[A1]])  ; CHECK-NEXT:    call void @foo(i1 [[A2]]) @@ -873,11 +963,16 @@ define void @test_assume_and_chain(i1 %a, i1 %b, i1 %c) {  ; CHECK-NEXT:    [[AND1:%.*]] = and i1 [[A:%.*]], [[B:%.*]]  ; CHECK-NEXT:    [[AND2:%.*]] = and i1 [[AND1]], [[C:%.*]]  ; CHECK-NEXT:    call void @llvm.assume(i1 [[AND2]]) -; CHECK:         [[TMP1:%.*]] = bitcast i1 [[C]] to i1 -; CHECK:         [[TMP2:%.*]] = bitcast i1 [[B]] to i1 -; CHECK:         [[TMP3:%.*]] = bitcast i1 [[A]] to i1 -; CHECK:         [[TMP4:%.*]] = bitcast i1 [[AND1]] to i1 -; CHECK:         [[TMP5:%.*]] = bitcast i1 [[AND2]] to i1 +; CHECK-NEXT:  ; assume predicate info { Comparison:i1 [[C]], RenamedOp: [[C]] } +; CHECK-NEXT:    [[TMP1:%.*]] = bitcast i1 [[C]] to i1 +; CHECK-NEXT:  ; assume predicate info { Comparison:i1 [[B]], RenamedOp: [[B]] } +; CHECK-NEXT:    [[TMP2:%.*]] = bitcast i1 [[B]] to i1 +; CHECK-NEXT:  ; assume predicate info { Comparison:i1 [[A]], RenamedOp: [[A]] } +; CHECK-NEXT:    [[TMP3:%.*]] = bitcast i1 [[A]] to i1 +; CHECK-NEXT:  ; assume predicate info { Comparison: [[AND1]] = and i1 [[A]], [[B]], RenamedOp: [[AND1]] } +; CHECK-NEXT:    [[TMP4:%.*]] = bitcast i1 [[AND1]] to i1 +; CHECK-NEXT:  ; assume predicate info { Comparison: [[AND2]] = and i1 [[AND1]], [[C]], RenamedOp: [[AND2]] } +; CHECK-NEXT:    [[TMP5:%.*]] = bitcast i1 [[AND2]] to i1  ; CHECK-NEXT:    call void @foo(i1 [[TMP3]])  ; CHECK-NEXT:    call void @foo(i1 [[TMP2]])  ; CHECK-NEXT:    call void @foo(i1 [[TMP1]]) @@ -901,7 +996,8 @@ define void @test_assume_or_chain(i1 %a, i1 %b, i1 %c) {  ; CHECK-NEXT:    [[OR1:%.*]] = or i1 [[A:%.*]], [[B:%.*]]  ; CHECK-NEXT:    [[OR2:%.*]] = or i1 [[OR1]], [[C:%.*]]  ; CHECK-NEXT:    call void @llvm.assume(i1 [[OR2]]) -; CHECK:         [[TMP1:%.*]] = bitcast i1 [[OR2]] to i1 +; CHECK-NEXT:  ; assume predicate info { Comparison: [[OR2]] = or i1 [[OR1]], [[C]], RenamedOp: [[OR2]] } +; CHECK-NEXT:    [[TMP1:%.*]] = bitcast i1 [[OR2]] to i1  ; CHECK-NEXT:    call void @foo(i1 [[A]])  ; CHECK-NEXT:    call void @foo(i1 [[B]])  ; CHECK-NEXT:    call void @foo(i1 [[C]]) @@ -937,14 +1033,22 @@ define void @test_assume_deep_and_tree(i1 %a1) {  ; CHECK-NEXT:    [[A14:%.*]] = and i1 [[A13]], [[A13]]  ; CHECK-NEXT:    [[A15:%.*]] = and i1 [[A14]], [[A14]]  ; CHECK-NEXT:    call void @llvm.assume(i1 [[A15]]) -; CHECK:         [[TMP1:%.*]] = bitcast i1 [[A8]] to i1 -; CHECK:         [[TMP2:%.*]] = bitcast i1 [[A9]] to i1 -; CHECK:         [[TMP3:%.*]] = bitcast i1 [[A10]] to i1 -; CHECK:         [[TMP4:%.*]] = bitcast i1 [[A11]] to i1 -; CHECK:         [[TMP5:%.*]] = bitcast i1 [[A12]] to i1 -; CHECK:         [[TMP6:%.*]] = bitcast i1 [[A13]] to i1 -; CHECK:         [[TMP7:%.*]] = bitcast i1 [[A14]] to i1 -; CHECK:         [[TMP8:%.*]] = bitcast i1 [[A15]] to i1 +; CHECK-NEXT:  ; assume predicate info { Comparison: [[A8]] = and i1 [[A7]], [[A7]], RenamedOp: [[A8]] } +; CHECK-NEXT:    [[TMP1:%.*]] = bitcast i1 [[A8]] to i1 +; CHECK-NEXT:  ; assume predicate info { Comparison: [[A9]] = and i1 [[A8]], [[A8]], RenamedOp: [[A9]] } +; CHECK-NEXT:    [[TMP2:%.*]] = bitcast i1 [[A9]] to i1 +; CHECK-NEXT:  ; assume predicate info { Comparison: [[A10]] = and i1 [[A9]], [[A9]], RenamedOp: [[A10]] } +; CHECK-NEXT:    [[TMP3:%.*]] = bitcast i1 [[A10]] to i1 +; CHECK-NEXT:  ; assume predicate info { Comparison: [[A11]] = and i1 [[A10]], [[A10]], RenamedOp: [[A11]] } +; CHECK-NEXT:    [[TMP4:%.*]] = bitcast i1 [[A11]] to i1 +; CHECK-NEXT:  ; assume predicate info { Comparison: [[A12]] = and i1 [[A11]], [[A11]], RenamedOp: [[A12]] } +; CHECK-NEXT:    [[TMP5:%.*]] = bitcast i1 [[A12]] to i1 +; CHECK-NEXT:  ; assume predicate info { Comparison: [[A13]] = and i1 [[A12]], [[A12]], RenamedOp: [[A13]] } +; CHECK-NEXT:    [[TMP6:%.*]] = bitcast i1 [[A13]] to i1 +; CHECK-NEXT:  ; assume predicate info { Comparison: [[A14]] = and i1 [[A13]], [[A13]], RenamedOp: [[A14]] } +; CHECK-NEXT:    [[TMP7:%.*]] = bitcast i1 [[A14]] to i1 +; CHECK-NEXT:  ; assume predicate info { Comparison: [[A15]] = and i1 [[A14]], [[A14]], RenamedOp: [[A15]] } +; CHECK-NEXT:    [[TMP8:%.*]] = bitcast i1 [[A15]] to i1  ; CHECK-NEXT:    call void @foo(i1 [[A1]])  ; CHECK-NEXT:    call void @foo(i1 [[A2]])  ; CHECK-NEXT:    call void @foo(i1 [[A3]]) @@ -1001,13 +1105,15 @@ define i32 @test_and_with_phinode(i32 %x) {  ; CHECK-NEXT:    [[XGE1:%.*]] = icmp uge i32 [[X:%.*]], 1  ; CHECK-NEXT:    [[XLT2:%.*]] = icmp ult i32 [[X]], 2  ; CHECK-NEXT:    [[AND:%.*]] = and i1 [[XGE1]], [[XLT2]] -; CHECK:         [[X_0_1:%.*]] = bitcast i32 [[X]] to i32 -; CHECK:         [[X_0_2:%.*]] = bitcast i32 [[X_0_1]] to i32 -; CHECK-NEXT:    br i1 [[AND]], label [[PHI:%.*]], label [[NOPE:%.*]] +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[XGE1]] = icmp uge i32 [[X]], 1 Edge: [label [[ENTRY:%.*]],label [[PHI:%.*]]], RenamedOp: [[X]] } +; CHECK-NEXT:    [[X_0_1:%.*]] = bitcast i32 [[X]] to i32 +; CHECK-NEXT:  ; branch predicate info { TrueEdge: 1 Comparison: [[XLT2]] = icmp ult i32 [[X]], 2 Edge: [label [[ENTRY]],label [[PHI]]], RenamedOp: [[X]] } +; CHECK-NEXT:    [[X_0_2:%.*]] = bitcast i32 [[X_0_1]] to i32 +; CHECK-NEXT:    br i1 [[AND]], label [[PHI]], label [[NOPE:%.*]]  ; CHECK:       nope:  ; CHECK-NEXT:    br label [[PHI]]  ; CHECK:       phi: -; CHECK-NEXT:    [[RES:%.*]] = phi i32 [ [[X_0_2]], [[ENTRY:%.*]] ], [ 1, [[NOPE]] ] +; CHECK-NEXT:    [[RES:%.*]] = phi i32 [ [[X_0_2]], [[ENTRY]] ], [ 1, [[NOPE]] ]  ; CHECK-NEXT:    ret i32 [[RES]]  ;  entry: | 
