; NOTE: Assertions have been autogenerated by utils/update_test_checks.py ; RUN: opt < %s -passes=indvars -indvars-predicate-loops=1 -S | FileCheck %s ; Nested loops with body using loop convergence token should be skipped by IndVarSimplify. declare token @llvm.experimental.convergence.entry() #0 define void @nested(i32 %tidx, i32 %tidy, ptr %array) #0 { ; CHECK-LABEL: @nested( ; CHECK-NEXT: entry: ; CHECK-NEXT: [[TMP0:%.*]] = tail call token @llvm.experimental.convergence.entry() ; CHECK-NEXT: [[MUL_I:%.*]] = shl nsw i32 [[TIDX:%.*]], 3 ; CHECK-NEXT: [[ADD_I:%.*]] = add nsw i32 [[MUL_I]], [[TIDY:%.*]] ; CHECK-NEXT: br label [[FOR_COND_I:%.*]] ; CHECK: for.cond.i: ; CHECK-NEXT: [[I_0_I:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ [[INC10_I:%.*]], [[CLEANUP_I:%.*]] ] ; CHECK-NEXT: [[TMP1:%.*]] = call token @llvm.experimental.convergence.loop() [ "convergencectrl"(token [[TMP0]]) ] ; CHECK-NEXT: [[CMP_I:%.*]] = icmp samesign ult i32 [[I_0_I]], 8 ; CHECK-NEXT: br i1 [[CMP_I]], label [[FOR_COND1_I_PREHEADER:%.*]], label [[EXIT:%.*]] ; CHECK: for.cond1.i.preheader: ; CHECK-NEXT: [[CMP5_I:%.*]] = icmp eq i32 [[I_0_I]], [[TIDX]] ; CHECK-NEXT: br label [[FOR_COND1_I:%.*]] ; CHECK: for.cond1.i: ; CHECK-NEXT: [[J_0_I:%.*]] = phi i32 [ [[INC_I:%.*]], [[FOR_BODY4_I:%.*]] ], [ 0, [[FOR_COND1_I_PREHEADER]] ] ; CHECK-NEXT: [[TMP2:%.*]] = call token @llvm.experimental.convergence.loop() [ "convergencectrl"(token [[TMP1]]) ] ; CHECK-NEXT: [[CMP2_I:%.*]] = icmp samesign ult i32 [[J_0_I]], 8 ; CHECK-NEXT: br i1 [[CMP2_I]], label [[FOR_BODY4_I]], label [[CLEANUP_I_LOOPEXIT:%.*]] ; CHECK: for.body4.i: ; CHECK-NEXT: [[CMP6_I:%.*]] = icmp eq i32 [[J_0_I]], [[TIDY]] ; CHECK-NEXT: [[OR_COND:%.*]] = select i1 [[CMP5_I]], i1 [[CMP6_I]], i1 false ; CHECK-NEXT: [[INC_I]] = add nuw nsw i32 [[J_0_I]], 1 ; CHECK-NEXT: br i1 [[OR_COND]], label [[IF_THEN_I:%.*]], label [[FOR_COND1_I]] ; CHECK: cleanup.i.loopexit: ; CHECK-NEXT: br label [[CLEANUP_I]] ; CHECK: if.then.i: ; CHECK-NEXT: [[HLSL_WAVE_ACTIVE_MAX7_I:%.*]] = call spir_func i32 @llvm.spv.wave.reduce.umax.i32(i32 [[ADD_I]]) [ "convergencectrl"(token [[TMP2]]) ] ; CHECK-NEXT: [[TMP3:%.*]] = getelementptr inbounds i32, ptr [[ARRAY:%.*]], i32 [[ADD_I]] ; CHECK-NEXT: store i32 [[HLSL_WAVE_ACTIVE_MAX7_I]], ptr [[TMP3]], align 4 ; CHECK-NEXT: br label [[CLEANUP_I]] ; CHECK: cleanup.i: ; CHECK-NEXT: [[INC10_I]] = add nuw nsw i32 [[I_0_I]], 1 ; CHECK-NEXT: br label [[FOR_COND_I]] ; CHECK: exit: ; CHECK-NEXT: ret void ; entry: %0 = tail call token @llvm.experimental.convergence.entry() %mul.i = shl nsw i32 %tidx, 3 %add.i = add nsw i32 %mul.i, %tidy br label %for.cond.i for.cond.i: %i.0.i = phi i32 [ 0, %entry ], [ %inc10.i, %cleanup.i ] %2 = call token @llvm.experimental.convergence.loop() [ "convergencectrl"(token %0) ] %cmp.i = icmp ult i32 %i.0.i, 8 br i1 %cmp.i, label %for.cond1.i.preheader, label %exit for.cond1.i.preheader: %cmp5.i = icmp eq i32 %i.0.i, %tidx br label %for.cond1.i for.cond1.i: %j.0.i = phi i32 [ %inc.i, %for.body4.i ], [ 0, %for.cond1.i.preheader ] %3 = call token @llvm.experimental.convergence.loop() [ "convergencectrl"(token %2) ] %cmp2.i = icmp ult i32 %j.0.i, 8 br i1 %cmp2.i, label %for.body4.i, label %cleanup.i.loopexit for.body4.i: %cmp6.i = icmp eq i32 %j.0.i, %tidy %or.cond = select i1 %cmp5.i, i1 %cmp6.i, i1 false %inc.i = add nsw i32 %j.0.i, 1 br i1 %or.cond, label %if.then.i, label %for.cond1.i cleanup.i.loopexit: br label %cleanup.i if.then.i: %hlsl.wave.active.max7.i = call spir_func i32 @llvm.spv.wave.reduce.umax.i32(i32 %add.i) [ "convergencectrl"(token %3) ] %4 = getelementptr inbounds i32, ptr %array, i32 %add.i store i32 %hlsl.wave.active.max7.i, ptr %4, align 4 br label %cleanup.i cleanup.i: %inc10.i = add nsw i32 %i.0.i, 1 br label %for.cond.i exit: ret void } declare token @llvm.experimental.convergence.loop() #0 declare i32 @llvm.spv.wave.reduce.umax.i32(i32) #0 attributes #0 = { convergent }