; NOTE: Assertions have been autogenerated by utils/update_test_checks.py ; RUN: opt < %s -passes=loop-unroll -unroll-runtime -unroll-allow-partial -S | FileCheck %s declare void @f() convergent declare void @g() ; Although this loop contains a convergent instruction, it should be ; fully unrolled. define i32 @full_unroll() { ; CHECK-LABEL: @full_unroll( ; CHECK-NEXT: entry: ; CHECK-NEXT: [[ANCHOR:%.*]] = call token @llvm.experimental.convergence.anchor() ; CHECK-NEXT: br label [[L3:%.*]] ; CHECK: l3: ; CHECK-NEXT: [[TOK_LOOP:%.*]] = call token @llvm.experimental.convergence.loop() [ "convergencectrl"(token [[ANCHOR]]) ] ; CHECK-NEXT: br label [[A:%.*]] ; CHECK: a: ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ] ; CHECK-NEXT: br label [[A_1:%.*]] ; CHECK: a.1: ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ] ; CHECK-NEXT: br label [[A_2:%.*]] ; CHECK: a.2: ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ] ; CHECK-NEXT: ret i32 0 ; entry: %anchor = call token @llvm.experimental.convergence.anchor() br label %l3 l3: %x.0 = phi i32 [ 0, %entry ], [ %inc, %a ] %tok.loop = call token @llvm.experimental.convergence.loop() [ "convergencectrl"(token %anchor) ] %inc = add nsw i32 %x.0, 1 %exitcond = icmp eq i32 %inc, 3 br label %a a: call void @f() [ "convergencectrl"(token %tok.loop) ] br i1 %exitcond, label %exit, label %l3 exit: ret i32 0 } ; This loop contains a convergent instruction, but it should be partially ; unrolled. The unroll count is the largest power of 2 that divides the ; multiple -- 4, in this case. define i32 @runtime_unroll(i32 %n) { ; CHECK-LABEL: @runtime_unroll( ; CHECK-NEXT: entry: ; CHECK-NEXT: [[ANCHOR:%.*]] = call token @llvm.experimental.convergence.anchor() ; CHECK-NEXT: [[LOOP_CTL:%.*]] = mul nsw i32 [[N:%.*]], 12 ; CHECK-NEXT: br label [[L3:%.*]] ; CHECK: l3: ; CHECK-NEXT: [[X_0:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ [[INC_3:%.*]], [[A_3:%.*]] ] ; CHECK-NEXT: [[TOK_LOOP:%.*]] = call token @llvm.experimental.convergence.loop() [ "convergencectrl"(token [[ANCHOR]]) ] ; CHECK-NEXT: br label [[A:%.*]] ; CHECK: a: ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ] ; CHECK-NEXT: br label [[A_1:%.*]] ; CHECK: a.1: ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ] ; CHECK-NEXT: br label [[A_2:%.*]] ; CHECK: a.2: ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ] ; CHECK-NEXT: br label [[A_3]] ; CHECK: a.3: ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ] ; CHECK-NEXT: [[INC_3]] = add nsw i32 [[X_0]], 4 ; CHECK-NEXT: [[EXITCOND_3:%.*]] = icmp eq i32 [[INC_3]], [[LOOP_CTL]] ; CHECK-NEXT: br i1 [[EXITCOND_3]], label [[EXIT:%.*]], label [[L3]] ; CHECK: exit: ; CHECK-NEXT: ret i32 0 ; entry: %anchor = call token @llvm.experimental.convergence.anchor() %loop_ctl = mul nsw i32 %n, 12 br label %l3 l3: %x.0 = phi i32 [ 0, %entry ], [ %inc, %a ] %tok.loop = call token @llvm.experimental.convergence.loop() [ "convergencectrl"(token %anchor) ] br label %a a: call void @f() [ "convergencectrl"(token %tok.loop) ] %inc = add nsw i32 %x.0, 1 %exitcond = icmp eq i32 %inc, %loop_ctl br i1 %exitcond, label %exit, label %l3 exit: ret i32 0 } ; This loop contains a convergent instruction, so its partial unroll ; count must divide its trip multiple. This overrides its unroll ; pragma -- we unroll exactly 8 times, even though 16 is requested. define i32 @pragma_unroll(i32 %n) { ; CHECK-LABEL: @pragma_unroll( ; CHECK-NEXT: entry: ; CHECK-NEXT: [[ANCHOR:%.*]] = call token @llvm.experimental.convergence.anchor() ; CHECK-NEXT: [[LOOP_CTL:%.*]] = mul nsw i32 [[N:%.*]], 24 ; CHECK-NEXT: br label [[L3:%.*]], !llvm.loop [[LOOP0:![0-9]+]] ; CHECK: l3: ; CHECK-NEXT: [[X_0:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ [[INC_7:%.*]], [[A_7:%.*]] ] ; CHECK-NEXT: [[TOK_LOOP:%.*]] = call token @llvm.experimental.convergence.loop() [ "convergencectrl"(token [[ANCHOR]]) ] ; CHECK-NEXT: br label [[A:%.*]] ; CHECK: a: ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ] ; CHECK-NEXT: br label [[A_1:%.*]] ; CHECK: a.1: ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ] ; CHECK-NEXT: br label [[A_2:%.*]] ; CHECK: a.2: ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ] ; CHECK-NEXT: br label [[A_3:%.*]] ; CHECK: a.3: ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ] ; CHECK-NEXT: br label [[A_4:%.*]] ; CHECK: a.4: ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ] ; CHECK-NEXT: br label [[A_5:%.*]] ; CHECK: a.5: ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ] ; CHECK-NEXT: br label [[A_6:%.*]] ; CHECK: a.6: ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ] ; CHECK-NEXT: br label [[A_7]] ; CHECK: a.7: ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ] ; CHECK-NEXT: [[INC_7]] = add nsw i32 [[X_0]], 8 ; CHECK-NEXT: [[EXITCOND_7:%.*]] = icmp eq i32 [[INC_7]], [[LOOP_CTL]] ; CHECK-NEXT: br i1 [[EXITCOND_7]], label [[EXIT:%.*]], label [[L3]], !llvm.loop [[LOOP2:![0-9]+]] ; CHECK: exit: ; CHECK-NEXT: ret i32 0 ; entry: %anchor = call token @llvm.experimental.convergence.anchor() %loop_ctl = mul nsw i32 %n, 24 br label %l3, !llvm.loop !0 l3: %x.0 = phi i32 [ 0, %entry ], [ %inc, %a ] %tok.loop = call token @llvm.experimental.convergence.loop() [ "convergencectrl"(token %anchor) ] br label %a a: call void @f() [ "convergencectrl"(token %tok.loop) ] %inc = add nsw i32 %x.0, 1 %exitcond = icmp eq i32 %inc, %loop_ctl br i1 %exitcond, label %exit, label %l3, !llvm.loop !0 exit: ret i32 0 } ; This loop contains a convergent instruction. Since the pragma loop unroll ; count 2 divides trip count 4. The loop unroll should respect the pragma. define void @pragma_unroll_divisible_trip_count() { ; CHECK-LABEL: @pragma_unroll_divisible_trip_count( ; CHECK-NEXT: entry: ; CHECK-NEXT: [[ANCHOR:%.*]] = call token @llvm.experimental.convergence.anchor() ; CHECK-NEXT: br label [[L3:%.*]], !llvm.loop [[LOOP4:![0-9]+]] ; CHECK: l3: ; CHECK-NEXT: [[X_0:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ [[INC_1:%.*]], [[L3]] ] ; CHECK-NEXT: [[TOK_LOOP:%.*]] = call token @llvm.experimental.convergence.loop() [ "convergencectrl"(token [[ANCHOR]]) ] ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ] ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ] ; CHECK-NEXT: [[INC_1]] = add nuw nsw i32 [[X_0]], 2 ; CHECK-NEXT: [[EXITCOND_1:%.*]] = icmp eq i32 [[INC_1]], 4 ; CHECK-NEXT: br i1 [[EXITCOND_1]], label [[EXIT:%.*]], label [[L3]], !llvm.loop [[LOOP6:![0-9]+]] ; CHECK: exit: ; CHECK-NEXT: ret void ; entry: %anchor = call token @llvm.experimental.convergence.anchor() br label %l3, !llvm.loop !1 l3: %x.0 = phi i32 [ 0, %entry ], [ %inc, %l3 ] %tok.loop = call token @llvm.experimental.convergence.loop() [ "convergencectrl"(token %anchor) ] call void @f() [ "convergencectrl"(token %tok.loop) ] %inc = add nsw i32 %x.0, 1 %exitcond = icmp eq i32 %inc, 4 br i1 %exitcond, label %exit, label %l3, !llvm.loop !1 exit: ret void } ; This loop contains a convergent instruction. Since the pragma loop unroll ; count 2 divides trip multiple 2. The loop unroll should respect the pragma. define i32 @pragma_unroll_divisible_trip_multiple(i32 %n) { ; CHECK-LABEL: @pragma_unroll_divisible_trip_multiple( ; CHECK-NEXT: entry: ; CHECK-NEXT: [[ANCHOR:%.*]] = call token @llvm.experimental.convergence.anchor() ; CHECK-NEXT: [[LOOP_CTL:%.*]] = mul nsw i32 [[N:%.*]], 2 ; CHECK-NEXT: br label [[L3:%.*]], !llvm.loop [[LOOP4]] ; CHECK: l3: ; CHECK-NEXT: [[X_0:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ [[INC_1:%.*]], [[L3]] ] ; CHECK-NEXT: [[TOK_LOOP:%.*]] = call token @llvm.experimental.convergence.loop() [ "convergencectrl"(token [[ANCHOR]]) ] ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ] ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ] ; CHECK-NEXT: [[INC_1]] = add nsw i32 [[X_0]], 2 ; CHECK-NEXT: [[EXITCOND_1:%.*]] = icmp eq i32 [[INC_1]], [[LOOP_CTL]] ; CHECK-NEXT: br i1 [[EXITCOND_1]], label [[EXIT:%.*]], label [[L3]], !llvm.loop [[LOOP7:![0-9]+]] ; CHECK: exit: ; CHECK-NEXT: ret i32 0 ; entry: %anchor = call token @llvm.experimental.convergence.anchor() %loop_ctl = mul nsw i32 %n, 2 br label %l3, !llvm.loop !1 l3: %x.0 = phi i32 [ 0, %entry ], [ %inc, %l3 ] %tok.loop = call token @llvm.experimental.convergence.loop() [ "convergencectrl"(token %anchor) ] call void @f() [ "convergencectrl"(token %tok.loop) ] %inc = add nsw i32 %x.0, 1 %exitcond = icmp eq i32 %inc, %loop_ctl br i1 %exitcond, label %exit, label %l3, !llvm.loop !1 exit: ret i32 0 } ; This loop contains a convergent instruction. Since the pragma loop unroll ; count 2 is unknown to divide runtime trip count, the loop is not unrolled ; since remainder is forbidden for unrolling convergent loop. define i32 @pragma_unroll_indivisible_runtime_trip_count(i32 %n) { ; CHECK-LABEL: @pragma_unroll_indivisible_runtime_trip_count( ; CHECK-NEXT: entry: ; CHECK-NEXT: [[ANCHOR:%.*]] = call token @llvm.experimental.convergence.anchor() ; CHECK-NEXT: br label [[L3:%.*]], !llvm.loop [[LOOP4]] ; CHECK: l3: ; CHECK-NEXT: [[X_0:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ [[INC:%.*]], [[L3]] ] ; CHECK-NEXT: [[TOK_LOOP:%.*]] = call token @llvm.experimental.convergence.loop() [ "convergencectrl"(token [[ANCHOR]]) ] ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ] ; CHECK-NEXT: [[INC]] = add nsw i32 [[X_0]], 1 ; CHECK-NEXT: [[EXITCOND:%.*]] = icmp eq i32 [[INC]], [[N:%.*]] ; CHECK-NEXT: br i1 [[EXITCOND]], label [[EXIT:%.*]], label [[L3]], !llvm.loop [[LOOP4]] ; CHECK: exit: ; CHECK-NEXT: ret i32 0 ; entry: %anchor = call token @llvm.experimental.convergence.anchor() br label %l3, !llvm.loop !1 l3: %x.0 = phi i32 [ 0, %entry ], [ %inc, %l3 ] %tok.loop = call token @llvm.experimental.convergence.loop() [ "convergencectrl"(token %anchor) ] call void @f() [ "convergencectrl"(token %tok.loop) ] %inc = add nsw i32 %x.0, 1 %exitcond = icmp eq i32 %inc, %n br i1 %exitcond, label %exit, label %l3, !llvm.loop !1 exit: ret i32 0 } ; This loop contains a convergent instruction. Since the pragma loop unroll ; count 2 does not divide trip count 5, the loop is not unrolled by 2 ; since remainder is forbidden for unrolling convergent loop. Instead, the ; loop gets fully unrolled. define i32 @pragma_unroll_indivisible_trip_count() { ; CHECK-LABEL: @pragma_unroll_indivisible_trip_count( ; CHECK-NEXT: entry: ; CHECK-NEXT: [[ANCHOR:%.*]] = call token @llvm.experimental.convergence.anchor() ; CHECK-NEXT: br label [[L3:%.*]], !llvm.loop [[LOOP4]] ; CHECK: l3: ; CHECK-NEXT: [[TOK_LOOP:%.*]] = call token @llvm.experimental.convergence.loop() [ "convergencectrl"(token [[ANCHOR]]) ] ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ] ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ] ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ] ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ] ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ] ; CHECK-NEXT: ret i32 0 ; entry: %anchor = call token @llvm.experimental.convergence.anchor() br label %l3, !llvm.loop !1 l3: %x.0 = phi i32 [ 0, %entry ], [ %inc, %l3 ] %tok.loop = call token @llvm.experimental.convergence.loop() [ "convergencectrl"(token %anchor) ] call void @f() [ "convergencectrl"(token %tok.loop) ] %inc = add nsw i32 %x.0, 1 %exitcond = icmp eq i32 %inc, 5 br i1 %exitcond, label %exit, label %l3, !llvm.loop !1 exit: ret i32 0 } ; This loop contains a convergent instruction that is anchored inside the loop ; itself. It is unrolled by 2 with remainder, as requested by the loop metadata. define i32 @pragma_unroll_with_remainder(i32 %n) { ; CHECK-LABEL: @pragma_unroll_with_remainder( ; CHECK-NEXT: entry: ; CHECK-NEXT: [[TMP0:%.*]] = freeze i32 [[N:%.*]] ; CHECK-NEXT: [[TMP1:%.*]] = add i32 [[TMP0]], -1 ; CHECK-NEXT: [[XTRAITER:%.*]] = and i32 [[TMP0]], 1 ; CHECK-NEXT: [[TMP2:%.*]] = icmp ult i32 [[TMP1]], 1 ; CHECK-NEXT: br i1 [[TMP2]], label [[EXIT_UNR_LCSSA:%.*]], label [[ENTRY_NEW:%.*]] ; CHECK: entry.new: ; CHECK-NEXT: [[UNROLL_ITER:%.*]] = sub i32 [[TMP0]], [[XTRAITER]] ; CHECK-NEXT: br label [[L3:%.*]], !llvm.loop [[LOOP4]] ; CHECK: l3: ; CHECK-NEXT: [[X_0:%.*]] = phi i32 [ 0, [[ENTRY_NEW]] ], [ [[INC_1:%.*]], [[L3]] ] ; CHECK-NEXT: [[NITER:%.*]] = phi i32 [ 0, [[ENTRY_NEW]] ], [ [[NITER_NEXT_1:%.*]], [[L3]] ] ; CHECK-NEXT: [[TOK_LOOP:%.*]] = call token @llvm.experimental.convergence.anchor() ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ] ; CHECK-NEXT: [[TOK_LOOP_1:%.*]] = call token @llvm.experimental.convergence.anchor() ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP_1]]) ] ; CHECK-NEXT: [[INC_1]] = add nsw i32 [[X_0]], 2 ; CHECK-NEXT: [[NITER_NEXT_1]] = add i32 [[NITER]], 2 ; CHECK-NEXT: [[NITER_NCMP_1:%.*]] = icmp eq i32 [[NITER_NEXT_1]], [[UNROLL_ITER]] ; CHECK-NEXT: br i1 [[NITER_NCMP_1]], label [[EXIT_UNR_LCSSA_LOOPEXIT:%.*]], label [[L3]], !llvm.loop [[LOOP8:![0-9]+]] ; CHECK: exit.unr-lcssa.loopexit: ; CHECK-NEXT: br label [[EXIT_UNR_LCSSA]] ; CHECK: exit.unr-lcssa: ; CHECK-NEXT: [[LCMP_MOD:%.*]] = icmp ne i32 [[XTRAITER]], 0 ; CHECK-NEXT: br i1 [[LCMP_MOD]], label [[L3_EPIL_PREHEADER:%.*]], label [[EXIT:%.*]] ; CHECK: l3.epil.preheader: ; CHECK-NEXT: br label [[L3_EPIL:%.*]] ; CHECK: l3.epil: ; CHECK-NEXT: [[TOK_LOOP_EPIL:%.*]] = call token @llvm.experimental.convergence.anchor() ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP_EPIL]]) ] ; CHECK-NEXT: br label [[EXIT]] ; CHECK: exit: ; CHECK-NEXT: ret i32 0 ; entry: br label %l3, !llvm.loop !1 l3: %x.0 = phi i32 [ 0, %entry ], [ %inc, %l3 ] %tok.loop = call token @llvm.experimental.convergence.anchor() call void @f() [ "convergencectrl"(token %tok.loop) ] %inc = add nsw i32 %x.0, 1 %exitcond = icmp eq i32 %inc, %n br i1 %exitcond, label %exit, label %l3, !llvm.loop !1 exit: ret i32 0 } ; Don't unroll a loop that is extended by convergence controls. ; ; We could theoretically duplicate the extension part, but this is not ; implemented. define i32 @extended_loop(i32 %n) { ; CHECK-LABEL: @extended_loop( ; CHECK-NEXT: entry: ; CHECK-NEXT: br label [[L3:%.*]], !llvm.loop [[LOOP4]] ; CHECK: l3: ; CHECK-NEXT: [[X_0:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ [[INC:%.*]], [[L3]] ] ; CHECK-NEXT: [[TOK_LOOP:%.*]] = call token @llvm.experimental.convergence.anchor() ; CHECK-NEXT: [[INC]] = add nsw i32 [[X_0]], 1 ; CHECK-NEXT: [[EXITCOND:%.*]] = icmp eq i32 [[INC]], [[N:%.*]] ; CHECK-NEXT: br i1 [[EXITCOND]], label [[EXIT:%.*]], label [[L3]], !llvm.loop [[LOOP4]] ; CHECK: exit: ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ] ; CHECK-NEXT: ret i32 0 ; entry: br label %l3, !llvm.loop !1 l3: %x.0 = phi i32 [ 0, %entry ], [ %inc, %l3 ] %tok.loop = call token @llvm.experimental.convergence.anchor() %inc = add nsw i32 %x.0, 1 %exitcond = icmp eq i32 %inc, %n br i1 %exitcond, label %exit, label %l3, !llvm.loop !1 exit: call void @f() [ "convergencectrl"(token %tok.loop) ] ret i32 0 } ; Inner loop is extended beyond the outer loop. No unrolling possible. define i32 @extended_inner_loop_1(i32 %n, i1 %cond) { ; CHECK-LABEL: @extended_inner_loop_1( ; CHECK-NEXT: entry: ; CHECK-NEXT: br label [[L3:%.*]] ; CHECK: l3: ; CHECK-NEXT: [[X_0:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ [[INC:%.*]], [[LATCH:%.*]] ] ; CHECK-NEXT: [[TOK_LOOP:%.*]] = call token @llvm.experimental.convergence.anchor() ; CHECK-NEXT: [[INC]] = add nsw i32 [[X_0]], 1 ; CHECK-NEXT: [[EXITCOND:%.*]] = icmp eq i32 [[INC]], 4 ; CHECK-NEXT: br label [[L2:%.*]], !llvm.loop [[LOOP4]] ; CHECK: l2: ; CHECK-NEXT: [[TOK_L2:%.*]] = call token @llvm.experimental.convergence.anchor() ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_L2]]) ] ; CHECK-NEXT: br i1 [[COND:%.*]], label [[L2]], label [[LATCH]], !llvm.loop [[LOOP4]] ; CHECK: latch: ; CHECK-NEXT: br i1 [[EXITCOND]], label [[EXIT:%.*]], label [[L3]] ; CHECK: exit: ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_L2]]) ] ; CHECK-NEXT: ret i32 0 ; entry: br label %l3 l3: %x.0 = phi i32 [ 0, %entry ], [ %inc, %latch ] %tok.loop = call token @llvm.experimental.convergence.anchor() %inc = add nsw i32 %x.0, 1 %exitcond = icmp eq i32 %inc, 4 br label %l2, !llvm.loop !1 l2: %tok.l2 = call token @llvm.experimental.convergence.anchor() call void @f() [ "convergencectrl"(token %tok.l2) ] br i1 %cond, label %l2, label %latch, !llvm.loop !1 latch: br i1 %exitcond, label %exit, label %l3 exit: call void @f() [ "convergencectrl"(token %tok.l2) ] ret i32 0 } ; Inner loop is extended inside the outer loop. Outer loop is unrolled. define i32 @extended_inner_loop_2(i32 %n, i1 %cond) { ; CHECK-LABEL: @extended_inner_loop_2( ; CHECK-NEXT: entry: ; CHECK-NEXT: br label [[L3:%.*]] ; CHECK: l3: ; CHECK-NEXT: br label [[L2:%.*]], !llvm.loop [[LOOP4]] ; CHECK: l2: ; CHECK-NEXT: [[TOK_L2:%.*]] = call token @llvm.experimental.convergence.anchor() ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_L2]]) ] ; CHECK-NEXT: br i1 [[COND:%.*]], label [[L2]], label [[LATCH:%.*]], !llvm.loop [[LOOP4]] ; CHECK: latch: ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_L2]]) ] ; CHECK-NEXT: br label [[L2_1:%.*]], !llvm.loop [[LOOP4]] ; CHECK: l2.1: ; CHECK-NEXT: [[TOK_L2_1:%.*]] = call token @llvm.experimental.convergence.anchor() ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_L2_1]]) ] ; CHECK-NEXT: br i1 [[COND]], label [[L2_1]], label [[LATCH_1:%.*]], !llvm.loop [[LOOP4]] ; CHECK: latch.1: ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_L2_1]]) ] ; CHECK-NEXT: br label [[L2_2:%.*]], !llvm.loop [[LOOP4]] ; CHECK: l2.2: ; CHECK-NEXT: [[TOK_L2_2:%.*]] = call token @llvm.experimental.convergence.anchor() ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_L2_2]]) ] ; CHECK-NEXT: br i1 [[COND]], label [[L2_2]], label [[LATCH_2:%.*]], !llvm.loop [[LOOP4]] ; CHECK: latch.2: ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_L2_2]]) ] ; CHECK-NEXT: br label [[L2_3:%.*]], !llvm.loop [[LOOP4]] ; CHECK: l2.3: ; CHECK-NEXT: [[TOK_L2_3:%.*]] = call token @llvm.experimental.convergence.anchor() ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_L2_3]]) ] ; CHECK-NEXT: br i1 [[COND]], label [[L2_3]], label [[LATCH_3:%.*]], !llvm.loop [[LOOP4]] ; CHECK: latch.3: ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_L2_3]]) ] ; CHECK-NEXT: ret i32 0 ; entry: br label %l3 l3: %x.0 = phi i32 [ 0, %entry ], [ %inc, %latch ] %tok.loop = call token @llvm.experimental.convergence.anchor() %inc = add nsw i32 %x.0, 1 %exitcond = icmp eq i32 %inc, 4 br label %l2, !llvm.loop !1 l2: %tok.l2 = call token @llvm.experimental.convergence.anchor() call void @f() [ "convergencectrl"(token %tok.l2) ] br i1 %cond, label %l2, label %latch, !llvm.loop !1 latch: call void @f() [ "convergencectrl"(token %tok.l2) ] br i1 %exitcond, label %exit, label %l3 exit: ret i32 0 } ; No extension. Both loops unrolled. define i32 @unroll_nest(i32 %n, i1 %cond) { ; CHECK-LABEL: @unroll_nest( ; CHECK-NEXT: entry: ; CHECK-NEXT: br label [[L3:%.*]] ; CHECK: l3: ; CHECK-NEXT: br label [[L2:%.*]], !llvm.loop [[LOOP4]] ; CHECK: l2: ; CHECK-NEXT: [[TOK_L2:%.*]] = call token @llvm.experimental.convergence.anchor() ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_L2]]) ] ; CHECK-NEXT: br i1 [[COND:%.*]], label [[L2_1:%.*]], label [[LATCH:%.*]], !llvm.loop [[LOOP4]] ; CHECK: l2.1: ; CHECK-NEXT: [[TOK_L2_1:%.*]] = call token @llvm.experimental.convergence.anchor() ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_L2_1]]) ] ; CHECK-NEXT: br i1 [[COND]], label [[L2]], label [[LATCH]], !llvm.loop [[LOOP9:![0-9]+]] ; CHECK: latch: ; CHECK-NEXT: br label [[L2_12:%.*]], !llvm.loop [[LOOP4]] ; CHECK: l2.12: ; CHECK-NEXT: [[TOK_L2_11:%.*]] = call token @llvm.experimental.convergence.anchor() ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_L2_11]]) ] ; CHECK-NEXT: br i1 [[COND]], label [[L2_1_1:%.*]], label [[LATCH_1:%.*]], !llvm.loop [[LOOP4]] ; CHECK: l2.1.1: ; CHECK-NEXT: [[TOK_L2_1_1:%.*]] = call token @llvm.experimental.convergence.anchor() ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_L2_1_1]]) ] ; CHECK-NEXT: br i1 [[COND]], label [[L2_12]], label [[LATCH_1]], !llvm.loop [[LOOP9]] ; CHECK: latch.1: ; CHECK-NEXT: br label [[L2_2:%.*]], !llvm.loop [[LOOP4]] ; CHECK: l2.2: ; CHECK-NEXT: [[TOK_L2_2:%.*]] = call token @llvm.experimental.convergence.anchor() ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_L2_2]]) ] ; CHECK-NEXT: br i1 [[COND]], label [[L2_1_2:%.*]], label [[LATCH_2:%.*]], !llvm.loop [[LOOP4]] ; CHECK: l2.1.2: ; CHECK-NEXT: [[TOK_L2_1_2:%.*]] = call token @llvm.experimental.convergence.anchor() ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_L2_1_2]]) ] ; CHECK-NEXT: br i1 [[COND]], label [[L2_2]], label [[LATCH_2]], !llvm.loop [[LOOP9]] ; CHECK: latch.2: ; CHECK-NEXT: br label [[L2_3:%.*]], !llvm.loop [[LOOP4]] ; CHECK: l2.3: ; CHECK-NEXT: [[TOK_L2_3:%.*]] = call token @llvm.experimental.convergence.anchor() ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_L2_3]]) ] ; CHECK-NEXT: br i1 [[COND]], label [[L2_1_3:%.*]], label [[LATCH_3:%.*]], !llvm.loop [[LOOP4]] ; CHECK: l2.1.3: ; CHECK-NEXT: [[TOK_L2_1_3:%.*]] = call token @llvm.experimental.convergence.anchor() ; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_L2_1_3]]) ] ; CHECK-NEXT: br i1 [[COND]], label [[L2_3]], label [[LATCH_3]], !llvm.loop [[LOOP9]] ; CHECK: latch.3: ; CHECK-NEXT: ret i32 0 ; entry: br label %l3 l3: %x.0 = phi i32 [ 0, %entry ], [ %inc, %latch ] %tok.loop = call token @llvm.experimental.convergence.anchor() %inc = add nsw i32 %x.0, 1 %exitcond = icmp eq i32 %inc, 4 br label %l2, !llvm.loop !1 l2: %tok.l2 = call token @llvm.experimental.convergence.anchor() call void @f() [ "convergencectrl"(token %tok.l2) ] br i1 %cond, label %l2, label %latch, !llvm.loop !1 latch: br i1 %exitcond, label %exit, label %l3 exit: ret i32 0 } declare token @llvm.experimental.convergence.anchor() declare token @llvm.experimental.convergence.loop() !0 = !{!0, !{!"llvm.loop.unroll.count", i32 16}} !1 = !{!1, !{!"llvm.loop.unroll.count", i32 2}}