; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
; RUN: opt -S -verify-loop-info -passes=irce < %s | FileCheck %s
; RUN: opt -S -verify-loop-info -passes='require<branch-prob>,irce' < %s | FileCheck %s

; Both functions below feed the irce pass a counted loop whose in-loop guard is
; an `and` of several conditions. The expected output splits each loop into a
; main loop, whose range-check operands of the `and` are replaced by `true`,
; and a post-loop copy that keeps the original guard.

; @f_0: the guard is `%cond & (idx + 4 < len)`, where %cond is a volatile i1
; load from %cond_buf. In the expected main loop the volatile operand is still
; loaded and tested while the range-check operand becomes `true`; the main loop
; is expected to stop at smax(smin(n, len - 4), 0).
define void @f_0(ptr %arr, ptr %a_len_ptr, i32 %n, ptr %cond_buf) {
; CHECK-LABEL: @f_0(
; CHECK-NEXT: entry:
; CHECK-NEXT: [[LEN:%.*]] = load i32, ptr [[A_LEN_PTR:%.*]], align 4, !range [[RNG0:![0-9]+]]
; CHECK-NEXT: [[FIRST_ITR_CHECK:%.*]] = icmp sgt i32 [[N:%.*]], 0
; CHECK-NEXT: br i1 [[FIRST_ITR_CHECK]], label [[LOOP_PREHEADER:%.*]], label [[EXIT:%.*]]
; CHECK: loop.preheader:
; CHECK-NEXT: [[TMP0:%.*]] = add nsw i32 [[LEN]], -4
; CHECK-NEXT: [[SMIN:%.*]] = call i32 @llvm.smin.i32(i32 [[N]], i32 [[TMP0]])
; CHECK-NEXT: [[EXIT_MAINLOOP_AT:%.*]] = call i32 @llvm.smax.i32(i32 [[SMIN]], i32 0)
; CHECK-NEXT: [[TMP1:%.*]] = icmp slt i32 0, [[EXIT_MAINLOOP_AT]]
; CHECK-NEXT: br i1 [[TMP1]], label [[LOOP_PREHEADER1:%.*]], label [[MAIN_PSEUDO_EXIT:%.*]]
; CHECK: loop.preheader1:
; CHECK-NEXT: br label [[LOOP:%.*]]
; CHECK: loop:
; CHECK-NEXT: [[IDX:%.*]] = phi i32 [ [[IDX_NEXT:%.*]], [[IN_BOUNDS:%.*]] ], [ 0, [[LOOP_PREHEADER1]] ]
; CHECK-NEXT: [[IDX_NEXT]] = add nsw i32 [[IDX]], 1
; CHECK-NEXT: [[IDX_FOR_ABC:%.*]] = add i32 [[IDX]], 4
; CHECK-NEXT: [[ABC_ACTUAL:%.*]] = icmp slt i32 [[IDX_FOR_ABC]], [[LEN]]
; CHECK-NEXT: [[COND:%.*]] = load volatile i1, ptr [[COND_BUF:%.*]], align 1
; CHECK-NEXT: [[ABC:%.*]] = and i1 [[COND]], true
; CHECK-NEXT: br i1 [[ABC]], label [[IN_BOUNDS]], label [[OUT_OF_BOUNDS_LOOPEXIT2:%.*]], !prof [[PROF1:![0-9]+]]
; CHECK: in.bounds:
; CHECK-NEXT: [[ADDR:%.*]] = getelementptr i32, ptr [[ARR:%.*]], i32 [[IDX_FOR_ABC]]
; CHECK-NEXT: store i32 0, ptr [[ADDR]], align 4
; CHECK-NEXT: [[NEXT:%.*]] = icmp slt i32 [[IDX_NEXT]], [[N]]
; CHECK-NEXT: [[TMP2:%.*]] = icmp slt i32 [[IDX_NEXT]], [[EXIT_MAINLOOP_AT]]
; CHECK-NEXT: br i1 [[TMP2]], label [[LOOP]], label [[MAIN_EXIT_SELECTOR:%.*]]
; CHECK: main.exit.selector:
; CHECK-NEXT: [[IDX_NEXT_LCSSA:%.*]] = phi i32 [ [[IDX_NEXT]], [[IN_BOUNDS]] ]
; CHECK-NEXT: [[TMP3:%.*]] = icmp slt i32 [[IDX_NEXT_LCSSA]], [[N]]
; CHECK-NEXT: br i1 [[TMP3]], label [[MAIN_PSEUDO_EXIT]], label [[EXIT_LOOPEXIT:%.*]]
; CHECK: main.pseudo.exit:
; CHECK-NEXT: [[IDX_COPY:%.*]] = phi i32 [ 0, [[LOOP_PREHEADER]] ], [ [[IDX_NEXT_LCSSA]], [[MAIN_EXIT_SELECTOR]] ]
; CHECK-NEXT: [[INDVAR_END:%.*]] = phi i32 [ 0, [[LOOP_PREHEADER]] ], [ [[IDX_NEXT_LCSSA]], [[MAIN_EXIT_SELECTOR]] ]
; CHECK-NEXT: br label [[POSTLOOP:%.*]]
; CHECK: out.of.bounds.loopexit:
; CHECK-NEXT: br label [[OUT_OF_BOUNDS:%.*]]
; CHECK: out.of.bounds.loopexit2:
; CHECK-NEXT: br label [[OUT_OF_BOUNDS]]
; CHECK: out.of.bounds:
; CHECK-NEXT: ret void
; CHECK: exit.loopexit.loopexit:
; CHECK-NEXT: br label [[EXIT_LOOPEXIT]]
; CHECK: exit.loopexit:
; CHECK-NEXT: br label [[EXIT]]
; CHECK: exit:
; CHECK-NEXT: ret void
; CHECK: postloop:
; CHECK-NEXT: br label [[LOOP_POSTLOOP:%.*]]
; CHECK: loop.postloop:
; CHECK-NEXT: [[IDX_POSTLOOP:%.*]] = phi i32 [ [[IDX_NEXT_POSTLOOP:%.*]], [[IN_BOUNDS_POSTLOOP:%.*]] ], [ [[IDX_COPY]], [[POSTLOOP]] ]
; CHECK-NEXT: [[IDX_NEXT_POSTLOOP]] = add i32 [[IDX_POSTLOOP]], 1
; CHECK-NEXT: [[IDX_FOR_ABC_POSTLOOP:%.*]] = add i32 [[IDX_POSTLOOP]], 4
; CHECK-NEXT: [[ABC_ACTUAL_POSTLOOP:%.*]] = icmp slt i32 [[IDX_FOR_ABC_POSTLOOP]], [[LEN]]
; CHECK-NEXT: [[COND_POSTLOOP:%.*]] = load volatile i1, ptr [[COND_BUF]], align 1
; CHECK-NEXT: [[ABC_POSTLOOP:%.*]] = and i1 [[COND_POSTLOOP]], [[ABC_ACTUAL_POSTLOOP]]
; CHECK-NEXT: br i1 [[ABC_POSTLOOP]], label [[IN_BOUNDS_POSTLOOP]], label [[OUT_OF_BOUNDS_LOOPEXIT:%.*]], !prof [[PROF1]]
; CHECK: in.bounds.postloop:
; CHECK-NEXT: [[ADDR_POSTLOOP:%.*]] = getelementptr i32, ptr [[ARR]], i32 [[IDX_FOR_ABC_POSTLOOP]]
; CHECK-NEXT: store i32 0, ptr [[ADDR_POSTLOOP]], align 4
; CHECK-NEXT: [[NEXT_POSTLOOP:%.*]] = icmp slt i32 [[IDX_NEXT_POSTLOOP]], [[N]]
; CHECK-NEXT: br i1 [[NEXT_POSTLOOP]], label [[LOOP_POSTLOOP]], label [[EXIT_LOOPEXIT_LOOPEXIT:%.*]], !llvm.loop [[LOOP2:![0-9]+]], !loop_constrainer.loop.clone [[META7:![0-9]+]]
;
entry:
  ; The length is loaded once, outside the loop, and carries !range !0.
  %len = load i32, ptr %a_len_ptr, !range !0
  ; The loop is entered only when n > 0.
  %first.itr.check = icmp sgt i32 %n, 0
  br i1 %first.itr.check, label %loop, label %exit

loop:
  ; %idx counts up from 0 in steps of 1.
  %idx = phi i32 [ 0, %entry ] , [ %idx.next, %in.bounds ]
  %idx.next = add i32 %idx, 1
  ; The element actually accessed is idx + 4, so that is what gets range-checked.
  %idx.for.abc = add i32 %idx, 4
  %abc.actual = icmp slt i32 %idx.for.abc, %len
  ; Volatile load: a second guard operand that is re-read on every iteration.
  %cond = load volatile i1, ptr %cond_buf
  ; Conjunctive guard: both operands must hold to reach %in.bounds.
  %abc = and i1 %cond, %abc.actual
  br i1 %abc, label %in.bounds, label %out.of.bounds, !prof !1

in.bounds:
  ; Guarded store of 0 to arr[idx + 4].
  %addr = getelementptr i32, ptr %arr, i32 %idx.for.abc
  store i32 0, ptr %addr
  ; Latch: keep iterating while idx + 1 < n.
  %next = icmp slt i32 %idx.next, %n
  br i1 %next, label %loop, label %exit

out.of.bounds:
  ret void

exit:
  ret void
}

; @f_1: the guard is the conjunction of two range checks on the same index,
; `idx < len.a` and `idx < len.b`. In the expected main loop both operands of
; the `and` become `true`; the main loop is expected to stop at
; smax(smin(smin(len.b, len.a), n), 0).
define void @f_1(
; CHECK-LABEL: @f_1(
; CHECK-NEXT: entry:
; CHECK-NEXT: [[LEN_A:%.*]] = load i32, ptr [[A_LEN_PTR:%.*]], align 4, !range [[RNG0]]
; CHECK-NEXT: [[LEN_B:%.*]] = load i32, ptr [[B_LEN_PTR:%.*]], align 4, !range [[RNG0]]
; CHECK-NEXT: [[FIRST_ITR_CHECK:%.*]] = icmp sgt i32 [[N:%.*]], 0
; CHECK-NEXT: br i1 [[FIRST_ITR_CHECK]], label [[LOOP_PREHEADER:%.*]], label [[EXIT:%.*]]
; CHECK: loop.preheader:
; CHECK-NEXT: [[SMIN:%.*]] = call i32 @llvm.smin.i32(i32 [[LEN_B]], i32 [[LEN_A]])
; CHECK-NEXT: [[SMIN1:%.*]] = call i32 @llvm.smin.i32(i32 [[SMIN]], i32 [[N]])
; CHECK-NEXT: [[EXIT_MAINLOOP_AT:%.*]] = call i32 @llvm.smax.i32(i32 [[SMIN1]], i32 0)
; CHECK-NEXT: [[TMP0:%.*]] = icmp slt i32 0, [[EXIT_MAINLOOP_AT]]
; CHECK-NEXT: br i1 [[TMP0]], label [[LOOP_PREHEADER2:%.*]], label [[MAIN_PSEUDO_EXIT:%.*]]
; CHECK: loop.preheader2:
; CHECK-NEXT: br label [[LOOP:%.*]]
; CHECK: loop:
; CHECK-NEXT: [[IDX:%.*]] = phi i32 [ [[IDX_NEXT:%.*]], [[IN_BOUNDS:%.*]] ], [ 0, [[LOOP_PREHEADER2]] ]
; CHECK-NEXT: [[IDX_NEXT]] = add nsw i32 [[IDX]], 1
; CHECK-NEXT: [[ABC_A:%.*]] = icmp slt i32 [[IDX]], [[LEN_A]]
; CHECK-NEXT: [[ABC_B:%.*]] = icmp slt i32 [[IDX]], [[LEN_B]]
; CHECK-NEXT: [[ABC:%.*]] = and i1 true, true
; CHECK-NEXT: br i1 [[ABC]], label [[IN_BOUNDS]], label [[OUT_OF_BOUNDS_LOOPEXIT3:%.*]], !prof [[PROF1]]
; CHECK: in.bounds:
; CHECK-NEXT: [[ADDR_A:%.*]] = getelementptr i32, ptr [[ARR_A:%.*]], i32 [[IDX]]
; CHECK-NEXT: store i32 0, ptr [[ADDR_A]], align 4
; CHECK-NEXT: [[ADDR_B:%.*]] = getelementptr i32, ptr [[ARR_B:%.*]], i32 [[IDX]]
; CHECK-NEXT: store i32 -1, ptr [[ADDR_B]], align 4
; CHECK-NEXT: [[NEXT:%.*]] = icmp slt i32 [[IDX_NEXT]], [[N]]
; CHECK-NEXT: [[TMP1:%.*]] = icmp slt i32 [[IDX_NEXT]], [[EXIT_MAINLOOP_AT]]
; CHECK-NEXT: br i1 [[TMP1]], label [[LOOP]], label [[MAIN_EXIT_SELECTOR:%.*]]
; CHECK: main.exit.selector:
; CHECK-NEXT: [[IDX_NEXT_LCSSA:%.*]] = phi i32 [ [[IDX_NEXT]], [[IN_BOUNDS]] ]
; CHECK-NEXT: [[TMP2:%.*]] = icmp slt i32 [[IDX_NEXT_LCSSA]], [[N]]
; CHECK-NEXT: br i1 [[TMP2]], label [[MAIN_PSEUDO_EXIT]], label [[EXIT_LOOPEXIT:%.*]]
; CHECK: main.pseudo.exit:
; CHECK-NEXT: [[IDX_COPY:%.*]] = phi i32 [ 0, [[LOOP_PREHEADER]] ], [ [[IDX_NEXT_LCSSA]], [[MAIN_EXIT_SELECTOR]] ]
; CHECK-NEXT: [[INDVAR_END:%.*]] = phi i32 [ 0, [[LOOP_PREHEADER]] ], [ [[IDX_NEXT_LCSSA]], [[MAIN_EXIT_SELECTOR]] ]
; CHECK-NEXT: br label [[POSTLOOP:%.*]]
; CHECK: out.of.bounds.loopexit:
; CHECK-NEXT: br label [[OUT_OF_BOUNDS:%.*]]
; CHECK: out.of.bounds.loopexit3:
; CHECK-NEXT: br label [[OUT_OF_BOUNDS]]
; CHECK: out.of.bounds:
; CHECK-NEXT: ret void
; CHECK: exit.loopexit.loopexit:
; CHECK-NEXT: br label [[EXIT_LOOPEXIT]]
; CHECK: exit.loopexit:
; CHECK-NEXT: br label [[EXIT]]
; CHECK: exit:
; CHECK-NEXT: ret void
; CHECK: postloop:
; CHECK-NEXT: br label [[LOOP_POSTLOOP:%.*]]
; CHECK: loop.postloop:
; CHECK-NEXT: [[IDX_POSTLOOP:%.*]] = phi i32 [ [[IDX_NEXT_POSTLOOP:%.*]], [[IN_BOUNDS_POSTLOOP:%.*]] ], [ [[IDX_COPY]], [[POSTLOOP]] ]
; CHECK-NEXT: [[IDX_NEXT_POSTLOOP]] = add i32 [[IDX_POSTLOOP]], 1
; CHECK-NEXT: [[ABC_A_POSTLOOP:%.*]] = icmp slt i32 [[IDX_POSTLOOP]], [[LEN_A]]
; CHECK-NEXT: [[ABC_B_POSTLOOP:%.*]] = icmp slt i32 [[IDX_POSTLOOP]], [[LEN_B]]
; CHECK-NEXT: [[ABC_POSTLOOP:%.*]] = and i1 [[ABC_A_POSTLOOP]], [[ABC_B_POSTLOOP]]
; CHECK-NEXT: br i1 [[ABC_POSTLOOP]], label [[IN_BOUNDS_POSTLOOP]], label [[OUT_OF_BOUNDS_LOOPEXIT:%.*]], !prof [[PROF1]]
; CHECK: in.bounds.postloop:
; CHECK-NEXT: [[ADDR_A_POSTLOOP:%.*]] = getelementptr i32, ptr [[ARR_A]], i32 [[IDX_POSTLOOP]]
; CHECK-NEXT: store i32 0, ptr [[ADDR_A_POSTLOOP]], align 4
; CHECK-NEXT: [[ADDR_B_POSTLOOP:%.*]] = getelementptr i32, ptr [[ARR_B]], i32 [[IDX_POSTLOOP]]
; CHECK-NEXT: store i32 -1, ptr [[ADDR_B_POSTLOOP]], align 4
; CHECK-NEXT: [[NEXT_POSTLOOP:%.*]] = icmp slt i32 [[IDX_NEXT_POSTLOOP]], [[N]]
; CHECK-NEXT: br i1 [[NEXT_POSTLOOP]], label [[LOOP_POSTLOOP]], label [[EXIT_LOOPEXIT_LOOPEXIT:%.*]], !llvm.loop [[LOOP8:![0-9]+]], !loop_constrainer.loop.clone [[META7]]
;
  ptr %arr_a, ptr %a_len_ptr, ptr %arr_b, ptr %b_len_ptr, i32 %n) {


entry:
  ; Both lengths are loaded once, outside the loop, and carry !range !0.
  %len.a = load i32, ptr %a_len_ptr, !range !0
  %len.b = load i32, ptr %b_len_ptr, !range !0
  ; The loop is entered only when n > 0.
  %first.itr.check = icmp sgt i32 %n, 0
  br i1 %first.itr.check, label %loop, label %exit

loop:
  ; %idx counts up from 0 in steps of 1 and indexes both arrays directly.
  %idx = phi i32 [ 0, %entry ] , [ %idx.next, %in.bounds ]
  %idx.next = add i32 %idx, 1
  ; One range check per array, combined into a single conjunctive guard.
  %abc.a = icmp slt i32 %idx, %len.a
  %abc.b = icmp slt i32 %idx, %len.b
  %abc = and i1 %abc.a, %abc.b
  br i1 %abc, label %in.bounds, label %out.of.bounds, !prof !1

in.bounds:
  ; Guarded stores: 0 to arr_a[idx] and -1 to arr_b[idx].
  %addr.a = getelementptr i32, ptr %arr_a, i32 %idx
  store i32 0, ptr %addr.a
  %addr.b = getelementptr i32, ptr %arr_b, i32 %idx
  store i32 -1, ptr %addr.b
  ; Latch: keep iterating while idx + 1 < n.
  %next = icmp slt i32 %idx.next, %n
  br i1 %next, label %loop, label %exit

out.of.bounds:
  ret void

exit:
  ret void
}

; !0 is the !range operand on every length load above; per the LLVM LangRef a
; range pair is a half-open [lo, hi) interval, so the lengths are non-negative.
!0 = !{i32 0, i32 2147483647}
; !1 is the !prof operand on the guard branches: weight 64 for the first
; successor (%in.bounds) and 4 for the second (%out.of.bounds).
!1 = !{!"branch_weights", i32 64, i32 4}