; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
; RUN: opt -passes=loop-vectorize -force-vector-width=4 -force-vector-interleave=1 -S %s | FileCheck %s

; Loop-vectorizer tests (vector width forced to 4, interleave count forced to
; 1) for loops in which a recurrence phi (%for) carries a value from the
; previous iteration, and a load or store that uses %for appears in the loop
; body *before* the instruction that defines the next recurrence value
; (%for.next).
;
; Every loop below counts %iv from 0 and exits once %iv.next equals 1000.
; For every function in this file the autogenerated assertions expect the
; output to contain the same scalar loop as the input, i.e. no vector loop is
; emitted.

; %l.a loads A[%for] and therefore uses the recurrence phi, but it is placed
; ahead of the load from B[%iv] that defines %for.next. %A and %B are noalias
; and the loop contains no stores. The sum %for + %l.a is accumulated in %red
; and returned.
; NOTE(review): judging by the function name, vectorizing this loop would
; require sinking %l.a past the other load - confirm against the pass.
define i32 @sink_load_that_uses_for_past_other_loads(ptr noalias %A, ptr noalias %B) {
; CHECK-LABEL: @sink_load_that_uses_for_past_other_loads(
; CHECK-NEXT:  entry:
; CHECK-NEXT:    br label [[LOOP:%.*]]
; CHECK:       loop:
; CHECK-NEXT:    [[IV:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ [[IV_NEXT:%.*]], [[LOOP]] ]
; CHECK-NEXT:    [[FOR:%.*]] = phi i32 [ 0, [[ENTRY]] ], [ [[FOR_NEXT:%.*]], [[LOOP]] ]
; CHECK-NEXT:    [[RED:%.*]] = phi i32 [ 0, [[ENTRY]] ], [ [[RED_NEXT:%.*]], [[LOOP]] ]
; CHECK-NEXT:    [[GEP_A:%.*]] = getelementptr inbounds i32, ptr [[A:%.*]], i32 [[FOR]]
; CHECK-NEXT:    [[L_A:%.*]] = load i32, ptr [[GEP_A]], align 4
; CHECK-NEXT:    [[GEP_B:%.*]] = getelementptr inbounds i32, ptr [[B:%.*]], i32 [[IV]]
; CHECK-NEXT:    [[FOR_NEXT]] = load i32, ptr [[GEP_B]], align 4
; CHECK-NEXT:    [[ADD:%.*]] = add i32 [[FOR]], [[L_A]]
; CHECK-NEXT:    [[RED_NEXT]] = add i32 [[RED]], [[ADD]]
; CHECK-NEXT:    [[IV_NEXT]] = add nuw nsw i32 [[IV]], 1
; CHECK-NEXT:    [[EC:%.*]] = icmp eq i32 [[IV_NEXT]], 1000
; CHECK-NEXT:    br i1 [[EC]], label [[EXIT:%.*]], label [[LOOP]]
; CHECK:       exit:
; CHECK-NEXT:    [[RED_NEXT_LCSSA:%.*]] = phi i32 [ [[RED_NEXT]], [[LOOP]] ]
; CHECK-NEXT:    ret i32 [[RED_NEXT_LCSSA]]
;
entry:
  br label %loop

loop:
  %iv = phi i32 [ 0, %entry ], [ %iv.next, %loop ]
  ; Recurrence: holds the value %for.next had in the previous iteration.
  %for = phi i32 [ 0, %entry ], [ %for.next, %loop ]
  %red = phi i32 [ 0, %entry ], [ %red.next, %loop ]
  ; The address of this load is indexed by the recurrence value itself.
  %gep.a = getelementptr inbounds i32, ptr %A, i32 %for
  %l.a = load i32, ptr %gep.a
  %gep.b = getelementptr inbounds i32, ptr %B, i32 %iv
  ; Defines the next recurrence value, after the user %l.a above.
  %for.next = load i32, ptr %gep.b
  %add = add i32 %for, %l.a
  %red.next = add i32 %red, %add
  %iv.next = add nuw nsw i32 %iv, 1
  %ec = icmp eq i32 %iv.next, 1000
  br i1 %ec, label %exit, label %loop

exit:
  ret i32 %red.next
}

; %l.a loads A[%for]; between it and the definition of %for.next there is a
; store to A[%iv]. Both addresses are derived from %A (indexed by %for and
; %iv respectively), and %for.next is then reloaded from the address that was
; just stored to. %B is not used by this function.
define void @cannot_sink_load_past_mayalias_store(ptr noalias %A, ptr noalias %B) {
; CHECK-LABEL: @cannot_sink_load_past_mayalias_store(
; CHECK-NEXT:  entry:
; CHECK-NEXT:    br label [[LOOP:%.*]]
; CHECK:       loop:
; CHECK-NEXT:    [[IV:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ [[IV_NEXT:%.*]], [[LOOP]] ]
; CHECK-NEXT:    [[FOR:%.*]] = phi i32 [ 0, [[ENTRY]] ], [ [[FOR_NEXT:%.*]], [[LOOP]] ]
; CHECK-NEXT:    [[GEP_A:%.*]] = getelementptr inbounds i32, ptr [[A:%.*]], i32 [[FOR]]
; CHECK-NEXT:    [[L_A:%.*]] = load i32, ptr [[GEP_A]], align 4
; CHECK-NEXT:    [[GEP_A_2:%.*]] = getelementptr inbounds i32, ptr [[A]], i32 [[IV]]
; CHECK-NEXT:    [[ADD:%.*]] = add i32 [[FOR]], [[L_A]]
; CHECK-NEXT:    store i32 [[ADD]], ptr [[GEP_A_2]], align 4
; CHECK-NEXT:    [[FOR_NEXT]] = load i32, ptr [[GEP_A_2]], align 4
; CHECK-NEXT:    [[IV_NEXT]] = add nuw nsw i32 [[IV]], 1
; CHECK-NEXT:    [[EC:%.*]] = icmp eq i32 [[IV_NEXT]], 1000
; CHECK-NEXT:    br i1 [[EC]], label [[EXIT:%.*]], label [[LOOP]]
; CHECK:       exit:
; CHECK-NEXT:    ret void
;
entry:
  br label %loop

loop:
  %iv = phi i32 [ 0, %entry ], [ %iv.next, %loop ]
  ; Recurrence: holds the value %for.next had in the previous iteration.
  %for = phi i32 [ 0, %entry ], [ %for.next, %loop ]
  %gep.a = getelementptr inbounds i32, ptr %A, i32 %for
  %l.a = load i32, ptr %gep.a
  %gep.a.2 = getelementptr inbounds i32, ptr %A, i32 %iv
  %add = add i32 %for, %l.a
  ; Store into the same underlying object (%A) that %l.a read from.
  store i32 %add, ptr %gep.a.2
  ; The next recurrence value is read back from the address just written.
  %for.next = load i32, ptr %gep.a.2
  %iv.next = add nuw nsw i32 %iv, 1
  %ec = icmp eq i32 %iv.next, 1000
  br i1 %ec, label %exit, label %loop

exit:
  ret void
}

; The recurrence value %for is stored to A[%iv] before %for.next is defined
; as %iv + 2. The loop contains no loads and no other stores. %B is not used
; by this function.
define void @sink_store_that_uses_for_past_instructions(ptr noalias %A, ptr noalias %B) {
; CHECK-LABEL: @sink_store_that_uses_for_past_instructions(
; CHECK-NEXT:  entry:
; CHECK-NEXT:    br label [[LOOP:%.*]]
; CHECK:       loop:
; CHECK-NEXT:    [[IV:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ [[IV_NEXT:%.*]], [[LOOP]] ]
; CHECK-NEXT:    [[FOR:%.*]] = phi i32 [ 0, [[ENTRY]] ], [ [[FOR_NEXT:%.*]], [[LOOP]] ]
; CHECK-NEXT:    [[GEP_A:%.*]] = getelementptr inbounds i32, ptr [[A:%.*]], i32 [[IV]]
; CHECK-NEXT:    store i32 [[FOR]], ptr [[GEP_A]], align 4
; CHECK-NEXT:    [[FOR_NEXT]] = add i32 [[IV]], 2
; CHECK-NEXT:    [[IV_NEXT]] = add nuw nsw i32 [[IV]], 1
; CHECK-NEXT:    [[EC:%.*]] = icmp eq i32 [[IV_NEXT]], 1000
; CHECK-NEXT:    br i1 [[EC]], label [[EXIT:%.*]], label [[LOOP]]
; CHECK:       exit:
; CHECK-NEXT:    ret void
;
entry:
  br label %loop

loop:
  %iv = phi i32 [ 0, %entry ], [ %iv.next, %loop ]
  ; Recurrence: holds the value %for.next had in the previous iteration.
  %for = phi i32 [ 0, %entry ], [ %for.next, %loop ]
  %gep.a = getelementptr inbounds i32, ptr %A, i32 %iv
  ; User of the recurrence placed ahead of the definition of %for.next.
  store i32 %for, ptr %gep.a
  %for.next = add i32 %iv, 2
  %iv.next = add nuw nsw i32 %iv, 1
  %ec = icmp eq i32 %iv.next, 1000
  br i1 %ec, label %exit, label %loop

exit:
  ret void
}

; The recurrence value %for is stored to A[%iv]; %for.next is then loaded
; from B[%iv]. %A and %B are both marked noalias.
define void @sink_store_past_non_aliasing_load(ptr noalias %A, ptr noalias %B) {
; CHECK-LABEL: @sink_store_past_non_aliasing_load(
; CHECK-NEXT:  entry:
; CHECK-NEXT:    br label [[LOOP:%.*]]
; CHECK:       loop:
; CHECK-NEXT:    [[IV:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ [[IV_NEXT:%.*]], [[LOOP]] ]
; CHECK-NEXT:    [[FOR:%.*]] = phi i32 [ 0, [[ENTRY]] ], [ [[FOR_NEXT:%.*]], [[LOOP]] ]
; CHECK-NEXT:    [[GEP_A:%.*]] = getelementptr inbounds i32, ptr [[A:%.*]], i32 [[IV]]
; CHECK-NEXT:    store i32 [[FOR]], ptr [[GEP_A]], align 4
; CHECK-NEXT:    [[GEP_B:%.*]] = getelementptr inbounds i32, ptr [[B:%.*]], i32 [[IV]]
; CHECK-NEXT:    [[FOR_NEXT]] = load i32, ptr [[GEP_B]], align 4
; CHECK-NEXT:    [[IV_NEXT]] = add nuw nsw i32 [[IV]], 1
; CHECK-NEXT:    [[EC:%.*]] = icmp eq i32 [[IV_NEXT]], 1000
; CHECK-NEXT:    br i1 [[EC]], label [[EXIT:%.*]], label [[LOOP]]
; CHECK:       exit:
; CHECK-NEXT:    ret void
;
entry:
  br label %loop

loop:
  %iv = phi i32 [ 0, %entry ], [ %iv.next, %loop ]
  ; Recurrence: holds the value %for.next had in the previous iteration.
  %for = phi i32 [ 0, %entry ], [ %for.next, %loop ]
  %gep.a = getelementptr inbounds i32, ptr %A, i32 %iv
  ; User of the recurrence placed ahead of the load that defines %for.next.
  store i32 %for, ptr %gep.a
  %gep.b = getelementptr inbounds i32, ptr %B, i32 %iv
  %for.next = load i32, ptr %gep.b
  %iv.next = add nuw nsw i32 %iv, 1
  %ec = icmp eq i32 %iv.next, 1000
  br i1 %ec, label %exit, label %loop

exit:
  ret void
}

; Same loop body as @sink_store_past_non_aliasing_load, but %A and %B carry
; no noalias attribute here, so nothing in the signature rules out the store
; to A[%iv] and the load from B[%iv] touching the same memory.
define void @sink_store_past_aliasing_load(ptr %A, ptr %B) {
; CHECK-LABEL: @sink_store_past_aliasing_load(
; CHECK-NEXT:  entry:
; CHECK-NEXT:    br label [[LOOP:%.*]]
; CHECK:       loop:
; CHECK-NEXT:    [[IV:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ [[IV_NEXT:%.*]], [[LOOP]] ]
; CHECK-NEXT:    [[FOR:%.*]] = phi i32 [ 0, [[ENTRY]] ], [ [[FOR_NEXT:%.*]], [[LOOP]] ]
; CHECK-NEXT:    [[GEP_A:%.*]] = getelementptr inbounds i32, ptr [[A:%.*]], i32 [[IV]]
; CHECK-NEXT:    store i32 [[FOR]], ptr [[GEP_A]], align 4
; CHECK-NEXT:    [[GEP_B:%.*]] = getelementptr inbounds i32, ptr [[B:%.*]], i32 [[IV]]
; CHECK-NEXT:    [[FOR_NEXT]] = load i32, ptr [[GEP_B]], align 4
; CHECK-NEXT:    [[IV_NEXT]] = add nuw nsw i32 [[IV]], 1
; CHECK-NEXT:    [[EC:%.*]] = icmp eq i32 [[IV_NEXT]], 1000
; CHECK-NEXT:    br i1 [[EC]], label [[EXIT:%.*]], label [[LOOP]]
; CHECK:       exit:
; CHECK-NEXT:    ret void
;
entry:
  br label %loop

loop:
  %iv = phi i32 [ 0, %entry ], [ %iv.next, %loop ]
  ; Recurrence: holds the value %for.next had in the previous iteration.
  %for = phi i32 [ 0, %entry ], [ %for.next, %loop ]
  %gep.a = getelementptr inbounds i32, ptr %A, i32 %iv
  ; User of the recurrence placed ahead of the load that defines %for.next.
  store i32 %for, ptr %gep.a
  %gep.b = getelementptr inbounds i32, ptr %B, i32 %iv
  %for.next = load i32, ptr %gep.b
  %iv.next = add nuw nsw i32 %iv, 1
  %ec = icmp eq i32 %iv.next, 1000
  br i1 %ec, label %exit, label %loop

exit:
  ret void
}

; The recurrence value %for is stored to A[%iv], followed by a second store
; of the constant 123 to B[%iv]; %for.next is then defined as %iv + 2.
; %A and %B are both marked noalias.
define void @sink_store_past_non_aliasing_store(ptr noalias %A, ptr noalias %B) {
; CHECK-LABEL: @sink_store_past_non_aliasing_store(
; CHECK-NEXT:  entry:
; CHECK-NEXT:    br label [[LOOP:%.*]]
; CHECK:       loop:
; CHECK-NEXT:    [[IV:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ [[IV_NEXT:%.*]], [[LOOP]] ]
; CHECK-NEXT:    [[FOR:%.*]] = phi i32 [ 0, [[ENTRY]] ], [ [[FOR_NEXT:%.*]], [[LOOP]] ]
; CHECK-NEXT:    [[GEP_A:%.*]] = getelementptr inbounds i32, ptr [[A:%.*]], i32 [[IV]]
; CHECK-NEXT:    store i32 [[FOR]], ptr [[GEP_A]], align 4
; CHECK-NEXT:    [[GEP_B:%.*]] = getelementptr inbounds i32, ptr [[B:%.*]], i32 [[IV]]
; CHECK-NEXT:    store i32 123, ptr [[GEP_B]], align 4
; CHECK-NEXT:    [[FOR_NEXT]] = add i32 [[IV]], 2
; CHECK-NEXT:    [[IV_NEXT]] = add nuw nsw i32 [[IV]], 1
; CHECK-NEXT:    [[EC:%.*]] = icmp eq i32 [[IV_NEXT]], 1000
; CHECK-NEXT:    br i1 [[EC]], label [[EXIT:%.*]], label [[LOOP]]
; CHECK:       exit:
; CHECK-NEXT:    ret void
;
entry:
  br label %loop

loop:
  %iv = phi i32 [ 0, %entry ], [ %iv.next, %loop ]
  ; Recurrence: holds the value %for.next had in the previous iteration.
  %for = phi i32 [ 0, %entry ], [ %for.next, %loop ]
  %gep.a = getelementptr inbounds i32, ptr %A, i32 %iv
  ; User of the recurrence; a second, unrelated store follows it.
  store i32 %for, ptr %gep.a
  %gep.b = getelementptr inbounds i32, ptr %B, i32 %iv
  store i32 123, ptr %gep.b
  %for.next = add i32 %iv, 2
  %iv.next = add nuw nsw i32 %iv, 1
  %ec = icmp eq i32 %iv.next, 1000
  br i1 %ec, label %exit, label %loop

exit:
  ret void
}

; Same loop body as @sink_store_past_non_aliasing_store, but %A and %B carry
; no noalias attribute here, so nothing in the signature rules out the two
; stores writing the same memory.
define void @sink_store_past_aliasing_store(ptr %A, ptr %B) {
; CHECK-LABEL: @sink_store_past_aliasing_store(
; CHECK-NEXT:  entry:
; CHECK-NEXT:    br label [[LOOP:%.*]]
; CHECK:       loop:
; CHECK-NEXT:    [[IV:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ [[IV_NEXT:%.*]], [[LOOP]] ]
; CHECK-NEXT:    [[FOR:%.*]] = phi i32 [ 0, [[ENTRY]] ], [ [[FOR_NEXT:%.*]], [[LOOP]] ]
; CHECK-NEXT:    [[GEP_A:%.*]] = getelementptr inbounds i32, ptr [[A:%.*]], i32 [[IV]]
; CHECK-NEXT:    store i32 [[FOR]], ptr [[GEP_A]], align 4
; CHECK-NEXT:    [[GEP_B:%.*]] = getelementptr inbounds i32, ptr [[B:%.*]], i32 [[IV]]
; CHECK-NEXT:    store i32 123, ptr [[GEP_B]], align 4
; CHECK-NEXT:    [[FOR_NEXT]] = add i32 [[IV]], 2
; CHECK-NEXT:    [[IV_NEXT]] = add nuw nsw i32 [[IV]], 1
; CHECK-NEXT:    [[EC:%.*]] = icmp eq i32 [[IV_NEXT]], 1000
; CHECK-NEXT:    br i1 [[EC]], label [[EXIT:%.*]], label [[LOOP]]
; CHECK:       exit:
; CHECK-NEXT:    ret void
;
entry:
  br label %loop

loop:
  %iv = phi i32 [ 0, %entry ], [ %iv.next, %loop ]
  ; Recurrence: holds the value %for.next had in the previous iteration.
  %for = phi i32 [ 0, %entry ], [ %for.next, %loop ]
  %gep.a = getelementptr inbounds i32, ptr %A, i32 %iv
  ; User of the recurrence; a second, unrelated store follows it.
  store i32 %for, ptr %gep.a
  %gep.b = getelementptr inbounds i32, ptr %B, i32 %iv
  store i32 123, ptr %gep.b
  %for.next = add i32 %iv, 2
  %iv.next = add nuw nsw i32 %iv, 1
  %ec = icmp eq i32 %iv.next, 1000
  br i1 %ec, label %exit, label %loop

exit:
  ret void
}