; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
; RUN: opt -passes="function(loop(indvars,loop-idiom,loop-deletion),simplifycfg)" -S < %s | FileCheck %s
; Compile command:
; $ clang -m64 -fno-discard-value-names -O0 -S -emit-llvm -Xclang -disable-O0-optnone Code.c
; $ bin/opt -S -passes=mem2reg,loop-simplify,lcssa,loop-rotate \
;   -passes=licm,simple-loop-unswitch -enable-nontrivial-unswitch -passes=loop-simplify \
;   -passes=loop-deletion,simplifycfg,indvars Code.ll > CodeOpt.ll
;
; Each function below contains a loop (or loop nest) that calls memset once per
; iteration with a length that is only known at run time. The CHECK lines expect
; the pipeline in the RUN line to replace every loop with a single memset whose
; length is computed in the loop preheader, leaving no loop behind.
target datalayout = "e-m:e-p270:32:32-p271:32:32-p272:64:64-i64:64-f80:128-n8:16:32:64-S128"
; void PositiveFor64(int *ar, long long n, long long m)
; {
;   long long i;
;   for (i=0; i<n; ++i) {
;     int *arr = ar + i * m;
;     memset(arr, 0, m * sizeof(int));
;   }
; }
define dso_local void @PositiveFor64(ptr %ar, i64 %n, i64 %m) {
; CHECK-LABEL: @PositiveFor64(
; CHECK-NEXT:  entry:
; CHECK-NEXT:    [[CMP1:%.*]] = icmp slt i64 0, [[N:%.*]]
; CHECK-NEXT:    br i1 [[CMP1]], label [[FOR_BODY_LR_PH:%.*]], label [[FOR_END:%.*]]
; CHECK:       for.body.lr.ph:
; CHECK-NEXT:    [[MUL1:%.*]] = mul i64 [[M:%.*]], 4
; CHECK-NEXT:    [[TMP0:%.*]] = mul i64 [[M]], [[N]]
; CHECK-NEXT:    [[TMP1:%.*]] = shl i64 [[TMP0]], 2
; CHECK-NEXT:    call void @llvm.memset.p0.i64(ptr align 4 [[AR:%.*]], i8 0, i64 [[TMP1]], i1 false)
; CHECK-NEXT:    br label [[FOR_END]]
; CHECK:       for.end:
; CHECK-NEXT:    ret void
;
entry:
  %cmp1 = icmp slt i64 0, %n
  br i1 %cmp1, label %for.body.lr.ph, label %for.end

for.body.lr.ph:                                   ; preds = %entry
  %mul1 = mul i64 %m, 4
  br label %for.body

for.body:                                         ; preds = %for.body.lr.ph, %for.body
  %i.02 = phi i64 [ 0, %for.body.lr.ph ], [ %inc, %for.body ]
  %mul = mul nsw i64 %i.02, %m
  %add.ptr = getelementptr inbounds i32, ptr %ar, i64 %mul
  call void @llvm.memset.p0.i64(ptr align 4 %add.ptr, i8 0, i64 %mul1, i1 false)
  %inc = add nsw i64 %i.02, 1
  %cmp = icmp slt i64 %inc, %n
  br i1 %cmp, label %for.body, label %for.end

for.end:                                          ; preds = %for.body, %entry
  ret void
}
; void NegativeFor64(int *ar, long long n, long long m)
; {
;   long long i;
;   for (i=n-1; i>=0; --i) {
;     int *arr = ar + i * m;
;     memset(arr, 0, m * sizeof(int));
;   }
; }
define dso_local void @NegativeFor64(ptr %ar, i64 %n, i64 %m) {
; CHECK-LABEL: @NegativeFor64(
; CHECK-NEXT:  entry:
; CHECK-NEXT:    [[SUB:%.*]] = sub nsw i64 [[N:%.*]], 1
; CHECK-NEXT:    [[CMP1:%.*]] = icmp sge i64 [[SUB]], 0
; CHECK-NEXT:    br i1 [[CMP1]], label [[FOR_BODY_LR_PH:%.*]], label [[FOR_END:%.*]]
; CHECK:       for.body.lr.ph:
; CHECK-NEXT:    [[MUL1:%.*]] = mul i64 [[M:%.*]], 4
; CHECK-NEXT:    [[TMP0:%.*]] = mul i64 [[M]], [[N]]
; CHECK-NEXT:    [[TMP1:%.*]] = shl i64 [[TMP0]], 2
; CHECK-NEXT:    call void @llvm.memset.p0.i64(ptr align 4 [[AR:%.*]], i8 0, i64 [[TMP1]], i1 false)
; CHECK-NEXT:    br label [[FOR_END]]
; CHECK:       for.end:
; CHECK-NEXT:    ret void
;
entry:
  %sub = sub nsw i64 %n, 1
  %cmp1 = icmp sge i64 %sub, 0
  br i1 %cmp1, label %for.body.lr.ph, label %for.end

for.body.lr.ph:                                   ; preds = %entry
  %mul1 = mul i64 %m, 4
  br label %for.body

for.body:                                         ; preds = %for.body.lr.ph, %for.body
  %i.02 = phi i64 [ %sub, %for.body.lr.ph ], [ %dec, %for.body ]
  %mul = mul nsw i64 %i.02, %m
  %add.ptr = getelementptr inbounds i32, ptr %ar, i64 %mul
  call void @llvm.memset.p0.i64(ptr align 4 %add.ptr, i8 0, i64 %mul1, i1 false)
  %dec = add nsw i64 %i.02, -1
  %cmp = icmp sge i64 %dec, 0
  br i1 %cmp, label %for.body, label %for.end

for.end:                                          ; preds = %for.body, %entry
  ret void
}
; void NestedFor64(int *ar, long long n, long long m, long long o)
; {
;   long long i, j;
;   for (i=0; i<n; ++i) {
;     for (j=0; j<m; j++) {
;       int *arr = ar + i * m * o + j * o;
;       memset(arr, 0, o * sizeof(int));
;     }
;   }
; }
define void @NestedFor64(ptr %ar, i64 %n, i64 %m, i64 %o) {
; CHECK-LABEL: @NestedFor64(
; CHECK-NEXT:  entry:
; CHECK-NEXT:    [[CMP3:%.*]] = icmp slt i64 0, [[N:%.*]]
; CHECK-NEXT:    [[CMP21:%.*]] = icmp slt i64 0, [[M:%.*]]
; CHECK-NEXT:    [[MUL7:%.*]] = mul i64 [[O:%.*]], 4
; CHECK-NEXT:    [[OR_COND:%.*]] = select i1 [[CMP3]], i1 [[CMP21]], i1 false
; CHECK-NEXT:    br i1 [[OR_COND]], label [[FOR_BODY_US_PREHEADER:%.*]], label [[FOR_END10:%.*]]
; CHECK:       for.body.us.preheader:
; CHECK-NEXT:    [[TMP0:%.*]] = mul i64 [[O]], [[M]]
; CHECK-NEXT:    [[TMP1:%.*]] = shl i64 [[TMP0]], 2
; CHECK-NEXT:    [[TMP2:%.*]] = mul i64 [[TMP0]], [[N]]
; CHECK-NEXT:    [[TMP3:%.*]] = shl i64 [[TMP2]], 2
; CHECK-NEXT:    call void @llvm.memset.p0.i64(ptr align 4 [[AR:%.*]], i8 0, i64 [[TMP3]], i1 false)
; CHECK-NEXT:    br label [[FOR_END10]]
; CHECK:       for.end10:
; CHECK-NEXT:    ret void
;
entry:
  %cmp3 = icmp slt i64 0, %n
  br i1 %cmp3, label %for.body.lr.ph, label %for.end10

for.body.lr.ph:                                   ; preds = %entry
  %cmp21 = icmp slt i64 0, %m
  %mul7 = mul i64 %o, 4
  br i1 %cmp21, label %for.body.us.preheader, label %for.end10

for.body.us.preheader:                            ; preds = %for.body.lr.ph
  br label %for.body.us

for.body.us:                                      ; preds = %for.body.us.preheader, %for.cond1.for.end_crit_edge.us
  %i.04.us = phi i64 [ %inc9.us, %for.cond1.for.end_crit_edge.us ], [ 0, %for.body.us.preheader ]
  %mul.us = mul nsw i64 %i.04.us, %m
  %mul4.us = mul nsw i64 %mul.us, %o
  %add.ptr.us = getelementptr inbounds i32, ptr %ar, i64 %mul4.us
  br label %for.body3.us

for.body3.us:                                     ; preds = %for.body.us, %for.body3.us
  %j.02.us = phi i64 [ 0, %for.body.us ], [ %inc.us, %for.body3.us ]
  %mul5.us = mul nsw i64 %j.02.us, %o
  %add.ptr6.us = getelementptr inbounds i32, ptr %add.ptr.us, i64 %mul5.us
  call void @llvm.memset.p0.i64(ptr align 4 %add.ptr6.us, i8 0, i64 %mul7, i1 false)
  %inc.us = add nuw nsw i64 %j.02.us, 1
  %exitcond = icmp ne i64 %inc.us, %m
  br i1 %exitcond, label %for.body3.us, label %for.cond1.for.end_crit_edge.us

for.cond1.for.end_crit_edge.us:                   ; preds = %for.body3.us
  %inc9.us = add nuw nsw i64 %i.04.us, 1
  %exitcond5 = icmp ne i64 %inc9.us, %n
  br i1 %exitcond5, label %for.body.us, label %for.end10.loopexit

for.end10.loopexit:                               ; preds = %for.cond1.for.end_crit_edge.us
  br label %for.end10

for.end10:                                        ; preds = %for.end10.loopexit, %for.body.lr.ph, %entry
  ret void
}
; void PositiveFor32(int *ar, int n, int m)
; {
;   int i;
;   for (i=0; i<n; ++i) {
;     int *arr = ar + i * m;
;     memset(arr, 0, m * sizeof(int));
;   }
; }
define void @PositiveFor32(ptr %ar, i32 %n, i32 %m) {
; CHECK-LABEL: @PositiveFor32(
; CHECK-NEXT:  entry:
; CHECK-NEXT:    [[CONV:%.*]] = sext i32 [[N:%.*]] to i64
; CHECK-NEXT:    [[CMP1:%.*]] = icmp slt i64 0, [[CONV]]
; CHECK-NEXT:    br i1 [[CMP1]], label [[FOR_BODY_LR_PH:%.*]], label [[FOR_END:%.*]]
; CHECK:       for.body.lr.ph:
; CHECK-NEXT:    [[CONV1:%.*]] = sext i32 [[M:%.*]] to i64
; CHECK-NEXT:    [[CONV2:%.*]] = sext i32 [[M]] to i64
; CHECK-NEXT:    [[MUL3:%.*]] = mul i64 [[CONV2]], 4
; CHECK-NEXT:    [[TMP0:%.*]] = mul i64 [[CONV1]], [[CONV]]
; CHECK-NEXT:    [[TMP1:%.*]] = shl i64 [[TMP0]], 2
; CHECK-NEXT:    call void @llvm.memset.p0.i64(ptr align 4 [[AR:%.*]], i8 0, i64 [[TMP1]], i1 false)
; CHECK-NEXT:    br label [[FOR_END]]
; CHECK:       for.end:
; CHECK-NEXT:    ret void
;
entry:
  %conv = sext i32 %n to i64
  %cmp1 = icmp slt i64 0, %conv
  br i1 %cmp1, label %for.body.lr.ph, label %for.end

for.body.lr.ph:                                   ; preds = %entry
  %conv1 = sext i32 %m to i64
  %conv2 = sext i32 %m to i64
  %mul3 = mul i64 %conv2, 4
  br label %for.body

for.body:                                         ; preds = %for.body.lr.ph, %for.body
  %i.02 = phi i64 [ 0, %for.body.lr.ph ], [ %inc, %for.body ]
  %mul = mul nsw i64 %i.02, %conv1
  %add.ptr = getelementptr inbounds i32, ptr %ar, i64 %mul
  call void @llvm.memset.p0.i64(ptr align 4 %add.ptr, i8 0, i64 %mul3, i1 false)
  %inc = add nsw i64 %i.02, 1
  %cmp = icmp slt i64 %inc, %conv
  br i1 %cmp, label %for.body, label %for.end

for.end:                                          ; preds = %for.body, %entry
  ret void
}
; void Negative32(int *ar, int n, int m)
; {
;   long long i;
;   for (i=n-1; i>=0; i--) {
;     int *arr = ar + i * m;
;     memset(arr, 0, m * sizeof(int));
;   }
; }
define void @Negative32(ptr %ar, i32 %n, i32 %m) {
; CHECK-LABEL: @Negative32(
; CHECK-NEXT:  entry:
; CHECK-NEXT:    [[SUB:%.*]] = sub nsw i32 [[N:%.*]], 1
; CHECK-NEXT:    [[CONV:%.*]] = sext i32 [[SUB]] to i64
; CHECK-NEXT:    [[CMP1:%.*]] = icmp sge i64 [[CONV]], 0
; CHECK-NEXT:    br i1 [[CMP1]], label [[FOR_BODY_LR_PH:%.*]], label [[FOR_END:%.*]]
; CHECK:       for.body.lr.ph:
; CHECK-NEXT:    [[CONV1:%.*]] = sext i32 [[M:%.*]] to i64
; CHECK-NEXT:    [[CONV2:%.*]] = sext i32 [[M]] to i64
; CHECK-NEXT:    [[MUL3:%.*]] = mul i64 [[CONV2]], 4
; CHECK-NEXT:    [[TMP0:%.*]] = sext i32 [[N]] to i64
; CHECK-NEXT:    [[TMP1:%.*]] = mul i64 [[CONV1]], [[TMP0]]
; CHECK-NEXT:    [[TMP2:%.*]] = shl i64 [[TMP1]], 2
; CHECK-NEXT:    call void @llvm.memset.p0.i64(ptr align 4 [[AR:%.*]], i8 0, i64 [[TMP2]], i1 false)
; CHECK-NEXT:    br label [[FOR_END]]
; CHECK:       for.end:
; CHECK-NEXT:    ret void
;
entry:
  %sub = sub nsw i32 %n, 1
  %conv = sext i32 %sub to i64
  %cmp1 = icmp sge i64 %conv, 0
  br i1 %cmp1, label %for.body.lr.ph, label %for.end

for.body.lr.ph:                                   ; preds = %entry
  %conv1 = sext i32 %m to i64
  %conv2 = sext i32 %m to i64
  %mul3 = mul i64 %conv2, 4
  br label %for.body

for.body:                                         ; preds = %for.body.lr.ph, %for.body
  %i.02 = phi i64 [ %conv, %for.body.lr.ph ], [ %dec, %for.body ]
  %mul = mul nsw i64 %i.02, %conv1
  %add.ptr = getelementptr inbounds i32, ptr %ar, i64 %mul
  call void @llvm.memset.p0.i64(ptr align 4 %add.ptr, i8 0, i64 %mul3, i1 false)
  %dec = add nsw i64 %i.02, -1
  %cmp = icmp sge i64 %dec, 0
  br i1 %cmp, label %for.body, label %for.end

for.end:                                          ; preds = %for.body, %entry
  ret void
}
; This case requires SCEVFolder in LoopIdiomRecognize.cpp to fold SCEV prior to comparison.
; For the inner-loop, SCEVFolder is not needed, however the promoted memset size would be based
; on the trip count of inner-loop (which is an unsigned integer).
; Then in the outer loop, the pointer stride SCEV for memset needs to be converted based on the
; loop guard for it to be equal to the memset size SCEV. The loop guard guarantees that m >= 0
; inside the loop, so m can be converted from sext to zext, making the two SCEV-s equal.
; void NestedFor32(int *ar, int n, int m, int o)
; {
;   int i, j;
;   for (i=0; i<n; ++i) {
;     for (j=0; j<m; j++) {
;       int *arr = ar + i * m * o + j * o;
;       memset(arr, 0, o * sizeof(int));
;     }
;   }
; }
define void @NestedFor32(ptr %ar, i32 %n, i32 %m, i32 %o) {
; CHECK-LABEL: @NestedFor32(
; CHECK-NEXT:  entry:
; CHECK-NEXT:    [[CMP3:%.*]] = icmp slt i32 0, [[N:%.*]]
; CHECK-NEXT:    br i1 [[CMP3]], label [[FOR_BODY_LR_PH:%.*]], label [[FOR_END11:%.*]]
; CHECK:       for.body.lr.ph:
; CHECK-NEXT:    [[CMP21:%.*]] = icmp slt i32 0, [[M:%.*]]
; CHECK-NEXT:    [[CONV:%.*]] = sext i32 [[O:%.*]] to i64
; CHECK-NEXT:    [[MUL8:%.*]] = mul i64 [[CONV]], 4
; CHECK-NEXT:    br i1 [[CMP21]], label [[FOR_BODY_US_PREHEADER:%.*]], label [[FOR_END11]]
; CHECK:       for.body.us.preheader:
; CHECK-NEXT:    [[TMP0:%.*]] = sext i32 [[O]] to i64
; CHECK-NEXT:    [[TMP1:%.*]] = sext i32 [[M]] to i64
; CHECK-NEXT:    [[WIDE_TRIP_COUNT10:%.*]] = zext i32 [[N]] to i64
; CHECK-NEXT:    [[TMP2:%.*]] = mul i64 [[TMP0]], [[TMP1]]
; CHECK-NEXT:    [[TMP3:%.*]] = shl i64 [[TMP2]], 2
; CHECK-NEXT:    [[TMP4:%.*]] = zext i32 [[M]] to i64
; CHECK-NEXT:    [[TMP5:%.*]] = mul i64 [[TMP0]], [[TMP4]]
; CHECK-NEXT:    [[TMP6:%.*]] = shl i64 [[TMP5]], 2
; CHECK-NEXT:    [[TMP7:%.*]] = mul i64 [[TMP5]], [[WIDE_TRIP_COUNT10]]
; CHECK-NEXT:    [[TMP8:%.*]] = shl i64 [[TMP7]], 2
; CHECK-NEXT:    call void @llvm.memset.p0.i64(ptr align 4 [[AR:%.*]], i8 0, i64 [[TMP8]], i1 false)
; CHECK-NEXT:    br label [[FOR_END11]]
; CHECK:       for.end11:
; CHECK-NEXT:    ret void
;
entry:
  %cmp3 = icmp slt i32 0, %n
  br i1 %cmp3, label %for.body.lr.ph, label %for.end11

for.body.lr.ph:                                   ; preds = %entry
  %cmp21 = icmp slt i32 0, %m
  %conv = sext i32 %o to i64
  %mul8 = mul i64 %conv, 4
  br i1 %cmp21, label %for.body.us.preheader, label %for.end11

for.body.us.preheader:                            ; preds = %for.body.lr.ph
  %0 = sext i32 %o to i64
  %1 = sext i32 %m to i64
  %2 = sext i32 %o to i64
  %wide.trip.count10 = zext i32 %n to i64
  br label %for.body.us

for.body.us:                                      ; preds = %for.body.us.preheader, %for.cond1.for.end_crit_edge.us
  %indvars.iv6 = phi i64 [ 0, %for.body.us.preheader ], [ %indvars.iv.next7, %for.cond1.for.end_crit_edge.us ]
  %3 = mul nsw i64 %indvars.iv6, %1
  %4 = mul nsw i64 %3, %2
  %add.ptr.us = getelementptr inbounds i32, ptr %ar, i64 %4
  %wide.trip.count = zext i32 %m to i64
  br label %for.body3.us

for.body3.us:                                     ; preds = %for.body.us, %for.body3.us
  %indvars.iv = phi i64 [ 0, %for.body.us ], [ %indvars.iv.next, %for.body3.us ]
  %5 = mul nsw i64 %indvars.iv, %0
  %add.ptr7.us = getelementptr inbounds i32, ptr %add.ptr.us, i64 %5
  call void @llvm.memset.p0.i64(ptr align 4 %add.ptr7.us, i8 0, i64 %mul8, i1 false)
  %indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
  %exitcond = icmp ne i64 %indvars.iv.next, %wide.trip.count
  br i1 %exitcond, label %for.body3.us, label %for.cond1.for.end_crit_edge.us

for.cond1.for.end_crit_edge.us:                   ; preds = %for.body3.us
  %indvars.iv.next7 = add nuw nsw i64 %indvars.iv6, 1
  %exitcond11 = icmp ne i64 %indvars.iv.next7, %wide.trip.count10
  br i1 %exitcond11, label %for.body.us, label %for.end11.loopexit

for.end11.loopexit:                               ; preds = %for.cond1.for.end_crit_edge.us
  br label %for.end11

for.end11:                                        ; preds = %for.end11.loopexit, %for.body.lr.ph, %entry
  ret void
}

; void NegStart(int n, int m, int *ar) {
;   for (int i = -100; i < n; i++) {
;     int *arr = ar + (i + 100) * m;
;     memset(arr, 0, m * sizeof(int));
;   }
; }
define void @NegStart(i32 %n, i32 %m, ptr %ar) {
; CHECK-LABEL: @NegStart(
; CHECK-NEXT:  entry:
; CHECK-NEXT:    [[CMP1:%.*]] = icmp slt i32 -100, [[N:%.*]]
; CHECK-NEXT:    br i1 [[CMP1]], label [[FOR_BODY_LR_PH:%.*]], label [[FOR_END:%.*]]
; CHECK:       for.body.lr.ph:
; CHECK-NEXT:    [[CONV:%.*]] = sext i32 [[M:%.*]] to i64
; CHECK-NEXT:    [[MUL1:%.*]] = mul i64 [[CONV]], 4
; CHECK-NEXT:    [[TMP0:%.*]] = sext i32 [[M]] to i64
; CHECK-NEXT:    [[WIDE_TRIP_COUNT:%.*]] = sext i32 [[N]] to i64
; CHECK-NEXT:    [[TMP1:%.*]] = add nsw i64 [[WIDE_TRIP_COUNT]], 100
; CHECK-NEXT:    [[TMP2:%.*]] = mul i64 [[TMP1]], [[TMP0]]
; CHECK-NEXT:    [[TMP3:%.*]] = shl i64 [[TMP2]], 2
; CHECK-NEXT:    call void @llvm.memset.p0.i64(ptr align 4 [[AR:%.*]], i8 0, i64 [[TMP3]], i1 false)
; CHECK-NEXT:    br label [[FOR_END]]
; CHECK:       for.end:
; CHECK-NEXT:    ret void
;
entry:
  %cmp1 = icmp slt i32 -100, %n
  br i1 %cmp1, label %for.body.lr.ph, label %for.end

for.body.lr.ph:                                   ; preds = %entry
  %conv = sext i32 %m to i64
  %mul1 = mul i64 %conv, 4
  %0 = sext i32 %m to i64
  %wide.trip.count = sext i32 %n to i64
  br label %for.body

for.body:                                         ; preds = %for.body.lr.ph, %for.body
  %indvars.iv = phi i64 [ -100, %for.body.lr.ph ], [ %indvars.iv.next, %for.body ]
  %1 = add nsw i64 %indvars.iv, 100
  %2 = mul nsw i64 %1, %0
  %add.ptr = getelementptr inbounds i32, ptr %ar, i64 %2
  call void @llvm.memset.p0.i64(ptr align 4 %add.ptr, i8 0, i64 %mul1, i1 false)
  %indvars.iv.next = add nsw i64 %indvars.iv, 1
  %exitcond = icmp ne i64 %indvars.iv.next, %wide.trip.count
  br i1 %exitcond, label %for.body, label %for.end.loopexit

for.end.loopexit:                                 ; preds = %for.body
  br label %for.end

for.end:                                          ; preds = %for.end.loopexit, %entry
  ret void
}

declare void @llvm.memset.p0.i64(ptr nocapture writeonly, i8, i64, i1 immarg)