; RUN: llc -verify-machineinstrs < %s -enable-misched -mcpu=a2 -mtriple=powerpc64-unknown-linux-gnu | FileCheck %s
; RUN: llc -verify-machineinstrs < %s -enable-misched -enable-aa-sched-mi -mcpu=a2 -mtriple=powerpc64-unknown-linux-gnu | FileCheck %s

; Scheduling test for the PowerPC A2 with the machine scheduler enabled.
; Both llc invocations above (without and with -enable-aa-sched-mi) must
; produce a loop body for @s000 in which every floating-point load is issued
; before the first floating-point store.
;
; The inner loop of @s000 reads from @Y and writes to @X, two distinct
; external globals, in four load / fadd / store groups per iteration.

target datalayout = "E-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-f128:128:128-v128:128:128-n32:64"

; External data referenced by the test. Only @X and @Y are accessed by the
; inner loop; the remaining arrays are merely passed to @dummy.
@aa = external global [256 x [256 x double]], align 32
@bb = external global [256 x [256 x double]], align 32
@cc = external global [256 x [256 x double]], align 32
@.str1 = external hidden unnamed_addr constant [6 x i8], align 1
@X = external global [16000 x double], align 32
@Y = external global [16000 x double], align 32
@Z = external global [16000 x double], align 32
@U = external global [16000 x double], align 32
@V = external global [16000 x double], align 32
@.str137 = external hidden unnamed_addr constant [14 x i8], align 1

declare void @check(i32 signext) nounwind

declare signext i32 @printf(ptr nocapture, ...) nounwind

declare signext i32 @init(ptr) nounwind

; @s000: calls @init and @clock, then runs the outer loop 400000 times. Each
; outer iteration executes the inner loop over indices 0..15999 in steps of 16
; and then calls @dummy. Afterwards the elapsed @clock difference is converted
; to double, divided by 1.0e6, printed via @printf, and @check(1) is called.
; Always returns 0.
define signext i32 @s000() nounwind {
entry:
  %call = tail call signext i32 @init(ptr @.str1)
  %call1 = tail call i64 @clock() nounwind
  br label %for.cond2.preheader

; CHECK: @s000

; Outer loop header: %nl.018 counts completed outer iterations.
for.cond2.preheader:                              ; preds = %for.end, %entry
  %nl.018 = phi i32 [ 0, %entry ], [ %inc9, %for.end ]
  br label %for.body4

; Inner loop body. %indvars.iv starts at 0 and advances by 16, so its low four
; bits are always zero and or-ing in 4, 8 or 12 yields the same value as
; adding it. Each group loads one element of @Y, adds 1.0 and stores the
; result to the same index of @X.
for.body4:                                        ; preds = %for.body4, %for.cond2.preheader
  %indvars.iv = phi i64 [ 0, %for.cond2.preheader ], [ %indvars.iv.next.15, %for.body4 ]
  ; Group at index %indvars.iv.
  %arrayidx = getelementptr inbounds [16000 x double], ptr @Y, i64 0, i64 %indvars.iv
  %arrayidx6 = getelementptr inbounds [16000 x double], ptr @X, i64 0, i64 %indvars.iv
  %0 = load <1 x double>, ptr %arrayidx, align 32
  %add = fadd <1 x double> %0, <double 1.000000e+00>
  store <1 x double> %add, ptr %arrayidx6, align 32
  ; Group at index %indvars.iv + 4.
  %indvars.iv.next.322 = or i64 %indvars.iv, 4
  %arrayidx.4 = getelementptr inbounds [16000 x double], ptr @Y, i64 0, i64 %indvars.iv.next.322
  %arrayidx6.4 = getelementptr inbounds [16000 x double], ptr @X, i64 0, i64 %indvars.iv.next.322
  %1 = load <1 x double>, ptr %arrayidx.4, align 32
  %add.4 = fadd <1 x double> %1, <double 1.000000e+00>
  store <1 x double> %add.4, ptr %arrayidx6.4, align 32
  ; Group at index %indvars.iv + 8.
  %indvars.iv.next.726 = or i64 %indvars.iv, 8
  %arrayidx.8 = getelementptr inbounds [16000 x double], ptr @Y, i64 0, i64 %indvars.iv.next.726
  %arrayidx6.8 = getelementptr inbounds [16000 x double], ptr @X, i64 0, i64 %indvars.iv.next.726
  %2 = load <1 x double>, ptr %arrayidx.8, align 32
  %add.8 = fadd <1 x double> %2, <double 1.000000e+00>
  store <1 x double> %add.8, ptr %arrayidx6.8, align 32
  ; Group at index %indvars.iv + 12.
  %indvars.iv.next.1130 = or i64 %indvars.iv, 12
  %arrayidx.12 = getelementptr inbounds [16000 x double], ptr @Y, i64 0, i64 %indvars.iv.next.1130
  %arrayidx6.12 = getelementptr inbounds [16000 x double], ptr @X, i64 0, i64 %indvars.iv.next.1130
  %3 = load <1 x double>, ptr %arrayidx.12, align 32
  %add.12 = fadd <1 x double> %3, <double 1.000000e+00>
  store <1 x double> %add.12, ptr %arrayidx6.12, align 32
  ; Advance by 16 and leave the loop once the truncated counter reaches 16000.
  %indvars.iv.next.15 = add i64 %indvars.iv, 16
  %lftr.wideiv.15 = trunc i64 %indvars.iv.next.15 to i32
  %exitcond.15 = icmp eq i32 %lftr.wideiv.15, 16000
  br i1 %exitcond.15, label %for.end, label %for.body4

; All of the loads should come before all of the stores.
; The directives below enforce this: after mtctr, FileCheck finds the first
; stfd and then requires that no lfd appears between that store and the bdnz
; that closes the loop.
; CHECK: mtctr
; CHECK: stfd
; CHECK-NOT: lfd
; CHECK: bdnz

; Outer loop latch: hand every array to @dummy, then repeat until 400000
; outer iterations have completed.
for.end:                                          ; preds = %for.body4
  %call7 = tail call signext i32 @dummy(ptr @X, ptr @Y, ptr @Z, ptr @U, ptr @V, ptr @aa, ptr @bb, ptr @cc, double 0.000000e+00) nounwind
  %inc9 = add nsw i32 %nl.018, 1
  %exitcond = icmp eq i32 %inc9, 400000
  br i1 %exitcond, label %for.end10, label %for.cond2.preheader

; Epilogue: print (second @clock value - first @clock value) / 1.0e6 using the
; format string @.str137, call @check(1) and return 0.
for.end10:                                        ; preds = %for.end
  %call11 = tail call i64 @clock() nounwind
  %sub = sub nsw i64 %call11, %call1
  %conv = sitofp i64 %sub to double
  %div = fdiv double %conv, 1.000000e+06
  %call12 = tail call signext i32 (ptr, ...) @printf(ptr @.str137, double %div) nounwind
  tail call void @check(i32 signext 1)
  ret i32 0
}

declare i64 @clock() nounwind

declare signext i32 @dummy(ptr, ptr, ptr, ptr, ptr, ptr, ptr, ptr, double)