; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
; RUN: opt -S -passes=slp-vectorizer -mtriple=x86_64-unknown-linux -debug-counter=slp-vectorized=0 -slp-threshold=-99999 < %s | FileCheck %s --check-prefix=COUNT0
; RUN: opt -S -passes=slp-vectorizer -mtriple=x86_64-unknown-linux -debug-counter=slp-vectorized=1 -slp-threshold=-99999 < %s | FileCheck %s --check-prefix=COUNT1
; RUN: opt -S -passes=slp-vectorizer -mtriple=x86_64-unknown-linux -debug-counter=slp-vectorized=2 -slp-threshold=-99999 < %s | FileCheck %s --check-prefix=COUNT2
; RUN: opt -S -passes=slp-vectorizer -mtriple=x86_64-unknown-linux -debug-counter=slp-vectorized=0-1 -slp-threshold=-99999 < %s | FileCheck %s --check-prefix=COUNT-1
; REQUIRES: asserts

; Exercises the "slp-vectorized" debug counter of the SLP vectorizer. The same
; function is piped through opt four times, each time with a different counter
; setting, and every run is verified under its own check prefix.
;
; What the expectations below show:
;   * The COUNT0 and COUNT-1 groups (counter settings 0 and 0-1) expect the
;     same output, in which the computation is carried out on <2 x double>
;     values and finishes with a single vector store.
;   * The COUNT1 and COUNT2 groups (counter settings 1 and 2) expect both
;     scalar stores to survive, with only one small <2 x double> fcmp/select
;     group whose lanes are extracted back into scalars.
;
; NOTE(review): presumably the counter setting selects which counted
; vectorization attempts are allowed to take effect, the very negative
; -slp-threshold makes every candidate look profitable, and the asserts
; requirement exists because debug counters are not usable in release
; builds -- confirm against the DebugCounter documentation.

define void @blam(ptr %arg, double %load2, i1 %fcmp3) {
; COUNT0-LABEL: define void @blam
; COUNT0-SAME: (ptr [[ARG:%.*]], double [[LOAD2:%.*]], i1 [[FCMP3:%.*]]) {
; COUNT0-NEXT:  bb:
; COUNT0-NEXT:    [[GETELEMENTPTR13:%.*]] = getelementptr double, ptr [[ARG]], i64 3
; COUNT0-NEXT:    [[TMP0:%.*]] = load <2 x double>, ptr [[ARG]], align 8
; COUNT0-NEXT:    [[TMP1:%.*]] = insertelement <2 x i1> poison, i1 [[FCMP3]], i32 0
; COUNT0-NEXT:    [[TMP2:%.*]] = shufflevector <2 x i1> [[TMP1]], <2 x i1> poison, <2 x i32> zeroinitializer
; COUNT0-NEXT:    [[TMP3:%.*]] = select <2 x i1> [[TMP2]], <2 x double> zeroinitializer, <2 x double> [[TMP0]]
; COUNT0-NEXT:    [[TMP4:%.*]] = insertelement <2 x double> [[TMP0]], double [[LOAD2]], i32 0
; COUNT0-NEXT:    [[TMP5:%.*]] = fcmp olt <2 x double> [[TMP4]], zeroinitializer
; COUNT0-NEXT:    [[TMP6:%.*]] = select <2 x i1> [[TMP5]], <2 x double> zeroinitializer, <2 x double> [[TMP0]]
; COUNT0-NEXT:    [[TMP7:%.*]] = fcmp olt <2 x double> [[TMP3]], zeroinitializer
; COUNT0-NEXT:    [[TMP8:%.*]] = select <2 x i1> [[TMP7]], <2 x double> <double 0.000000e+00, double 1.000000e+00>, <2 x double> <double 1.000000e+00, double 0.000000e+00>
; COUNT0-NEXT:    [[TMP9:%.*]] = shufflevector <2 x double> [[TMP8]], <2 x double> poison, <2 x i32> <i32 1, i32 0>
; COUNT0-NEXT:    [[TMP10:%.*]] = fcmp olt <2 x double> [[TMP9]], [[TMP6]]
; COUNT0-NEXT:    [[TMP11:%.*]] = shufflevector <2 x double> [[TMP4]], <2 x double> <double poison, double 0.000000e+00>, <2 x i32> <i32 0, i32 3>
; COUNT0-NEXT:    [[TMP12:%.*]] = shufflevector <2 x double> [[TMP4]], <2 x double> <double 0.000000e+00, double poison>, <2 x i32> <i32 2, i32 0>
; COUNT0-NEXT:    [[TMP13:%.*]] = select <2 x i1> [[TMP10]], <2 x double> [[TMP11]], <2 x double> [[TMP12]]
; COUNT0-NEXT:    [[TMP14:%.*]] = fcmp olt <2 x double> [[TMP13]], zeroinitializer
; COUNT0-NEXT:    [[TMP15:%.*]] = select <2 x i1> [[TMP14]], <2 x double> zeroinitializer, <2 x double> splat (double 1.000000e+00)
; COUNT0-NEXT:    [[TMP16:%.*]] = fcmp ogt <2 x double> [[TMP15]], zeroinitializer
; COUNT0-NEXT:    [[TMP17:%.*]] = shufflevector <2 x double> [[TMP4]], <2 x double> poison, <2 x i32> zeroinitializer
; COUNT0-NEXT:    [[TMP18:%.*]] = select <2 x i1> [[TMP16]], <2 x double> zeroinitializer, <2 x double> [[TMP17]]
; COUNT0-NEXT:    [[TMP19:%.*]] = fcmp olt <2 x double> [[TMP18]], zeroinitializer
; COUNT0-NEXT:    [[TMP20:%.*]] = select <2 x i1> [[TMP19]], <2 x double> splat (double 1.000000e+00), <2 x double> zeroinitializer
; COUNT0-NEXT:    store <2 x double> [[TMP20]], ptr [[GETELEMENTPTR13]], align 8
; COUNT0-NEXT:    ret void
;
; COUNT1-LABEL: define void @blam
; COUNT1-SAME: (ptr [[ARG:%.*]], double [[LOAD2:%.*]], i1 [[FCMP3:%.*]]) {
; COUNT1-NEXT:  bb:
; COUNT1-NEXT:    [[GETELEMENTPTR:%.*]] = getelementptr double, ptr [[ARG]], i64 1
; COUNT1-NEXT:    [[LOAD:%.*]] = load double, ptr [[GETELEMENTPTR]], align 8
; COUNT1-NEXT:    [[FCMP:%.*]] = fcmp olt double [[LOAD]], 0.000000e+00
; COUNT1-NEXT:    [[SELECT3:%.*]] = select i1 [[FCMP]], double 0.000000e+00, double [[LOAD]]
; COUNT1-NEXT:    [[SELECT4:%.*]] = select i1 [[FCMP3]], double 0.000000e+00, double [[LOAD]]
; COUNT1-NEXT:    [[LOAD7:%.*]] = load double, ptr [[ARG]], align 8
; COUNT1-NEXT:    [[SELECT10:%.*]] = select i1 [[FCMP3]], double 0.000000e+00, double [[LOAD7]]
; COUNT1-NEXT:    [[GETELEMENTPTR13:%.*]] = getelementptr double, ptr [[ARG]], i64 3
; COUNT1-NEXT:    [[GETELEMENTPTR21:%.*]] = getelementptr double, ptr [[ARG]], i64 4
; COUNT1-NEXT:    [[FCMP23:%.*]] = fcmp olt double [[SELECT10]], 0.000000e+00
; COUNT1-NEXT:    [[SELECT24:%.*]] = select i1 [[FCMP23]], double 0.000000e+00, double 1.000000e+00
; COUNT1-NEXT:    [[TMP0:%.*]] = insertelement <2 x double> poison, double [[LOAD2]], i32 1
; COUNT1-NEXT:    [[TMP1:%.*]] = insertelement <2 x double> [[TMP0]], double [[SELECT4]], i32 0
; COUNT1-NEXT:    [[TMP2:%.*]] = fcmp olt <2 x double> [[TMP1]], zeroinitializer
; COUNT1-NEXT:    [[TMP3:%.*]] = insertelement <2 x double> <double 0.000000e+00, double poison>, double [[LOAD7]], i32 1
; COUNT1-NEXT:    [[TMP4:%.*]] = select <2 x i1> [[TMP2]], <2 x double> <double 1.000000e+00, double 0.000000e+00>, <2 x double> [[TMP3]]
; COUNT1-NEXT:    [[FCMP33:%.*]] = fcmp olt double [[SELECT24]], [[SELECT3]]
; COUNT1-NEXT:    [[SELECT34:%.*]] = select i1 [[FCMP33]], double 0.000000e+00, double [[LOAD2]]
; COUNT1-NEXT:    [[TMP5:%.*]] = extractelement <2 x double> [[TMP4]], i32 0
; COUNT1-NEXT:    [[TMP6:%.*]] = extractelement <2 x double> [[TMP4]], i32 1
; COUNT1-NEXT:    [[FCMP39:%.*]] = fcmp olt double [[TMP5]], [[TMP6]]
; COUNT1-NEXT:    [[SELECT40:%.*]] = select i1 [[FCMP39]], double [[LOAD2]], double 0.000000e+00
; COUNT1-NEXT:    [[FCMP62:%.*]] = fcmp olt double [[SELECT34]], 0.000000e+00
; COUNT1-NEXT:    [[SELECT639:%.*]] = select i1 [[FCMP62]], double 0.000000e+00, double 1.000000e+00
; COUNT1-NEXT:    [[FCMP76:%.*]] = fcmp olt double [[SELECT40]], 0.000000e+00
; COUNT1-NEXT:    [[SELECT77:%.*]] = select i1 [[FCMP76]], double 0.000000e+00, double 1.000000e+00
; COUNT1-NEXT:    [[FCMP90:%.*]] = fcmp ogt double [[SELECT639]], 0.000000e+00
; COUNT1-NEXT:    [[SELECT91:%.*]] = select i1 [[FCMP90]], double 0.000000e+00, double [[LOAD2]]
; COUNT1-NEXT:    [[FCMP92:%.*]] = fcmp ogt double [[SELECT77]], 0.000000e+00
; COUNT1-NEXT:    [[SELECT93:%.*]] = select i1 [[FCMP92]], double 0.000000e+00, double [[LOAD2]]
; COUNT1-NEXT:    [[FCMP108:%.*]] = fcmp olt double [[SELECT93]], 0.000000e+00
; COUNT1-NEXT:    [[SELECT109:%.*]] = select i1 [[FCMP108]], double 1.000000e+00, double 0.000000e+00
; COUNT1-NEXT:    [[FCMP110:%.*]] = fcmp olt double [[SELECT91]], 0.000000e+00
; COUNT1-NEXT:    [[SELECT111:%.*]] = select i1 [[FCMP110]], double 1.000000e+00, double 0.000000e+00
; COUNT1-NEXT:    store double [[SELECT111]], ptr [[GETELEMENTPTR21]], align 8
; COUNT1-NEXT:    store double [[SELECT109]], ptr [[GETELEMENTPTR13]], align 8
; COUNT1-NEXT:    ret void
;
; COUNT2-LABEL: define void @blam
; COUNT2-SAME: (ptr [[ARG:%.*]], double [[LOAD2:%.*]], i1 [[FCMP3:%.*]]) {
; COUNT2-NEXT:  bb:
; COUNT2-NEXT:    [[GETELEMENTPTR:%.*]] = getelementptr double, ptr [[ARG]], i64 1
; COUNT2-NEXT:    [[LOAD:%.*]] = load double, ptr [[GETELEMENTPTR]], align 8
; COUNT2-NEXT:    [[SELECT4:%.*]] = select i1 [[FCMP3]], double 0.000000e+00, double [[LOAD]]
; COUNT2-NEXT:    [[LOAD7:%.*]] = load double, ptr [[ARG]], align 8
; COUNT2-NEXT:    [[SELECT10:%.*]] = select i1 [[FCMP3]], double 0.000000e+00, double [[LOAD7]]
; COUNT2-NEXT:    [[FCMP11:%.*]] = fcmp olt double [[LOAD2]], 0.000000e+00
; COUNT2-NEXT:    [[SELECT128:%.*]] = select i1 [[FCMP11]], double 0.000000e+00, double [[LOAD7]]
; COUNT2-NEXT:    [[GETELEMENTPTR13:%.*]] = getelementptr double, ptr [[ARG]], i64 3
; COUNT2-NEXT:    [[GETELEMENTPTR21:%.*]] = getelementptr double, ptr [[ARG]], i64 4
; COUNT2-NEXT:    [[TMP0:%.*]] = insertelement <2 x double> poison, double [[SELECT10]], i32 0
; COUNT2-NEXT:    [[TMP1:%.*]] = insertelement <2 x double> [[TMP0]], double [[LOAD]], i32 1
; COUNT2-NEXT:    [[TMP2:%.*]] = fcmp olt <2 x double> [[TMP1]], zeroinitializer
; COUNT2-NEXT:    [[TMP3:%.*]] = shufflevector <2 x double> [[TMP1]], <2 x double> <double 1.000000e+00, double poison>, <2 x i32> <i32 2, i32 1>
; COUNT2-NEXT:    [[TMP4:%.*]] = select <2 x i1> [[TMP2]], <2 x double> zeroinitializer, <2 x double> [[TMP3]]
; COUNT2-NEXT:    [[FCMP29:%.*]] = fcmp olt double [[SELECT4]], 0.000000e+00
; COUNT2-NEXT:    [[SELECT30:%.*]] = select i1 [[FCMP29]], double 1.000000e+00, double 0.000000e+00
; COUNT2-NEXT:    [[TMP5:%.*]] = extractelement <2 x double> [[TMP4]], i32 0
; COUNT2-NEXT:    [[TMP6:%.*]] = extractelement <2 x double> [[TMP4]], i32 1
; COUNT2-NEXT:    [[FCMP33:%.*]] = fcmp olt double [[TMP5]], [[TMP6]]
; COUNT2-NEXT:    [[SELECT34:%.*]] = select i1 [[FCMP33]], double 0.000000e+00, double [[LOAD2]]
; COUNT2-NEXT:    [[FCMP39:%.*]] = fcmp olt double [[SELECT30]], [[SELECT128]]
; COUNT2-NEXT:    [[SELECT40:%.*]] = select i1 [[FCMP39]], double [[LOAD2]], double 0.000000e+00
; COUNT2-NEXT:    [[FCMP62:%.*]] = fcmp olt double [[SELECT34]], 0.000000e+00
; COUNT2-NEXT:    [[SELECT639:%.*]] = select i1 [[FCMP62]], double 0.000000e+00, double 1.000000e+00
; COUNT2-NEXT:    [[FCMP76:%.*]] = fcmp olt double [[SELECT40]], 0.000000e+00
; COUNT2-NEXT:    [[SELECT77:%.*]] = select i1 [[FCMP76]], double 0.000000e+00, double 1.000000e+00
; COUNT2-NEXT:    [[FCMP90:%.*]] = fcmp ogt double [[SELECT639]], 0.000000e+00
; COUNT2-NEXT:    [[SELECT91:%.*]] = select i1 [[FCMP90]], double 0.000000e+00, double [[LOAD2]]
; COUNT2-NEXT:    [[FCMP92:%.*]] = fcmp ogt double [[SELECT77]], 0.000000e+00
; COUNT2-NEXT:    [[SELECT93:%.*]] = select i1 [[FCMP92]], double 0.000000e+00, double [[LOAD2]]
; COUNT2-NEXT:    [[FCMP108:%.*]] = fcmp olt double [[SELECT93]], 0.000000e+00
; COUNT2-NEXT:    [[SELECT109:%.*]] = select i1 [[FCMP108]], double 1.000000e+00, double 0.000000e+00
; COUNT2-NEXT:    [[FCMP110:%.*]] = fcmp olt double [[SELECT91]], 0.000000e+00
; COUNT2-NEXT:    [[SELECT111:%.*]] = select i1 [[FCMP110]], double 1.000000e+00, double 0.000000e+00
; COUNT2-NEXT:    store double [[SELECT111]], ptr [[GETELEMENTPTR21]], align 8
; COUNT2-NEXT:    store double [[SELECT109]], ptr [[GETELEMENTPTR13]], align 8
; COUNT2-NEXT:    ret void
;
; COUNT-1-LABEL: define void @blam
; COUNT-1-SAME: (ptr [[ARG:%.*]], double [[LOAD2:%.*]], i1 [[FCMP3:%.*]]) {
; COUNT-1-NEXT:  bb:
; COUNT-1-NEXT:    [[GETELEMENTPTR13:%.*]] = getelementptr double, ptr [[ARG]], i64 3
; COUNT-1-NEXT:    [[TMP0:%.*]] = load <2 x double>, ptr [[ARG]], align 8
; COUNT-1-NEXT:    [[TMP1:%.*]] = insertelement <2 x i1> poison, i1 [[FCMP3]], i32 0
; COUNT-1-NEXT:    [[TMP2:%.*]] = shufflevector <2 x i1> [[TMP1]], <2 x i1> poison, <2 x i32> zeroinitializer
; COUNT-1-NEXT:    [[TMP3:%.*]] = select <2 x i1> [[TMP2]], <2 x double> zeroinitializer, <2 x double> [[TMP0]]
; COUNT-1-NEXT:    [[TMP4:%.*]] = insertelement <2 x double> [[TMP0]], double [[LOAD2]], i32 0
; COUNT-1-NEXT:    [[TMP5:%.*]] = fcmp olt <2 x double> [[TMP4]], zeroinitializer
; COUNT-1-NEXT:    [[TMP6:%.*]] = select <2 x i1> [[TMP5]], <2 x double> zeroinitializer, <2 x double> [[TMP0]]
; COUNT-1-NEXT:    [[TMP7:%.*]] = fcmp olt <2 x double> [[TMP3]], zeroinitializer
; COUNT-1-NEXT:    [[TMP8:%.*]] = select <2 x i1> [[TMP7]], <2 x double> <double 0.000000e+00, double 1.000000e+00>, <2 x double> <double 1.000000e+00, double 0.000000e+00>
; COUNT-1-NEXT:    [[TMP9:%.*]] = shufflevector <2 x double> [[TMP8]], <2 x double> poison, <2 x i32> <i32 1, i32 0>
; COUNT-1-NEXT:    [[TMP10:%.*]] = fcmp olt <2 x double> [[TMP9]], [[TMP6]]
; COUNT-1-NEXT:    [[TMP11:%.*]] = shufflevector <2 x double> [[TMP4]], <2 x double> <double poison, double 0.000000e+00>, <2 x i32> <i32 0, i32 3>
; COUNT-1-NEXT:    [[TMP12:%.*]] = shufflevector <2 x double> [[TMP4]], <2 x double> <double 0.000000e+00, double poison>, <2 x i32> <i32 2, i32 0>
; COUNT-1-NEXT:    [[TMP13:%.*]] = select <2 x i1> [[TMP10]], <2 x double> [[TMP11]], <2 x double> [[TMP12]]
; COUNT-1-NEXT:    [[TMP14:%.*]] = fcmp olt <2 x double> [[TMP13]], zeroinitializer
; COUNT-1-NEXT:    [[TMP15:%.*]] = select <2 x i1> [[TMP14]], <2 x double> zeroinitializer, <2 x double> splat (double 1.000000e+00)
; COUNT-1-NEXT:    [[TMP16:%.*]] = fcmp ogt <2 x double> [[TMP15]], zeroinitializer
; COUNT-1-NEXT:    [[TMP17:%.*]] = shufflevector <2 x double> [[TMP4]], <2 x double> poison, <2 x i32> zeroinitializer
; COUNT-1-NEXT:    [[TMP18:%.*]] = select <2 x i1> [[TMP16]], <2 x double> zeroinitializer, <2 x double> [[TMP17]]
; COUNT-1-NEXT:    [[TMP19:%.*]] = fcmp olt <2 x double> [[TMP18]], zeroinitializer
; COUNT-1-NEXT:    [[TMP20:%.*]] = select <2 x i1> [[TMP19]], <2 x double> splat (double 1.000000e+00), <2 x double> zeroinitializer
; COUNT-1-NEXT:    store <2 x double> [[TMP20]], ptr [[GETELEMENTPTR13]], align 8
; COUNT-1-NEXT:    ret void
;
bb:
  ; Scalar inputs: arg[1] and arg[0] are loaded; %load2 and %fcmp3 arrive as
  ; plain arguments.
  %getelementptr = getelementptr double, ptr %arg, i64 1
  %load = load double, ptr %getelementptr, align 8
  %fcmp = fcmp olt double %load, 0.000000e+00
  %select3 = select i1 %fcmp, double 0.000000e+00, double %load
  %select4 = select i1 %fcmp3, double 0.000000e+00, double %load
  %load7 = load double, ptr %arg, align 8
  %select10 = select i1 %fcmp3, double 0.000000e+00, double %load7
  %fcmp11 = fcmp olt double %load2, 0.000000e+00
  %select128 = select i1 %fcmp11, double 0.000000e+00, double %load7
  ; Destinations of the two final stores: arg[3] and arg[4].
  %getelementptr13 = getelementptr double, ptr %arg, i64 3
  %getelementptr21 = getelementptr double, ptr %arg, i64 4
  ; Two parallel fcmp/select chains, one feeding each store.
  %fcmp23 = fcmp olt double %select10, 0.000000e+00
  %select24 = select i1 %fcmp23, double 0.000000e+00, double 1.000000e+00
  %fcmp29 = fcmp olt double %select4, 0.000000e+00
  %select30 = select i1 %fcmp29, double 1.000000e+00, double 0.000000e+00
  %fcmp33 = fcmp olt double %select24, %select3
  %select34 = select i1 %fcmp33, double 0.000000e+00, double %load2
  %fcmp39 = fcmp olt double %select30, %select128
  %select40 = select i1 %fcmp39, double %load2, double 0.000000e+00
  %fcmp62 = fcmp olt double %select34, 0.000000e+00
  %select639 = select i1 %fcmp62, double 0.000000e+00, double 1.000000e+00
  %fcmp76 = fcmp olt double %select40, 0.000000e+00
  %select77 = select i1 %fcmp76, double 0.000000e+00, double 1.000000e+00
  %fcmp90 = fcmp ogt double %select639, 0.000000e+00
  %select91 = select i1 %fcmp90, double 0.000000e+00, double %load2
  %fcmp92 = fcmp ogt double %select77, 0.000000e+00
  %select93 = select i1 %fcmp92, double 0.000000e+00, double %load2
  %fcmp108 = fcmp olt double %select93, 0.000000e+00
  %select109 = select i1 %fcmp108, double 1.000000e+00, double 0.000000e+00
  %fcmp110 = fcmp olt double %select91, 0.000000e+00
  %select111 = select i1 %fcmp110, double 1.000000e+00, double 0.000000e+00
  ; Stores to the neighbouring elements arg[4] and arg[3].
  store double %select111, ptr %getelementptr21, align 8
  store double %select109, ptr %getelementptr13, align 8
  ret void
}