1df7eb202SAlexey Bataev; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 4 2df7eb202SAlexey Bataev; RUN: opt -S --passes=slp-vectorizer -mtriple=riscv64-unknown-linux -mattr=+v < %s | FileCheck %s 3df7eb202SAlexey Bataev 4df7eb202SAlexey Bataevdefine void @test(ptr %p, i16 %load794) { 5df7eb202SAlexey Bataev; CHECK-LABEL: define void @test( 6df7eb202SAlexey Bataev; CHECK-SAME: ptr [[P:%.*]], i16 [[LOAD794:%.*]]) #[[ATTR0:[0-9]+]] { 7df7eb202SAlexey Bataev; CHECK-NEXT: [[ZEXT795:%.*]] = zext i16 [[LOAD794]] to i32 8df7eb202SAlexey Bataev; CHECK-NEXT: [[GEP799:%.*]] = getelementptr inbounds i8, ptr [[P]], i64 16 9df7eb202SAlexey Bataev; CHECK-NEXT: [[TMP1:%.*]] = load <2 x i16>, ptr [[P]], align 2 10df7eb202SAlexey Bataev; CHECK-NEXT: [[TMP2:%.*]] = load <2 x i16>, ptr [[GEP799]], align 2 114d7f3d9eSAlexey Bataev; CHECK-NEXT: [[TMP3:%.*]] = zext <2 x i16> [[TMP1]] to <2 x i32> 124d7f3d9eSAlexey Bataev; CHECK-NEXT: [[TMP4:%.*]] = zext <2 x i16> [[TMP2]] to <2 x i32> 134d7f3d9eSAlexey Bataev; CHECK-NEXT: [[TMP7:%.*]] = sub nsw <2 x i32> [[TMP4]], [[TMP3]] 14*38fffa63SPaul Walker; CHECK-NEXT: [[TMP8:%.*]] = add nsw <2 x i32> [[TMP7]], splat (i32 3329) 15df7eb202SAlexey Bataev; CHECK-NEXT: [[TMP5:%.*]] = insertelement <2 x i32> poison, i32 [[ZEXT795]], i32 0 16df7eb202SAlexey Bataev; CHECK-NEXT: [[TMP6:%.*]] = shufflevector <2 x i32> [[TMP5]], <2 x i32> poison, <2 x i32> zeroinitializer 174d7f3d9eSAlexey Bataev; CHECK-NEXT: [[TMP12:%.*]] = mul <2 x i32> [[TMP8]], [[TMP6]] 184d7f3d9eSAlexey Bataev; CHECK-NEXT: [[TMP9:%.*]] = zext <2 x i32> [[TMP12]] to <2 x i64> 19*38fffa63SPaul Walker; CHECK-NEXT: [[TMP22:%.*]] = mul nuw nsw <2 x i64> [[TMP9]], splat (i64 5039) 20*38fffa63SPaul Walker; CHECK-NEXT: [[TMP11:%.*]] = lshr <2 x i64> [[TMP22]], splat (i64 24) 214d7f3d9eSAlexey Bataev; CHECK-NEXT: [[TMP13:%.*]] = trunc <2 x i64> [[TMP11]] to <2 x i32> 22*38fffa63SPaul Walker; CHECK-NEXT: [[TMP20:%.*]] = mul <2 x i32> [[TMP13]], splat (i32 62207) 234d7f3d9eSAlexey Bataev; CHECK-NEXT: [[TMP21:%.*]] = add <2 x i32> [[TMP20]], [[TMP12]] 244d7f3d9eSAlexey Bataev; CHECK-NEXT: [[TMP14:%.*]] = trunc <2 x i32> [[TMP21]] to <2 x i16> 25*38fffa63SPaul Walker; CHECK-NEXT: [[TMP15:%.*]] = add <2 x i16> [[TMP14]], splat (i16 -3329) 26df7eb202SAlexey Bataev; CHECK-NEXT: [[TMP16:%.*]] = icmp slt <2 x i16> [[TMP15]], zeroinitializer 27df7eb202SAlexey Bataev; CHECK-NEXT: [[TMP17:%.*]] = select <2 x i1> [[TMP16]], <2 x i16> [[TMP14]], <2 x i16> zeroinitializer 28df7eb202SAlexey Bataev; CHECK-NEXT: [[TMP18:%.*]] = call <2 x i16> @llvm.smax.v2i16(<2 x i16> [[TMP15]], <2 x i16> zeroinitializer) 29df7eb202SAlexey Bataev; CHECK-NEXT: [[TMP19:%.*]] = or <2 x i16> [[TMP17]], [[TMP18]] 30df7eb202SAlexey Bataev; CHECK-NEXT: store <2 x i16> [[TMP19]], ptr [[P]], align 2 31df7eb202SAlexey Bataev; CHECK-NEXT: ret void 32df7eb202SAlexey Bataev; 33df7eb202SAlexey Bataev %zext795 = zext i16 %load794 to i32 34df7eb202SAlexey Bataev %load798 = load i16, ptr %p, align 2 35df7eb202SAlexey Bataev %gep799 = getelementptr inbounds i8, ptr %p, i64 16 36df7eb202SAlexey Bataev %load800 = load i16, ptr %gep799, align 2 37df7eb202SAlexey Bataev %zext801 = zext i16 %load798 to i32 38df7eb202SAlexey Bataev %zext802 = zext i16 %load800 to i32 39df7eb202SAlexey Bataev %sub809 = sub nsw i32 %zext802, %zext801 40df7eb202SAlexey Bataev %add810 = add nsw i32 %sub809, 3329 41df7eb202SAlexey Bataev %mul811 = mul i32 %add810, %zext795 42df7eb202SAlexey Bataev %zext812 = zext i32 %mul811 to i64 43df7eb202SAlexey Bataev %mul813 = mul nuw nsw i64 %zext812, 5039 44df7eb202SAlexey Bataev %lshr814 = lshr i64 %mul813, 24 45df7eb202SAlexey Bataev %trunc815 = trunc nuw nsw i64 %lshr814 to i32 46df7eb202SAlexey Bataev %mul816 = mul i32 %trunc815, 62207 47df7eb202SAlexey Bataev %add817 = add i32 %mul816, %mul811 48df7eb202SAlexey Bataev %trunc818 = trunc i32 %add817 to i16 49df7eb202SAlexey Bataev %add819 = add i16 %trunc818, -3329 50df7eb202SAlexey Bataev %icmp820 = icmp slt i16 %add819, 0 51df7eb202SAlexey Bataev %select821 = select i1 %icmp820, i16 %trunc818, i16 0 52df7eb202SAlexey Bataev %call822 = call i16 @llvm.smax.i16(i16 %add819, i16 0) 53df7eb202SAlexey Bataev %or823 = or i16 %select821, %call822 54df7eb202SAlexey Bataev store i16 %or823, ptr %p, align 2 55df7eb202SAlexey Bataev %gep826 = getelementptr inbounds i8, ptr %p, i64 2 56df7eb202SAlexey Bataev %load827 = load i16, ptr %gep826, align 2 57df7eb202SAlexey Bataev %gep828 = getelementptr inbounds i8, ptr %p, i64 18 58df7eb202SAlexey Bataev %load829 = load i16, ptr %gep828, align 2 59df7eb202SAlexey Bataev %zext830 = zext i16 %load827 to i32 60df7eb202SAlexey Bataev %zext831 = zext i16 %load829 to i32 61df7eb202SAlexey Bataev %sub838 = sub nsw i32 %zext831, %zext830 62df7eb202SAlexey Bataev %add839 = add nsw i32 %sub838, 3329 63df7eb202SAlexey Bataev %mul840 = mul i32 %add839, %zext795 64df7eb202SAlexey Bataev %zext841 = zext i32 %mul840 to i64 65df7eb202SAlexey Bataev %mul842 = mul nuw nsw i64 %zext841, 5039 66df7eb202SAlexey Bataev %lshr843 = lshr i64 %mul842, 24 67df7eb202SAlexey Bataev %trunc844 = trunc nuw nsw i64 %lshr843 to i32 68df7eb202SAlexey Bataev %mul845 = mul i32 %trunc844, 62207 69df7eb202SAlexey Bataev %add846 = add i32 %mul845, %mul840 70df7eb202SAlexey Bataev %trunc847 = trunc i32 %add846 to i16 71df7eb202SAlexey Bataev %add848 = add i16 %trunc847, -3329 72df7eb202SAlexey Bataev %icmp849 = icmp slt i16 %add848, 0 73df7eb202SAlexey Bataev %select850 = select i1 %icmp849, i16 %trunc847, i16 0 74df7eb202SAlexey Bataev %call851 = call i16 @llvm.smax.i16(i16 %add848, i16 0) 75df7eb202SAlexey Bataev %or852 = or i16 %select850, %call851 76df7eb202SAlexey Bataev store i16 %or852, ptr %gep826, align 2 77df7eb202SAlexey Bataev ret void 78df7eb202SAlexey Bataev} 79df7eb202SAlexey Bataev 80