1; NOTE: Assertions have been autogenerated by utils/update_test_checks.py 2; RUN: opt -mtriple=thumbv8.1m.main-none-none-eabi -mattr=+mve.fp < %s -codegenprepare -S | FileCheck -check-prefix=CHECK %s 3; RUN: opt -mtriple=thumbv8.1m.main-none-none-eabi -mattr=+mve.fp < %s -codegenprepare -cgpp-huge-func=0 -S | FileCheck -check-prefix=CHECK %s 4 5; Sink the shufflevector/insertelement pair, followed by the trunc. The sunk instruction end up dead. 6define signext i8 @dead(ptr noalias nocapture readonly %s1, i16 zeroext %x, ptr noalias nocapture %d, i32 %n) { 7; CHECK-LABEL: @dead( 8; CHECK-NEXT: entry: 9; CHECK-NEXT: [[N_VEC:%.*]] = and i32 [[N:%.*]], -8 10; CHECK-NEXT: br label [[VECTOR_BODY:%.*]] 11; CHECK: vector.body: 12; CHECK-NEXT: [[INDEX:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ [[INDEX_NEXT:%.*]], [[VECTOR_BODY]] ] 13; CHECK-NEXT: [[TMP0:%.*]] = trunc i16 [[X:%.*]] to i8 14; CHECK-NEXT: [[L6:%.*]] = getelementptr inbounds i16, ptr [[S1:%.*]], i32 [[INDEX]] 15; CHECK-NEXT: [[WIDE_LOAD:%.*]] = load <8 x i16>, ptr [[L6]], align 2 16; CHECK-NEXT: [[L8:%.*]] = trunc <8 x i16> [[WIDE_LOAD]] to <8 x i8> 17; CHECK-NEXT: [[TMP1:%.*]] = insertelement <8 x i8> undef, i8 [[TMP0]], i32 0 18; CHECK-NEXT: [[TMP2:%.*]] = shufflevector <8 x i8> [[TMP1]], <8 x i8> undef, <8 x i32> zeroinitializer 19; CHECK-NEXT: [[L9:%.*]] = mul <8 x i8> [[TMP2]], [[L8]] 20; CHECK-NEXT: [[L13:%.*]] = getelementptr inbounds i8, ptr [[D:%.*]], i32 [[INDEX]] 21; CHECK-NEXT: store <8 x i8> [[L9]], ptr [[L13]], align 1 22; CHECK-NEXT: [[INDEX_NEXT]] = add i32 [[INDEX]], 8 23; CHECK-NEXT: [[L15:%.*]] = icmp eq i32 [[INDEX_NEXT]], [[N_VEC]] 24; CHECK-NEXT: br i1 [[L15]], label [[EXIT:%.*]], label [[VECTOR_BODY]] 25; CHECK: exit: 26; CHECK-NEXT: ret i8 0 27; 28entry: 29 %n.vec = and i32 %n, -8 30 %l0 = trunc i16 %x to i8 31 %l1 = insertelement <8 x i8> undef, i8 %l0, i32 0 32 %broadcast.splat26 = shufflevector <8 x i8> %l1, <8 x i8> undef, <8 x i32> zeroinitializer 33 br label %vector.body 34 35vector.body: ; preds = %vector.body, %entry 36 %index = phi i32 [ 0, %entry ], [ %index.next, %vector.body ] 37 %l6 = getelementptr inbounds i16, ptr %s1, i32 %index 38 %wide.load = load <8 x i16>, ptr %l6, align 2 39 %l8 = trunc <8 x i16> %wide.load to <8 x i8> 40 %l9 = mul <8 x i8> %broadcast.splat26, %l8 41 %l13 = getelementptr inbounds i8, ptr %d, i32 %index 42 store <8 x i8> %l9, ptr %l13, align 1 43 %index.next = add i32 %index, 8 44 %l15 = icmp eq i32 %index.next, %n.vec 45 br i1 %l15, label %exit, label %vector.body 46 47exit: ; preds = %vector.body 48 ret i8 0 49} 50 51; Same as above, but the shuffle has an extra use meaning it shouldnt be deleted 52define signext i8 @alive(ptr noalias nocapture readonly %s1, i16 zeroext %x, ptr noalias nocapture %d, i32 %n) { 53; CHECK-LABEL: @alive( 54; CHECK-NEXT: entry: 55; CHECK-NEXT: [[N_VEC:%.*]] = and i32 [[N:%.*]], -8 56; CHECK-NEXT: [[L0:%.*]] = trunc i16 [[X:%.*]] to i8 57; CHECK-NEXT: [[L1:%.*]] = insertelement <8 x i8> undef, i8 [[L0]], i32 0 58; CHECK-NEXT: [[BROADCAST_SPLAT26:%.*]] = shufflevector <8 x i8> [[L1]], <8 x i8> undef, <8 x i32> zeroinitializer 59; CHECK-NEXT: [[L2:%.*]] = sub <8 x i8> zeroinitializer, [[BROADCAST_SPLAT26]] 60; CHECK-NEXT: br label [[VECTOR_BODY:%.*]] 61; CHECK: vector.body: 62; CHECK-NEXT: [[INDEX:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ [[INDEX_NEXT:%.*]], [[VECTOR_BODY]] ] 63; CHECK-NEXT: [[TMP0:%.*]] = trunc i16 [[X]] to i8 64; CHECK-NEXT: [[L6:%.*]] = getelementptr inbounds i16, ptr [[S1:%.*]], i32 [[INDEX]] 65; CHECK-NEXT: [[WIDE_LOAD:%.*]] = load <8 x i16>, ptr [[L6]], align 2 66; CHECK-NEXT: [[L8:%.*]] = trunc <8 x i16> [[WIDE_LOAD]] to <8 x i8> 67; CHECK-NEXT: [[TMP1:%.*]] = insertelement <8 x i8> undef, i8 [[TMP0]], i32 0 68; CHECK-NEXT: [[TMP2:%.*]] = shufflevector <8 x i8> [[TMP1]], <8 x i8> undef, <8 x i32> zeroinitializer 69; CHECK-NEXT: [[L9:%.*]] = mul <8 x i8> [[TMP2]], [[L8]] 70; CHECK-NEXT: [[L13:%.*]] = getelementptr inbounds i8, ptr [[D:%.*]], i32 [[INDEX]] 71; CHECK-NEXT: store <8 x i8> [[L9]], ptr [[L13]], align 1 72; CHECK-NEXT: [[INDEX_NEXT]] = add i32 [[INDEX]], 8 73; CHECK-NEXT: [[L15:%.*]] = icmp eq i32 [[INDEX_NEXT]], [[N_VEC]] 74; CHECK-NEXT: br i1 [[L15]], label [[EXIT:%.*]], label [[VECTOR_BODY]] 75; CHECK: exit: 76; CHECK-NEXT: ret i8 0 77; 78entry: 79 %n.vec = and i32 %n, -8 80 %l0 = trunc i16 %x to i8 81 %l1 = insertelement <8 x i8> undef, i8 %l0, i32 0 82 %broadcast.splat26 = shufflevector <8 x i8> %l1, <8 x i8> undef, <8 x i32> zeroinitializer 83 %l2 = sub <8 x i8> zeroinitializer, %broadcast.splat26 84 br label %vector.body 85 86vector.body: ; preds = %vector.body, %entry 87 %index = phi i32 [ 0, %entry ], [ %index.next, %vector.body ] 88 %l6 = getelementptr inbounds i16, ptr %s1, i32 %index 89 %wide.load = load <8 x i16>, ptr %l6, align 2 90 %l8 = trunc <8 x i16> %wide.load to <8 x i8> 91 %l9 = mul <8 x i8> %broadcast.splat26, %l8 92 %l13 = getelementptr inbounds i8, ptr %d, i32 %index 93 store <8 x i8> %l9, ptr %l13, align 1 94 %index.next = add i32 %index, 8 95 %l15 = icmp eq i32 %index.next, %n.vec 96 br i1 %l15, label %exit, label %vector.body 97 98exit: ; preds = %vector.body 99 ret i8 0 100} 101