xref: /llvm-project/llvm/test/Transforms/CodeGenPrepare/ARM/sinkchain.ll (revision d9e51e75521d5e33f24a6c1afacae5dbc115f96d)
1; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
2; RUN: opt -mtriple=thumbv8.1m.main-none-none-eabi -mattr=+mve.fp < %s -codegenprepare -S | FileCheck -check-prefix=CHECK %s
3; RUN: opt -mtriple=thumbv8.1m.main-none-none-eabi -mattr=+mve.fp < %s -codegenprepare -cgpp-huge-func=0 -S | FileCheck -check-prefix=CHECK %s
4
5; Sink the shufflevector/insertelement pair, followed by the trunc. The sunk instruction end up dead.
6define signext i8 @dead(ptr noalias nocapture readonly %s1, i16 zeroext %x, ptr noalias nocapture %d, i32 %n) {
7; CHECK-LABEL: @dead(
8; CHECK-NEXT:  entry:
9; CHECK-NEXT:    [[N_VEC:%.*]] = and i32 [[N:%.*]], -8
10; CHECK-NEXT:    br label [[VECTOR_BODY:%.*]]
11; CHECK:       vector.body:
12; CHECK-NEXT:    [[INDEX:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ [[INDEX_NEXT:%.*]], [[VECTOR_BODY]] ]
13; CHECK-NEXT:    [[TMP0:%.*]] = trunc i16 [[X:%.*]] to i8
14; CHECK-NEXT:    [[L6:%.*]] = getelementptr inbounds i16, ptr [[S1:%.*]], i32 [[INDEX]]
15; CHECK-NEXT:    [[WIDE_LOAD:%.*]] = load <8 x i16>, ptr [[L6]], align 2
16; CHECK-NEXT:    [[L8:%.*]] = trunc <8 x i16> [[WIDE_LOAD]] to <8 x i8>
17; CHECK-NEXT:    [[TMP1:%.*]] = insertelement <8 x i8> undef, i8 [[TMP0]], i32 0
18; CHECK-NEXT:    [[TMP2:%.*]] = shufflevector <8 x i8> [[TMP1]], <8 x i8> undef, <8 x i32> zeroinitializer
19; CHECK-NEXT:    [[L9:%.*]] = mul <8 x i8> [[TMP2]], [[L8]]
20; CHECK-NEXT:    [[L13:%.*]] = getelementptr inbounds i8, ptr [[D:%.*]], i32 [[INDEX]]
21; CHECK-NEXT:    store <8 x i8> [[L9]], ptr [[L13]], align 1
22; CHECK-NEXT:    [[INDEX_NEXT]] = add i32 [[INDEX]], 8
23; CHECK-NEXT:    [[L15:%.*]] = icmp eq i32 [[INDEX_NEXT]], [[N_VEC]]
24; CHECK-NEXT:    br i1 [[L15]], label [[EXIT:%.*]], label [[VECTOR_BODY]]
25; CHECK:       exit:
26; CHECK-NEXT:    ret i8 0
27;
28entry:
29  %n.vec = and i32 %n, -8
30  %l0 = trunc i16 %x to i8
31  %l1 = insertelement <8 x i8> undef, i8 %l0, i32 0
32  %broadcast.splat26 = shufflevector <8 x i8> %l1, <8 x i8> undef, <8 x i32> zeroinitializer
33  br label %vector.body
34
35vector.body:                                      ; preds = %vector.body, %entry
36  %index = phi i32 [ 0, %entry ], [ %index.next, %vector.body ]
37  %l6 = getelementptr inbounds i16, ptr %s1, i32 %index
38  %wide.load = load <8 x i16>, ptr %l6, align 2
39  %l8 = trunc <8 x i16> %wide.load to <8 x i8>
40  %l9 = mul <8 x i8> %broadcast.splat26, %l8
41  %l13 = getelementptr inbounds i8, ptr %d, i32 %index
42  store <8 x i8> %l9, ptr %l13, align 1
43  %index.next = add i32 %index, 8
44  %l15 = icmp eq i32 %index.next, %n.vec
45  br i1 %l15, label %exit, label %vector.body
46
47exit:                                     ; preds = %vector.body
48  ret i8 0
49}
50
51; Same as above, but the shuffle has an extra use meaning it shouldnt be deleted
52define signext i8 @alive(ptr noalias nocapture readonly %s1, i16 zeroext %x, ptr noalias nocapture %d, i32 %n) {
53; CHECK-LABEL: @alive(
54; CHECK-NEXT:  entry:
55; CHECK-NEXT:    [[N_VEC:%.*]] = and i32 [[N:%.*]], -8
56; CHECK-NEXT:    [[L0:%.*]] = trunc i16 [[X:%.*]] to i8
57; CHECK-NEXT:    [[L1:%.*]] = insertelement <8 x i8> undef, i8 [[L0]], i32 0
58; CHECK-NEXT:    [[BROADCAST_SPLAT26:%.*]] = shufflevector <8 x i8> [[L1]], <8 x i8> undef, <8 x i32> zeroinitializer
59; CHECK-NEXT:    [[L2:%.*]] = sub <8 x i8> zeroinitializer, [[BROADCAST_SPLAT26]]
60; CHECK-NEXT:    br label [[VECTOR_BODY:%.*]]
61; CHECK:       vector.body:
62; CHECK-NEXT:    [[INDEX:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ [[INDEX_NEXT:%.*]], [[VECTOR_BODY]] ]
63; CHECK-NEXT:    [[TMP0:%.*]] = trunc i16 [[X]] to i8
64; CHECK-NEXT:    [[L6:%.*]] = getelementptr inbounds i16, ptr [[S1:%.*]], i32 [[INDEX]]
65; CHECK-NEXT:    [[WIDE_LOAD:%.*]] = load <8 x i16>, ptr [[L6]], align 2
66; CHECK-NEXT:    [[L8:%.*]] = trunc <8 x i16> [[WIDE_LOAD]] to <8 x i8>
67; CHECK-NEXT:    [[TMP1:%.*]] = insertelement <8 x i8> undef, i8 [[TMP0]], i32 0
68; CHECK-NEXT:    [[TMP2:%.*]] = shufflevector <8 x i8> [[TMP1]], <8 x i8> undef, <8 x i32> zeroinitializer
69; CHECK-NEXT:    [[L9:%.*]] = mul <8 x i8> [[TMP2]], [[L8]]
70; CHECK-NEXT:    [[L13:%.*]] = getelementptr inbounds i8, ptr [[D:%.*]], i32 [[INDEX]]
71; CHECK-NEXT:    store <8 x i8> [[L9]], ptr [[L13]], align 1
72; CHECK-NEXT:    [[INDEX_NEXT]] = add i32 [[INDEX]], 8
73; CHECK-NEXT:    [[L15:%.*]] = icmp eq i32 [[INDEX_NEXT]], [[N_VEC]]
74; CHECK-NEXT:    br i1 [[L15]], label [[EXIT:%.*]], label [[VECTOR_BODY]]
75; CHECK:       exit:
76; CHECK-NEXT:    ret i8 0
77;
78entry:
79  %n.vec = and i32 %n, -8
80  %l0 = trunc i16 %x to i8
81  %l1 = insertelement <8 x i8> undef, i8 %l0, i32 0
82  %broadcast.splat26 = shufflevector <8 x i8> %l1, <8 x i8> undef, <8 x i32> zeroinitializer
83  %l2 = sub <8 x i8> zeroinitializer, %broadcast.splat26
84  br label %vector.body
85
86vector.body:                                      ; preds = %vector.body, %entry
87  %index = phi i32 [ 0, %entry ], [ %index.next, %vector.body ]
88  %l6 = getelementptr inbounds i16, ptr %s1, i32 %index
89  %wide.load = load <8 x i16>, ptr %l6, align 2
90  %l8 = trunc <8 x i16> %wide.load to <8 x i8>
91  %l9 = mul <8 x i8> %broadcast.splat26, %l8
92  %l13 = getelementptr inbounds i8, ptr %d, i32 %index
93  store <8 x i8> %l9, ptr %l13, align 1
94  %index.next = add i32 %index, 8
95  %l15 = icmp eq i32 %index.next, %n.vec
96  br i1 %l15, label %exit, label %vector.body
97
98exit:                                     ; preds = %vector.body
99  ret i8 0
100}
101