xref: /llvm-project/llvm/test/Transforms/SLPVectorizer/X86/bv-shuffle-mask.ll (revision 681c83a2f99431d4bb9d4975a08771320e30a80b)
1; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 5
2; RUN: opt -S --passes=slp-vectorizer -mtriple=x86_64-unknown-linux-gnu < %s | FileCheck %s
3
4define i16 @test(i16 %v1, i16 %v2) {
5; CHECK-LABEL: define i16 @test(
6; CHECK-SAME: i16 [[V1:%.*]], i16 [[V2:%.*]]) {
7; CHECK-NEXT:  [[ENTRY:.*:]]
8; CHECK-NEXT:    [[TMP0:%.*]] = insertelement <4 x i16> <i16 0, i16 0, i16 0, i16 poison>, i16 [[V2]], i32 3
9; CHECK-NEXT:    [[TMP1:%.*]] = insertelement <4 x i16> <i16 0, i16 0, i16 0, i16 poison>, i16 [[V1]], i32 3
10; CHECK-NEXT:    [[TMP2:%.*]] = or <4 x i16> [[TMP0]], [[TMP1]]
11; CHECK-NEXT:    [[TMP3:%.*]] = and <4 x i16> [[TMP0]], [[TMP1]]
12; CHECK-NEXT:    [[TMP4:%.*]] = shufflevector <4 x i16> [[TMP2]], <4 x i16> [[TMP3]], <4 x i32> <i32 0, i32 1, i32 2, i32 7>
13; CHECK-NEXT:    [[TMP5:%.*]] = shufflevector <4 x i16> [[TMP0]], <4 x i16> poison, <2 x i32> <i32 poison, i32 3>
14; CHECK-NEXT:    [[TMP6:%.*]] = insertelement <2 x i16> [[TMP5]], i16 [[V1]], i32 0
15; CHECK-NEXT:    [[TMP7:%.*]] = shufflevector <2 x i16> [[TMP6]], <2 x i16> poison, <4 x i32> <i32 0, i32 0, i32 0, i32 1>
16; CHECK-NEXT:    [[TMP8:%.*]] = or <4 x i16> [[TMP7]], zeroinitializer
17; CHECK-NEXT:    [[TMP9:%.*]] = and <4 x i16> [[TMP4]], zeroinitializer
18; CHECK-NEXT:    [[TMP10:%.*]] = and <4 x i16> [[TMP9]], zeroinitializer
19; CHECK-NEXT:    [[TMP11:%.*]] = icmp ne <4 x i16> [[TMP10]], zeroinitializer
20; CHECK-NEXT:    [[TMP12:%.*]] = or <4 x i1> [[TMP11]], zeroinitializer
21; CHECK-NEXT:    [[TMP13:%.*]] = or <4 x i16> [[TMP8]], zeroinitializer
22; CHECK-NEXT:    [[TMP14:%.*]] = or <4 x i16> [[TMP13]], zeroinitializer
23; CHECK-NEXT:    [[TMP15:%.*]] = or <4 x i16> [[TMP14]], zeroinitializer
24; CHECK-NEXT:    [[TMP16:%.*]] = icmp ne <4 x i16> [[TMP15]], zeroinitializer
25; CHECK-NEXT:    [[TMP17:%.*]] = or <4 x i1> zeroinitializer, [[TMP16]]
26; CHECK-NEXT:    [[TMP18:%.*]] = or <4 x i1> [[TMP12]], [[TMP17]]
27; CHECK-NEXT:    [[TMP19:%.*]] = extractelement <4 x i1> [[TMP18]], i32 2
28; CHECK-NEXT:    [[TMP20:%.*]] = extractelement <4 x i1> [[TMP18]], i32 3
29; CHECK-NEXT:    [[TMP21:%.*]] = or i1 [[TMP20]], [[TMP19]]
30; CHECK-NEXT:    [[TMP22:%.*]] = extractelement <4 x i1> [[TMP18]], i32 1
31; CHECK-NEXT:    [[TMP23:%.*]] = or i1 false, [[TMP22]]
32; CHECK-NEXT:    [[TMP24:%.*]] = freeze <4 x i1> [[TMP18]]
33; CHECK-NEXT:    [[TMP25:%.*]] = call i1 @llvm.vector.reduce.or.v4i1(<4 x i1> [[TMP24]])
34; CHECK-NEXT:    [[SPEC_SELECT31:%.*]] = select i1 [[TMP25]], i32 0, i32 0
35; CHECK-NEXT:    [[TMP26:%.*]] = extractelement <4 x i1> [[TMP18]], i32 0
36; CHECK-NEXT:    [[TMP27:%.*]] = or i1 false, [[TMP26]]
37; CHECK-NEXT:    store i32 [[SPEC_SELECT31]], ptr null, align 4
38; CHECK-NEXT:    ret i16 0
39;
40entry:
41  %0 = and i16 %v2, %v1
42  %1 = and i16 %0, 0
43  %2 = and i16 %1, 0
44  %3 = icmp ne i16 %2, 0
45  %.not5.not = or i1 %3, false
46  %inc.1.1.i82.i.i = or i16 %v2, 0
47  %inc.143.1.i98.i.i = or i16 0, 0
48  %4 = or i16 %inc.1.1.i82.i.i, 0
49  %5 = or i16 %4, 0
50  %6 = or i16 %5, 0
51  %7 = icmp ne i16 %6, 0
52  %.not7.not = or i1 false, %7
53  %8 = or i1 %.not5.not, %.not7.not
54  %9 = and i16 0, %inc.143.1.i98.i.i
55  %10 = and i16 %9, 0
56  %11 = icmp ne i16 %10, 0
57  %.not5.not.1 = or i1 %11, false
58  %inc.143.i76.i.i.1 = or i16 %v1, 0
59  %inc.143.1.i98.i.i.1 = or i16 0, 0
60  %12 = or i16 0, %inc.143.i76.i.i.1
61  %13 = or i16 %12, 0
62  %14 = or i16 %13, 0
63  %15 = icmp ne i16 %14, 0
64  %.not7.not.1 = or i1 false, %15
65  %16 = or i1 %.not5.not.1, %.not7.not.1
66  %17 = or i1 %8, %16
67  %18 = and i16 0, %inc.143.1.i98.i.i.1
68  %19 = and i16 %18, 0
69  %20 = icmp ne i16 %19, 0
70  %.not5.not.2 = or i1 %20, false
71  %inc.143.i76.i.i.2 = or i16 %v1, 0
72  %inc.143.1.i98.i.i.2 = or i16 0, 0
73  %21 = or i16 0, %inc.143.i76.i.i.2
74  %22 = or i16 %21, 0
75  %23 = or i16 %22, 0
76  %24 = icmp ne i16 %23, 0
77  %.not7.not.2 = or i1 false, %24
78  %25 = or i1 %.not5.not.2, %.not7.not.2
79  %26 = or i1 false, %25
80  %27 = and i16 0, %inc.143.1.i98.i.i.2
81  %28 = and i16 %27, 0
82  %29 = icmp ne i16 %28, 0
83  %.not5.not.3 = or i1 %29, false
84  %inc.143.i76.i.i.3 = or i16 %v1, 0
85  %30 = or i16 0, %inc.143.i76.i.i.3
86  %31 = or i16 %30, 0
87  %32 = or i16 %31, 0
88  %33 = icmp ne i16 %32, 0
89  %.not7.not.3 = or i1 false, %33
90  %34 = or i1 %.not5.not.3, %.not7.not.3
91  %35 = select i1 %34, i1 true, i1 %25
92  %36 = select i1 %35, i1 true, i1 %16
93  %37 = select i1 %36, i1 true, i1 %8
94  %spec.select31 = select i1 %37, i32 0, i32 0
95  %38 = or i1 false, %34
96  store i32 %spec.select31, ptr null, align 4
97  ret i16 0
98}
99