xref: /llvm-project/llvm/test/Transforms/SLPVectorizer/X86/subvector-minbitwidth-unsigned-value.ll (revision 38fffa630ee80163dc65e759392ad29798905679)
1; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 5
2; RUN: opt -S --passes=slp-vectorizer -mtriple=x86_64-unknown-linux-gnu < %s | FileCheck %s
3
4define i1 @test(i64 %v1, ptr %v2, i32 %v3, i1 %v4) {
5; CHECK-LABEL: define i1 @test(
6; CHECK-SAME: i64 [[V1:%.*]], ptr [[V2:%.*]], i32 [[V3:%.*]], i1 [[V4:%.*]]) {
7; CHECK-NEXT:  [[NEWFUNCROOT:.*:]]
8; CHECK-NEXT:    [[TMP0:%.*]] = insertelement <2 x i64> poison, i64 [[V1]], i32 0
9; CHECK-NEXT:    [[TMP1:%.*]] = shufflevector <2 x i64> [[TMP0]], <2 x i64> poison, <2 x i32> zeroinitializer
10; CHECK-NEXT:    [[TMP2:%.*]] = lshr <2 x i64> [[TMP1]], <i64 32, i64 40>
11; CHECK-NEXT:    [[TMP3:%.*]] = trunc <2 x i64> [[TMP2]] to <2 x i8>
12; CHECK-NEXT:    [[TMP4:%.*]] = and <2 x i8> [[TMP3]], <i8 1, i8 -1>
13; CHECK-NEXT:    [[TMP5:%.*]] = zext <2 x i8> [[TMP4]] to <2 x i32>
14; CHECK-NEXT:    [[TMP6:%.*]] = icmp eq <2 x i32> [[TMP5]], zeroinitializer
15; CHECK-NEXT:    [[TMP7:%.*]] = insertelement <4 x i32> poison, i32 [[V3]], i32 0
16; CHECK-NEXT:    [[TMP8:%.*]] = shufflevector <4 x i32> [[TMP7]], <4 x i32> poison, <4 x i32> <i32 poison, i32 poison, i32 0, i32 0>
17; CHECK-NEXT:    [[TMP9:%.*]] = zext <2 x i8> [[TMP4]] to <2 x i32>
18; CHECK-NEXT:    [[TMP10:%.*]] = call <4 x i32> @llvm.vector.insert.v4i32.v2i32(<4 x i32> [[TMP8]], <2 x i32> [[TMP9]], i64 0)
19; CHECK-NEXT:    [[TMP11:%.*]] = uitofp <4 x i32> [[TMP10]] to <4 x float>
20; CHECK-NEXT:    [[TMP12:%.*]] = fdiv <4 x float> zeroinitializer, [[TMP11]]
21; CHECK-NEXT:    [[TMP13:%.*]] = insertelement <4 x i1> poison, i1 [[V4]], i32 0
22; CHECK-NEXT:    [[TMP14:%.*]] = shufflevector <4 x i1> [[TMP13]], <4 x i1> poison, <4 x i32> <i32 poison, i32 poison, i32 0, i32 0>
23; CHECK-NEXT:    [[TMP15:%.*]] = call <4 x i1> @llvm.vector.insert.v4i1.v2i1(<4 x i1> [[TMP14]], <2 x i1> [[TMP6]], i64 0)
24; CHECK-NEXT:    [[TMP16:%.*]] = select <4 x i1> [[TMP15]], <4 x float> zeroinitializer, <4 x float> [[TMP12]]
25; CHECK-NEXT:    [[TMP17:%.*]] = extractelement <4 x float> [[TMP16]], i32 3
26; CHECK-NEXT:    [[CONV_I_I1743_3:%.*]] = fptoui float [[TMP17]] to i32
27; CHECK-NEXT:    [[TMP18:%.*]] = icmp ne i32 [[CONV_I_I1743_3]], 0
28; CHECK-NEXT:    [[TMP19:%.*]] = bitcast <4 x float> [[TMP16]] to <4 x i32>
29; CHECK-NEXT:    [[TMP20:%.*]] = icmp ult <4 x i32> [[TMP19]], splat (i32 1333788672)
30; CHECK-NEXT:    [[TMP21:%.*]] = extractelement <4 x i1> [[TMP20]], i32 3
31; CHECK-NEXT:    [[NARROW:%.*]] = select i1 [[TMP21]], i1 [[TMP18]], i1 false
32; CHECK-NEXT:    [[TMP22:%.*]] = extractelement <4 x float> [[TMP16]], i32 2
33; CHECK-NEXT:    [[CONV_I_I1743_2:%.*]] = fptoui float [[TMP22]] to i32
34; CHECK-NEXT:    [[TMP23:%.*]] = extractelement <4 x i1> [[TMP20]], i32 2
35; CHECK-NEXT:    [[NARROW1:%.*]] = select i1 [[TMP23]], i32 [[CONV_I_I1743_2]], i32 0
36; CHECK-NEXT:    [[TMP24:%.*]] = zext i1 [[NARROW]] to i32
37; CHECK-NEXT:    [[TMP25:%.*]] = or i32 [[NARROW1]], [[TMP24]]
38; CHECK-NEXT:    [[TMP26:%.*]] = extractelement <4 x float> [[TMP16]], i32 1
39; CHECK-NEXT:    [[CONV_I_I1743_1:%.*]] = fptoui float [[TMP26]] to i32
40; CHECK-NEXT:    [[TMP27:%.*]] = extractelement <4 x i1> [[TMP20]], i32 1
41; CHECK-NEXT:    [[NARROW2:%.*]] = select i1 [[TMP27]], i32 [[CONV_I_I1743_1]], i32 0
42; CHECK-NEXT:    [[RV3:%.*]] = or i32 [[TMP25]], [[NARROW2]]
43; CHECK-NEXT:    [[TMP28:%.*]] = extractelement <4 x float> [[TMP16]], i32 0
44; CHECK-NEXT:    [[CONV_I_I1743:%.*]] = fptoui float [[TMP28]] to i32
45; CHECK-NEXT:    [[TMP29:%.*]] = extractelement <4 x i1> [[TMP20]], i32 0
46; CHECK-NEXT:    [[NARROW4:%.*]] = select i1 [[TMP29]], i32 [[CONV_I_I1743]], i32 0
47; CHECK-NEXT:    [[RT5:%.*]] = or i32 [[RV3]], [[NARROW4]]
48; CHECK-NEXT:    [[RT:%.*]] = zext i32 [[RT5]] to i64
49; CHECK-NEXT:    store i64 [[RT]], ptr [[V2]], align 1
50; CHECK-NEXT:    ret i1 false
51;
52newFuncRoot:
53  %conv.i147.i1756.3 = uitofp i32 %v3 to float
54  %div.i.i.i1749.3 = fdiv float 0.000000e+00, %conv.i147.i1756.3
55  %cond.i.i.i1751.3 = select i1 %v4, float 0.000000e+00, float %div.i.i.i1749.3
56  %conv.i147.i1756.2 = uitofp i32 %v3 to float
57  %div.i.i.i1749.2 = fdiv float 0.000000e+00, %conv.i147.i1756.2
58  %cond.i.i.i1751.2 = select i1 %v4, float 0.000000e+00, float %div.i.i.i1749.2
59  %0 = lshr i64 %v1, 40
60  %1 = trunc i64 %0 to i32
61  %tt2 = and i32 %1, 255
62  %cmp1.i.i.i1746.1 = icmp eq i32 %tt2, 0
63  %conv.i147.i1756.1 = uitofp i32 %tt2 to float
64  %div.i.i.i1749.1 = fdiv float 0.000000e+00, %conv.i147.i1756.1
65  %cond.i.i.i1751.1 = select i1 %cmp1.i.i.i1746.1, float 0.000000e+00, float %div.i.i.i1749.1
66  %tt3 = lshr i64 %v1, 32
67  %2 = trunc i64 %tt3 to i32
68  %tt1 = and i32 %2, 1
69  %cmp1.i.i.i1746 = icmp eq i32 %tt1, 0
70  %conv.i147.i1756 = uitofp i32 %tt1 to float
71  %div.i.i.i1749 = fdiv float 0.000000e+00, %conv.i147.i1756
72  %cond.i.i.i1751 = select i1 %cmp1.i.i.i1746, float 0.000000e+00, float %div.i.i.i1749
73  %3 = bitcast float %cond.i.i.i1751.3 to i32
74  %cmp.i99.i1736.3 = icmp ult i32 %3, 1333788672
75  %conv.i.i1743.3 = fptoui float %cond.i.i.i1751.3 to i32
76  %4 = icmp ne i32 %conv.i.i1743.3, 0
77  %narrow = select i1 %cmp.i99.i1736.3, i1 %4, i1 false
78  %5 = bitcast float %cond.i.i.i1751.2 to i32
79  %cmp.i99.i1736.2 = icmp ult i32 %5, 1333788672
80  %conv.i.i1743.2 = fptoui float %cond.i.i.i1751.2 to i32
81  %narrow1 = select i1 %cmp.i99.i1736.2, i32 %conv.i.i1743.2, i32 0
82  %6 = zext i1 %narrow to i32
83  %7 = or i32 %narrow1, %6
84  %8 = bitcast float %cond.i.i.i1751.1 to i32
85  %cmp.i99.i1736.1 = icmp ult i32 %8, 1333788672
86  %conv.i.i1743.1 = fptoui float %cond.i.i.i1751.1 to i32
87  %narrow2 = select i1 %cmp.i99.i1736.1, i32 %conv.i.i1743.1, i32 0
88  %rv3 = or i32 %7, %narrow2
89  %9 = bitcast float %cond.i.i.i1751 to i32
90  %cmp.i99.i1736 = icmp ult i32 %9, 1333788672
91  %conv.i.i1743 = fptoui float %cond.i.i.i1751 to i32
92  %narrow4 = select i1 %cmp.i99.i1736, i32 %conv.i.i1743, i32 0
93  %rt5 = or i32 %rv3, %narrow4
94  %rt = zext i32 %rt5 to i64
95  store i64 %rt, ptr %v2, align 1
96  ret i1 false
97}
98