; xref: /llvm-project/llvm/test/Transforms/SLPVectorizer/extract-many-users-buildvector.ll (revision 5deb4ef9ab1144542d748f71235b029bed06dd26)
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
; RUN: %if x86-registered-target %{ opt -S -passes=slp-vectorizer -mtriple=x86_64-unknown-linux-gnu < %s | FileCheck %s --check-prefix X86 %}
; RUN: %if aarch64-registered-target %{ opt -S -passes=slp-vectorizer -mtriple=aarch64-unknown-linux-gnu < %s | FileCheck %s --check-prefix AARCH64 %}

; Scalar input for the SLP vectorizer.
;
; The body builds eight float values (%13, %17, %18, %22, %24, %26, %30, %32),
; each an fptrunc of a double-precision fmul or fsub. Every one of them is
; multiplied by 0.0, compared with `fcmp oeq` against 0.0, and the eight i1
; results are folded together by a chain of `select i1 a, i1 b, i1 false`.
; Several intermediate values (%1, %4, %5, %6, %9) feed more than one
; instruction.
;
; The expected output under both check prefixes is an <8 x float>
; fmul / fcmp oeq whose mask is frozen and reduced with
; @llvm.vector.reduce.and.v8i1. The two prefixes differ only in how the
; second operand of the <4 x double> fmul is assembled: the AARCH64 checks
; contain one extra shufflevector that takes a lane from the fpext result.
;
; The check lines below are autogenerated (see the NOTE line at the top of the
; file); regenerate them with utils/update_test_checks.py rather than editing
; them by hand.
define i1 @test(float %0, double %1) {
; X86-LABEL: define i1 @test
; X86-SAME: (float [[TMP0:%.*]], double [[TMP1:%.*]]) {
; X86-NEXT:    [[TMP3:%.*]] = insertelement <4 x float> <float 0.000000e+00, float 0.000000e+00, float 0.000000e+00, float poison>, float [[TMP0]], i32 3
; X86-NEXT:    [[TMP4:%.*]] = fpext <4 x float> [[TMP3]] to <4 x double>
; X86-NEXT:    [[TMP5:%.*]] = insertelement <6 x double> <double poison, double poison, double poison, double poison, double poison, double 0.000000e+00>, double [[TMP1]], i32 4
; X86-NEXT:    [[TMP6:%.*]] = shufflevector <4 x double> [[TMP4]], <4 x double> poison, <6 x i32> <i32 0, i32 1, i32 2, i32 3, i32 poison, i32 poison>
; X86-NEXT:    [[TMP7:%.*]] = shufflevector <6 x double> [[TMP5]], <6 x double> [[TMP6]], <6 x i32> <i32 6, i32 7, i32 8, i32 9, i32 4, i32 5>
; X86-NEXT:    [[TMP8:%.*]] = fmul <6 x double> zeroinitializer, [[TMP7]]
; X86-NEXT:    [[TMP9:%.*]] = shufflevector <6 x double> [[TMP7]], <6 x double> [[TMP8]], <4 x i32> <i32 poison, i32 4, i32 11, i32 11>
; X86-NEXT:    [[TMP10:%.*]] = shufflevector <4 x double> [[TMP9]], <4 x double> <double 0.000000e+00, double poison, double poison, double poison>, <4 x i32> <i32 4, i32 1, i32 2, i32 3>
; X86-NEXT:    [[TMP11:%.*]] = shufflevector <6 x double> [[TMP7]], <6 x double> poison, <4 x i32> <i32 2, i32 0, i32 1, i32 poison>
; X86-NEXT:    [[TMP12:%.*]] = shufflevector <4 x double> [[TMP11]], <4 x double> <double poison, double poison, double poison, double 0.000000e+00>, <4 x i32> <i32 0, i32 1, i32 2, i32 7>
; X86-NEXT:    [[TMP13:%.*]] = fmul <4 x double> [[TMP10]], [[TMP12]]
; X86-NEXT:    [[TMP14:%.*]] = call <8 x double> @llvm.vector.insert.v8f64.v4f64(<8 x double> <double poison, double poison, double poison, double poison, double 0.000000e+00, double 0.000000e+00, double 0.000000e+00, double 0.000000e+00>, <4 x double> [[TMP13]], i64 0)
; X86-NEXT:    [[TMP15:%.*]] = call <8 x double> @llvm.vector.insert.v8f64.v6f64(<8 x double> <double poison, double poison, double poison, double poison, double poison, double poison, double 0.000000e+00, double 0.000000e+00>, <6 x double> [[TMP8]], i64 0)
; X86-NEXT:    [[TMP16:%.*]] = fsub <8 x double> [[TMP14]], [[TMP15]]
; X86-NEXT:    [[TMP17:%.*]] = fmul <8 x double> [[TMP14]], [[TMP15]]
; X86-NEXT:    [[TMP18:%.*]] = shufflevector <8 x double> [[TMP16]], <8 x double> [[TMP17]], <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 13, i32 14, i32 15>
; X86-NEXT:    [[TMP19:%.*]] = fptrunc <8 x double> [[TMP18]] to <8 x float>
; X86-NEXT:    [[TMP20:%.*]] = fmul <8 x float> [[TMP19]], zeroinitializer
; X86-NEXT:    [[TMP21:%.*]] = fcmp oeq <8 x float> [[TMP20]], zeroinitializer
; X86-NEXT:    [[TMP22:%.*]] = freeze <8 x i1> [[TMP21]]
; X86-NEXT:    [[TMP23:%.*]] = call i1 @llvm.vector.reduce.and.v8i1(<8 x i1> [[TMP22]])
; X86-NEXT:    ret i1 [[TMP23]]
;
; AARCH64-LABEL: define i1 @test
; AARCH64-SAME: (float [[TMP0:%.*]], double [[TMP1:%.*]]) {
; AARCH64-NEXT:    [[TMP3:%.*]] = insertelement <4 x float> <float 0.000000e+00, float 0.000000e+00, float 0.000000e+00, float poison>, float [[TMP0]], i32 3
; AARCH64-NEXT:    [[TMP4:%.*]] = fpext <4 x float> [[TMP3]] to <4 x double>
; AARCH64-NEXT:    [[TMP5:%.*]] = insertelement <6 x double> <double poison, double poison, double poison, double poison, double poison, double 0.000000e+00>, double [[TMP1]], i32 4
; AARCH64-NEXT:    [[TMP6:%.*]] = shufflevector <4 x double> [[TMP4]], <4 x double> poison, <6 x i32> <i32 0, i32 1, i32 2, i32 3, i32 poison, i32 poison>
; AARCH64-NEXT:    [[TMP7:%.*]] = shufflevector <6 x double> [[TMP5]], <6 x double> [[TMP6]], <6 x i32> <i32 6, i32 7, i32 8, i32 9, i32 4, i32 5>
; AARCH64-NEXT:    [[TMP8:%.*]] = fmul <6 x double> zeroinitializer, [[TMP7]]
; AARCH64-NEXT:    [[TMP9:%.*]] = shufflevector <6 x double> [[TMP7]], <6 x double> [[TMP8]], <4 x i32> <i32 poison, i32 4, i32 11, i32 11>
; AARCH64-NEXT:    [[TMP10:%.*]] = shufflevector <4 x double> [[TMP9]], <4 x double> <double 0.000000e+00, double poison, double poison, double poison>, <4 x i32> <i32 4, i32 1, i32 2, i32 3>
; AARCH64-NEXT:    [[TMP11:%.*]] = shufflevector <6 x double> [[TMP7]], <6 x double> poison, <4 x i32> <i32 2, i32 0, i32 poison, i32 poison>
; AARCH64-NEXT:    [[TMP12:%.*]] = shufflevector <4 x double> [[TMP11]], <4 x double> <double poison, double poison, double poison, double 0.000000e+00>, <4 x i32> <i32 0, i32 1, i32 poison, i32 7>
; AARCH64-NEXT:    [[TMP13:%.*]] = shufflevector <4 x double> [[TMP12]], <4 x double> [[TMP4]], <4 x i32> <i32 0, i32 1, i32 5, i32 3>
; AARCH64-NEXT:    [[TMP14:%.*]] = fmul <4 x double> [[TMP10]], [[TMP13]]
; AARCH64-NEXT:    [[TMP15:%.*]] = call <8 x double> @llvm.vector.insert.v8f64.v4f64(<8 x double> <double poison, double poison, double poison, double poison, double 0.000000e+00, double 0.000000e+00, double 0.000000e+00, double 0.000000e+00>, <4 x double> [[TMP14]], i64 0)
; AARCH64-NEXT:    [[TMP16:%.*]] = call <8 x double> @llvm.vector.insert.v8f64.v6f64(<8 x double> <double poison, double poison, double poison, double poison, double poison, double poison, double 0.000000e+00, double 0.000000e+00>, <6 x double> [[TMP8]], i64 0)
; AARCH64-NEXT:    [[TMP17:%.*]] = fsub <8 x double> [[TMP15]], [[TMP16]]
; AARCH64-NEXT:    [[TMP18:%.*]] = fmul <8 x double> [[TMP15]], [[TMP16]]
; AARCH64-NEXT:    [[TMP19:%.*]] = shufflevector <8 x double> [[TMP17]], <8 x double> [[TMP18]], <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 13, i32 14, i32 15>
; AARCH64-NEXT:    [[TMP20:%.*]] = fptrunc <8 x double> [[TMP19]] to <8 x float>
; AARCH64-NEXT:    [[TMP21:%.*]] = fmul <8 x float> [[TMP20]], zeroinitializer
; AARCH64-NEXT:    [[TMP22:%.*]] = fcmp oeq <8 x float> [[TMP21]], zeroinitializer
; AARCH64-NEXT:    [[TMP23:%.*]] = freeze <8 x i1> [[TMP22]]
; AARCH64-NEXT:    [[TMP24:%.*]] = call i1 @llvm.vector.reduce.and.v8i1(<8 x i1> [[TMP23]])
; AARCH64-NEXT:    ret i1 [[TMP24]]
;
  ; Widen the float argument and three constant-zero floats to double.
  %3 = fpext float %0 to double
  %4 = fpext float 0.000000e+00 to double
  %5 = fpext float 0.000000e+00 to double
  %6 = fpext float 0.000000e+00 to double
  ; Double-precision products and differences, each narrowed back to float.
  ; %9, %4, %5, %6 and %1 are each consumed by more than one instruction.
  %7 = fmul double 0.000000e+00, 0.000000e+00
  %8 = fmul double 0.000000e+00, %1
  %9 = fmul double 0.000000e+00, 0.000000e+00
  %10 = fmul double 0.000000e+00, %5
  %11 = fmul double 0.000000e+00, %6
  %12 = fsub double %10, %11
  %13 = fptrunc double %12 to float
  %14 = fmul double %9, 0.000000e+00
  %15 = fmul double 0.000000e+00, %3
  %16 = fsub double %14, %15
  %17 = fptrunc double %16 to float
  %18 = fptrunc double %7 to float
  %19 = fmul double %1, %6
  %20 = fmul double 0.000000e+00, %4
  %21 = fsub double %19, %20
  %22 = fptrunc double %21 to float
  %23 = fsub double 0.000000e+00, %8
  %24 = fptrunc double %23 to float
  %25 = fmul double 0.000000e+00, 0.000000e+00
  %26 = fptrunc double %25 to float
  %27 = fmul double %9, %4
  %28 = fmul double 0.000000e+00, %5
  %29 = fsub double %27, %28
  %30 = fptrunc double %29 to float
  %31 = fmul double %9, 0.000000e+00
  %32 = fptrunc double %31 to float
  ; Eight (fmul by 0.0, fcmp oeq 0.0) pairs combined by a select chain whose
  ; false arm is the constant false; the final select is the return value.
  %33 = fmul float %13, 0.000000e+00
  %34 = fcmp oeq float %33, 0.000000e+00
  %35 = fmul float %22, 0.000000e+00
  %36 = fcmp oeq float %35, 0.000000e+00
  %37 = select i1 %34, i1 %36, i1 false
  %38 = fmul float %30, 0.000000e+00
  %39 = fcmp oeq float %38, 0.000000e+00
  %40 = select i1 %37, i1 %39, i1 false
  %41 = fmul float %17, 0.000000e+00
  %42 = fcmp oeq float %41, 0.000000e+00
  %43 = select i1 %40, i1 %42, i1 false
  %44 = fmul float %24, 0.000000e+00
  %45 = fcmp oeq float %44, 0.000000e+00
  %46 = select i1 %43, i1 %45, i1 false
  %47 = fmul float %32, 0.000000e+00
  %48 = fcmp oeq float %47, 0.000000e+00
  %49 = select i1 %46, i1 %48, i1 false
  %50 = fmul float %18, 0.000000e+00
  %51 = fcmp oeq float %50, 0.000000e+00
  %52 = select i1 %49, i1 %51, i1 false
  %53 = fmul float %26, 0.000000e+00
  %54 = fcmp oeq float %53, 0.000000e+00
  %55 = select i1 %52, i1 %54, i1 false
  ret i1 %55
}
112