xref: /llvm-project/llvm/test/Transforms/SLPVectorizer/X86/buildvector-shuffle.ll (revision 8b56da5e9f3ba737a5ff4bf5dee654416849042f)
1; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
2; RUN: opt -S -passes=slp-vectorizer -mtriple=x86_64-unknown-linux-gnu < %s | FileCheck %s
3
; @b: four scalar expression chains, one per output lane. Each chain runs a
; value through the scalar llvm.fmuladd intrinsic (with 0.0 as the second and
; third operand), multiplies it, divides it by 0.0 and stores the quotient to
; one of four consecutive float slots (indices 0..3) addressed off an undef
; pointer. The autogenerated assertions inside the function expect the
; slp-vectorizer run to emit a single <4 x float> llvm.fmuladd call, one
; <4 x float> fmul, one <4 x float> fdiv and one <4 x float> store, with the
; first fmuladd operand assembled from constants by an
; insertelement / shufflevector / insertelement sequence.
; NOTE(review): that operand build sequence is presumably what the test is
; guarding, judging by the file name - confirm against the originating commit.
4define void @b() {
5; CHECK-LABEL: @b(
6; CHECK-NEXT:  entry:
7; CHECK-NEXT:    [[TMP0:%.*]] = insertelement <4 x float> poison, float 0x7FF8000000000000, i32 0
8; CHECK-NEXT:    [[TMP1:%.*]] = shufflevector <4 x float> [[TMP0]], <4 x float> <float 0xFFF8000000000000, float 0xFFF8000000000000, float undef, float undef>, <4 x i32> <i32 0, i32 4, i32 5, i32 poison>
9; CHECK-NEXT:    [[TMP2:%.*]] = insertelement <4 x float> [[TMP1]], float 0x7FF8000000000000, i32 3
10; CHECK-NEXT:    [[TMP3:%.*]] = call <4 x float> @llvm.fmuladd.v4f32(<4 x float> [[TMP2]], <4 x float> zeroinitializer, <4 x float> zeroinitializer)
11; CHECK-NEXT:    [[TMP4:%.*]] = fmul <4 x float> [[TMP3]], <float undef, float undef, float undef, float 2.000000e+00>
12; CHECK-NEXT:    [[TMP5:%.*]] = fdiv <4 x float> [[TMP4]], zeroinitializer
13; CHECK-NEXT:    store <4 x float> [[TMP5]], ptr undef, align 4
14; CHECK-NEXT:    ret void
15;
16entry:
  ; Lane 0 chain: fmuladd of %mul, then multiplied by undef.
17  %mul = fmul float undef, 2.000000e+00
18  %i = tail call float @llvm.fmuladd.f32(float %mul, float 0.000000e+00, float 0.000000e+00)
19  %mul2 = fmul float undef, %i
  ; Lane 1 chain: fmuladd of the negated %add, then multiplied by undef.
20  %add = fadd float undef, 1.000000e+00
21  %neg = fneg float %add
22  %i1 = tail call float @llvm.fmuladd.f32(float %neg, float 0.000000e+00, float 0.000000e+00)
23  %mul4 = fmul float undef, %i1
  ; Lane 2 chain: fmuladd of the negated %mul (shared with lane 0), then
  ; multiplied by undef.
24  %neg7 = fneg float %mul
25  %i2 = tail call float @llvm.fmuladd.f32(float %neg7, float 0.000000e+00, float 0.000000e+00)
26  %mul8 = fmul float undef, %i2
  ; Lane 3 chain: fmuladd of %add (shared with lane 1); unlike the other lanes
  ; the following fmul uses the constant 2.0 instead of undef.
27  %i3 = tail call float @llvm.fmuladd.f32(float %add, float 0.000000e+00, float 0.000000e+00)
28  %mul11 = fmul float %i3, 2.000000e+00
  ; Divide each lane by 0.0 and store to float indices 0, 1, 2 and 3 relative
  ; to the undef base pointer; these four stores are what the expected output
  ; replaces with a single <4 x float> store.
29  %div = fdiv float %mul2, 0.000000e+00
30  store float %div, ptr undef, align 4
31  %div12 = fdiv float %mul4, 0.000000e+00
32  %arrayidx13 = getelementptr inbounds float, ptr undef, i64 1
33  store float %div12, ptr %arrayidx13, align 4
34  %div14 = fdiv float %mul8, 0.000000e+00
35  %arrayidx15 = getelementptr inbounds float, ptr undef, i64 2
36  store float %div14, ptr %arrayidx15, align 4
37  %div16 = fdiv float %mul11, 0.000000e+00
38  %arrayidx17 = getelementptr inbounds float, ptr undef, i64 3
39  store float %div16, ptr %arrayidx17, align 4
40  ret void
41}
42
; Declaration of the scalar float llvm.fmuladd intrinsic (three float operands,
; float result); @b calls it once per lane.
43declare float @llvm.fmuladd.f32(float, float, float)
44
; @test: the loop block branches back to itself and never exits. It computes
; the same scalar expression (0.0 + %a) twice and inserts the results into a
; <2 x float>, writing lane 1 twice: first with %add23.i, then again with
; %add.i157. The autogenerated assertions expect a two-lane splat of %a built
; in the entry block, a single <2 x float> fadd in the loop, and a
; shufflevector with an all-zero mask applied to that fadd result.
45define void @test(float %a) {
46; CHECK-LABEL: @test(
47; CHECK-NEXT:  entry:
48; CHECK-NEXT:    [[TMP0:%.*]] = insertelement <2 x float> poison, float [[A:%.*]], i32 0
49; CHECK-NEXT:    [[SHUFFLE:%.*]] = shufflevector <2 x float> [[TMP0]], <2 x float> poison, <2 x i32> zeroinitializer
50; CHECK-NEXT:    br label [[LOOP:%.*]]
51; CHECK:       loop:
52; CHECK-NEXT:    [[TMP1:%.*]] = fadd <2 x float> zeroinitializer, [[SHUFFLE]]
53; CHECK-NEXT:    [[TMP2:%.*]] = shufflevector <2 x float> [[TMP1]], <2 x float> poison, <2 x i32> zeroinitializer
54; CHECK-NEXT:    br label [[LOOP]]
55;
56entry:
57  br label %loop
58
59loop:
  ; Two identical scalar adds feeding the insertelement chain below.
60  %add.i157 = fadd float 0.000000e+00, %a
61  %add23.i = fadd float 0.000000e+00, %a
62  %insert = insertelement <2 x float> zeroinitializer, float %add.i157, i64 0
63  %insert.i = insertelement <2 x float> %insert, float %add23.i, i64 1
  ; Lane 1 is overwritten here, so both lanes of %agg hold %add.i157.
64  %agg = insertelement <2 x float> %insert.i, float %add.i157, i64 1
65  br label %loop
66}
67
; @test1: internal function whose loop block branches back to itself. Every
; fadd operand is either the constant 0.0 or an earlier fadd of constants. The
; insertelement chain fills lane 0 with %2 and lane 1 with %3, then overwrites
; lane 0 with %0. The autogenerated assertions expect the loop body to contain
; only one insertelement of the constant 0.0 into lane 0 of zeroinitializer,
; followed directly by the back-edge branch, i.e. no fadd is left in the
; output.
68define internal void @test1() {
69; CHECK-LABEL: @test1(
70; CHECK-NEXT:  entry:
71; CHECK-NEXT:    br label [[LOOP:%.*]]
72; CHECK:       loop:
73; CHECK-NEXT:    [[DOTSROA_025_4_VEC_INSERT_US_I:%.*]] = insertelement <2 x float> zeroinitializer, float 0.000000e+00, i64 0
74; CHECK-NEXT:    br label [[LOOP]]
75;
76entry:
77  br label %loop
78
79loop:
  ; Two parallel two-step chains of constant additions (%0 -> %2, %1 -> %3).
80  %0 = fadd float 0.000000e+00, 0.000000e+00
81  %1 = fadd float 0.000000e+00, 0.000000e+00
82  %2 = fadd float %0, 0.000000e+00
83  %3 = fadd float %1, 0.000000e+00
84  %.sroa.3.8.vec.insert.i.us.i = insertelement <2 x float> zeroinitializer, float %2, i64 0
85  %.sroa.3.12.vec.insert.i.us.i = insertelement <2 x float> %.sroa.3.8.vec.insert.i.us.i, float %3, i64 1
  ; Lane 0 is written a second time, now with the first-step value %0.
86  %.sroa.025.4.vec.insert.us.i = insertelement <2 x float> %.sroa.3.12.vec.insert.i.us.i, float %0, i64 0
87  br label %loop
88}
89