xref: /llvm-project/llvm/test/Transforms/SLPVectorizer/RISCV/reversed-strided-node-with-external-ptr.ll (revision 3133acf1fbd1cc57ea8e74288ee9a0acd027d749)
1; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 5
2; RUN: opt -S --passes=slp-vectorizer -slp-threshold=-99999 -mtriple=riscv64 -mattr=+v < %s | FileCheck %s
3
; Reduced input for the SLP vectorizer (see the opt invocation at the top of
; this file). The scalar loop body below stores to %a[%0] and to %a[%0 | 1].
; The autogenerated assertions expect:
;   * the two stores to be emitted as one llvm.experimental.vp.strided.store
;     with a stride of -8 whose base pointer is the scalar GEP for %a[%0 | 1];
;   * the loads %1 and %3 to be emitted as one masked gather over a vector GEP;
;   * the loads %4 through %7 to be emitted as two <2 x double> loads from %a.
; NOTE(review): presumably this guards the case where the pointer of the
; reversed strided node also keeps a scalar (external) use; confirm against
; the commit that introduced the test.
4define void @test(ptr %a, i64 %0) {
5; CHECK-LABEL: define void @test(
6; CHECK-SAME: ptr [[A:%.*]], i64 [[TMP0:%.*]]) #[[ATTR0:[0-9]+]] {
7; CHECK-NEXT:  [[ENTRY:.*:]]
8; CHECK-NEXT:    [[TMP1:%.*]] = insertelement <2 x ptr> poison, ptr [[A]], i32 0
9; CHECK-NEXT:    [[TMP2:%.*]] = shufflevector <2 x ptr> [[TMP1]], <2 x ptr> poison, <2 x i32> zeroinitializer
10; CHECK-NEXT:    br label %[[BB:.*]]
11; CHECK:       [[BB]]:
12; CHECK-NEXT:    [[TMP3:%.*]] = or disjoint i64 [[TMP0]], 1
13; CHECK-NEXT:    [[TMP4:%.*]] = insertelement <2 x i64> poison, i64 [[TMP3]], i32 0
14; CHECK-NEXT:    [[TMP5:%.*]] = insertelement <2 x i64> [[TMP4]], i64 0, i32 1
15; CHECK-NEXT:    [[TMP6:%.*]] = getelementptr double, <2 x ptr> [[TMP2]], <2 x i64> [[TMP5]]
16; CHECK-NEXT:    [[ARRAYIDX17_I28_1:%.*]] = getelementptr double, ptr [[A]], i64 [[TMP3]]
17; CHECK-NEXT:    [[TMP7:%.*]] = call <2 x double> @llvm.masked.gather.v2f64.v2p0(<2 x ptr> [[TMP6]], i32 8, <2 x i1> splat (i1 true), <2 x double> poison)
18; CHECK-NEXT:    [[TMP8:%.*]] = load <2 x double>, ptr [[A]], align 8
19; CHECK-NEXT:    [[TMP9:%.*]] = load <2 x double>, ptr [[A]], align 8
20; CHECK-NEXT:    [[TMP10:%.*]] = fsub <2 x double> [[TMP8]], [[TMP9]]
21; CHECK-NEXT:    [[TMP11:%.*]] = fsub <2 x double> [[TMP7]], [[TMP10]]
22; CHECK-NEXT:    call void @llvm.experimental.vp.strided.store.v2f64.p0.i64(<2 x double> [[TMP11]], ptr align 8 [[ARRAYIDX17_I28_1]], i64 -8, <2 x i1> splat (i1 true), i32 2)
23; CHECK-NEXT:    br label %[[BB]]
24;
25entry:
26  br label %bb
27
  ; Self-looping block with no exit: every iteration ends by branching back
  ; to %bb.
28bb:
  ; Constant index 0, so %arrayidx.i.1 addresses %a[0].
29  %indvars.iv.next239.i = add i64 0, 0
30  %arrayidx.i.1 = getelementptr double, ptr %a, i64 %indvars.iv.next239.i
31  %1 = load double, ptr %arrayidx.i.1, align 8
  ; Destination of the first store below: %a[%0].
32  %arrayidx10.i.1 = getelementptr double, ptr %a, i64 %0
  ; %a[%0 | 1]. The disjoint flag states that %0 and 1 share no set bits, so
  ; this is the element right after %a[%0]. The pointer is both loaded from
  ; (%3) and used as the destination of the second store below.
33  %2 = or disjoint i64 %0, 1
34  %arrayidx17.i28.1 = getelementptr double, ptr %a, i64 %2
35  %3 = load double, ptr %arrayidx17.i28.1, align 8
  ; Two loads of the same address, %a[0].
36  %4 = load double, ptr %a, align 8
37  %5 = load double, ptr %a, align 8
  ; Two loads of %a[1], each through its own (identical) GEP.
38  %arrayidx38.i.1 = getelementptr double, ptr %a, i64 1
39  %6 = load double, ptr %arrayidx38.i.1, align 8
40  %arrayidx41.i.1 = getelementptr double, ptr %a, i64 1
41  %7 = load double, ptr %arrayidx41.i.1, align 8
  ; %sub47.i.1 = %a[0] - %a[0] and %sub54.i.1 = %a[1] - %a[1].
42  %sub47.i.1 = fsub double %4, %5
43  %sub54.i.1 = fsub double %6, %7
  ; %a[%0] receives (%a[0] - %sub54.i.1).
44  %sub69.i.1 = fsub double %1, %sub54.i.1
45  store double %sub69.i.1, ptr %arrayidx10.i.1, align 8
  ; %a[%0 | 1] receives (%a[%0 | 1] - %sub47.i.1).
46  %sub72.i.1 = fsub double %3, %sub47.i.1
47  store double %sub72.i.1, ptr %arrayidx17.i28.1, align 8
48  br label %bb
49}
50