xref: /llvm-project/llvm/test/CodeGen/AArch64/sms-mve1.mir (revision 0c5319e546321d7a766999e49e0ccf801ff2b3dc)
1# NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py UTC_ARGS: --version 4
2# RUN: llc --verify-machineinstrs -mtriple=aarch64 -o - %s -run-pass pipeliner -aarch64-enable-pipeliner -pipeliner-mve-cg -pipeliner-force-ii=3 -mcpu=neoverse-n1 2>&1 | FileCheck %s
3
4# test pipeliner code generation by MVE algorithm
5# #stages: 2, unroll count: 3
6
7# the calculation result can be checked as follows (driver code written in C):
8# for (i=2; i<N; i++)
9#   func_noswp(i, 1) == func(i, 1)
10
11...
12---
13name:            func
14tracksRegLiveness: true
15body:             |
16  ; CHECK-LABEL: name: func
17  ; CHECK: bb.0.entry:
18  ; CHECK-NEXT:   successors: %bb.3(0x80000000)
19  ; CHECK-NEXT:   liveins: $x0, $x1
20  ; CHECK-NEXT: {{  $}}
21  ; CHECK-NEXT:   [[COPY:%[0-9]+]]:gpr64 = COPY $x0
22  ; CHECK-NEXT:   [[COPY1:%[0-9]+]]:gpr64 = COPY $x1
23  ; CHECK-NEXT:   [[FMOVDi:%[0-9]+]]:fpr64 = FMOVDi 1
24  ; CHECK-NEXT:   B %bb.3
25  ; CHECK-NEXT: {{  $}}
26  ; CHECK-NEXT: bb.3:
27  ; CHECK-NEXT:   successors: %bb.4(0x40000000), %bb.7(0x40000000)
28  ; CHECK-NEXT: {{  $}}
29  ; CHECK-NEXT:   [[ADDXrr:%[0-9]+]]:gpr64 = ADDXrr [[COPY1]], [[COPY1]]
30  ; CHECK-NEXT:   dead $xzr = SUBSXrr [[COPY]], [[ADDXrr]], implicit-def $nzcv
31  ; CHECK-NEXT:   [[CSINCXr:%[0-9]+]]:gpr64common = CSINCXr $xzr, $xzr, 1, implicit $nzcv
32  ; CHECK-NEXT:   [[ADDXrr1:%[0-9]+]]:gpr64 = ADDXrr [[ADDXrr]], [[COPY1]]
33  ; CHECK-NEXT:   dead $xzr = SUBSXrr [[COPY]], [[ADDXrr1]], implicit-def $nzcv
34  ; CHECK-NEXT:   [[CSINCXr1:%[0-9]+]]:gpr64common = CSINCXr [[CSINCXr]], [[CSINCXr]], 1, implicit $nzcv
35  ; CHECK-NEXT:   [[ADDXrr2:%[0-9]+]]:gpr64 = ADDXrr [[ADDXrr1]], [[COPY1]]
36  ; CHECK-NEXT:   dead $xzr = SUBSXrr [[COPY]], [[ADDXrr2]], implicit-def $nzcv
37  ; CHECK-NEXT:   [[CSINCXr2:%[0-9]+]]:gpr64common = CSINCXr [[CSINCXr1]], [[CSINCXr1]], 1, implicit $nzcv
38  ; CHECK-NEXT:   [[ADDXrr3:%[0-9]+]]:gpr64 = ADDXrr [[ADDXrr2]], [[COPY1]]
39  ; CHECK-NEXT:   dead $xzr = SUBSXrr [[COPY]], [[ADDXrr3]], implicit-def $nzcv
40  ; CHECK-NEXT:   [[CSINCXr3:%[0-9]+]]:gpr64common = CSINCXr [[CSINCXr2]], [[CSINCXr2]], 1, implicit $nzcv
41  ; CHECK-NEXT:   dead $xzr = SUBSXri [[CSINCXr3]], 0, 0, implicit-def $nzcv
42  ; CHECK-NEXT:   Bcc 0, %bb.4, implicit $nzcv
43  ; CHECK-NEXT:   B %bb.7
44  ; CHECK-NEXT: {{  $}}
45  ; CHECK-NEXT: bb.4:
46  ; CHECK-NEXT:   successors: %bb.5(0x80000000)
47  ; CHECK-NEXT: {{  $}}
48  ; CHECK-NEXT:   [[FADDDrr:%[0-9]+]]:fpr64 = FADDDrr [[FMOVDi]], [[FMOVDi]], implicit $fpcr
49  ; CHECK-NEXT:   [[ADDXrr4:%[0-9]+]]:gpr64 = ADDXrr [[COPY1]], [[COPY1]]
50  ; CHECK-NEXT:   dead $xzr = SUBSXrr [[COPY]], [[ADDXrr4]], implicit-def $nzcv
51  ; CHECK-NEXT:   [[FADDDrr1:%[0-9]+]]:fpr64 = FADDDrr [[FADDDrr]], [[FMOVDi]], implicit $fpcr
52  ; CHECK-NEXT: {{  $}}
53  ; CHECK-NEXT: bb.5:
54  ; CHECK-NEXT:   successors: %bb.5(0x40000000), %bb.6(0x40000000)
55  ; CHECK-NEXT: {{  $}}
56  ; CHECK-NEXT:   [[PHI:%[0-9]+]]:fpr64 = PHI [[FADDDrr5:%[0-9]+]], %bb.5, [[FMOVDi]], %bb.4
57  ; CHECK-NEXT:   [[PHI1:%[0-9]+]]:gpr64 = PHI [[ADDXrr6:%[0-9]+]], %bb.5, [[COPY1]], %bb.4
58  ; CHECK-NEXT:   [[PHI2:%[0-9]+]]:fpr64 = PHI [[FADDDrr8:%[0-9]+]], %bb.5, [[FADDDrr]], %bb.4
59  ; CHECK-NEXT:   [[PHI3:%[0-9]+]]:gpr64 = PHI [[ADDXrr7:%[0-9]+]], %bb.5, [[ADDXrr4]], %bb.4
60  ; CHECK-NEXT:   [[PHI4:%[0-9]+]]:fpr64 = PHI [[FADDDrr10:%[0-9]+]], %bb.5, [[FADDDrr1]], %bb.4
61  ; CHECK-NEXT:   [[FADDDrr2:%[0-9]+]]:fpr64 = FADDDrr [[FMOVDi]], [[PHI2]], implicit $fpcr
62  ; CHECK-NEXT:   [[ADDXrr5:%[0-9]+]]:gpr64 = ADDXrr [[PHI3]], [[COPY1]]
63  ; CHECK-NEXT:   [[FADDDrr3:%[0-9]+]]:fpr64 = FADDDrr [[PHI4]], [[PHI]], implicit $fpcr
64  ; CHECK-NEXT:   dead $xzr = SUBSXrr [[COPY]], [[ADDXrr5]], implicit-def $nzcv
65  ; CHECK-NEXT:   [[FADDDrr4:%[0-9]+]]:fpr64 = FADDDrr [[FADDDrr2]], [[PHI2]], implicit $fpcr
66  ; CHECK-NEXT:   [[FADDDrr5]]:fpr64 = FADDDrr [[FMOVDi]], [[FADDDrr2]], implicit $fpcr
67  ; CHECK-NEXT:   [[ADDXrr6]]:gpr64 = ADDXrr [[ADDXrr5]], [[COPY1]]
68  ; CHECK-NEXT:   [[FADDDrr6:%[0-9]+]]:fpr64 = FADDDrr [[FADDDrr4]], [[PHI2]], implicit $fpcr
69  ; CHECK-NEXT:   dead $xzr = SUBSXrr [[COPY]], [[ADDXrr6]], implicit-def $nzcv
70  ; CHECK-NEXT:   [[FADDDrr7:%[0-9]+]]:fpr64 = FADDDrr [[FADDDrr5]], [[FADDDrr2]], implicit $fpcr
71  ; CHECK-NEXT:   [[FADDDrr8]]:fpr64 = FADDDrr [[FMOVDi]], [[FADDDrr5]], implicit $fpcr
72  ; CHECK-NEXT:   [[ADDXrr7]]:gpr64 = ADDXrr [[ADDXrr6]], [[COPY1]]
73  ; CHECK-NEXT:   [[FADDDrr9:%[0-9]+]]:fpr64 = FADDDrr [[FADDDrr7]], [[FADDDrr2]], implicit $fpcr
74  ; CHECK-NEXT:   dead $xzr = SUBSXrr [[COPY]], [[ADDXrr7]], implicit-def $nzcv
75  ; CHECK-NEXT:   [[FADDDrr10]]:fpr64 = FADDDrr [[FADDDrr8]], [[FADDDrr5]], implicit $fpcr
76  ; CHECK-NEXT:   [[CSINCXr4:%[0-9]+]]:gpr64common = CSINCXr $xzr, $xzr, 1, implicit $nzcv
77  ; CHECK-NEXT:   [[ADDXrr8:%[0-9]+]]:gpr64 = ADDXrr [[ADDXrr7]], [[COPY1]]
78  ; CHECK-NEXT:   dead $xzr = SUBSXrr [[COPY]], [[ADDXrr8]], implicit-def $nzcv
79  ; CHECK-NEXT:   [[CSINCXr5:%[0-9]+]]:gpr64common = CSINCXr [[CSINCXr4]], [[CSINCXr4]], 1, implicit $nzcv
80  ; CHECK-NEXT:   [[ADDXrr9:%[0-9]+]]:gpr64 = ADDXrr [[ADDXrr8]], [[COPY1]]
81  ; CHECK-NEXT:   dead $xzr = SUBSXrr [[COPY]], [[ADDXrr9]], implicit-def $nzcv
82  ; CHECK-NEXT:   [[CSINCXr6:%[0-9]+]]:gpr64common = CSINCXr [[CSINCXr5]], [[CSINCXr5]], 1, implicit $nzcv
83  ; CHECK-NEXT:   dead $xzr = SUBSXri [[CSINCXr6]], 0, 0, implicit-def $nzcv
84  ; CHECK-NEXT:   Bcc 0, %bb.5, implicit $nzcv
85  ; CHECK-NEXT:   B %bb.6
86  ; CHECK-NEXT: {{  $}}
87  ; CHECK-NEXT: bb.6:
88  ; CHECK-NEXT:   successors: %bb.7(0x40000000), %bb.2(0x40000000)
89  ; CHECK-NEXT: {{  $}}
90  ; CHECK-NEXT:   [[FADDDrr11:%[0-9]+]]:fpr64 = FADDDrr [[FADDDrr10]], [[FADDDrr5]], implicit $fpcr
91  ; CHECK-NEXT:   dead $xzr = SUBSXrr [[COPY]], [[ADDXrr7]], implicit-def $nzcv
92  ; CHECK-NEXT:   [[CSINCXr7:%[0-9]+]]:gpr64common = CSINCXr $xzr, $xzr, 1, implicit $nzcv
93  ; CHECK-NEXT:   dead $xzr = SUBSXri [[CSINCXr7]], 0, 0, implicit-def $nzcv
94  ; CHECK-NEXT:   Bcc 0, %bb.7, implicit $nzcv
95  ; CHECK-NEXT:   B %bb.2
96  ; CHECK-NEXT: {{  $}}
97  ; CHECK-NEXT: bb.7:
98  ; CHECK-NEXT:   successors: %bb.1(0x80000000)
99  ; CHECK-NEXT: {{  $}}
100  ; CHECK-NEXT:   [[PHI5:%[0-9]+]]:fpr64 = PHI [[FMOVDi]], %bb.3, [[FADDDrr8]], %bb.6
101  ; CHECK-NEXT:   [[PHI6:%[0-9]+]]:gpr64 = PHI [[COPY1]], %bb.3, [[ADDXrr7]], %bb.6
102  ; CHECK-NEXT:   B %bb.1
103  ; CHECK-NEXT: {{  $}}
104  ; CHECK-NEXT: bb.1:
105  ; CHECK-NEXT:   successors: %bb.1(0x40000000), %bb.2(0x40000000)
106  ; CHECK-NEXT: {{  $}}
107  ; CHECK-NEXT:   [[PHI7:%[0-9]+]]:gpr64 = PHI [[PHI6]], %bb.7, [[ADDXrr10:%[0-9]+]], %bb.1
108  ; CHECK-NEXT:   [[PHI8:%[0-9]+]]:fpr64 = PHI [[PHI5]], %bb.7, [[FADDDrr12:%[0-9]+]], %bb.1
109  ; CHECK-NEXT:   [[ADDXrr10]]:gpr64 = ADDXrr [[PHI7]], [[COPY1]]
110  ; CHECK-NEXT:   dead $xzr = SUBSXrr [[COPY]], [[ADDXrr10]], implicit-def $nzcv
111  ; CHECK-NEXT:   [[FADDDrr12]]:fpr64 = FADDDrr [[FMOVDi]], [[PHI8]], implicit $fpcr
112  ; CHECK-NEXT:   [[FADDDrr13:%[0-9]+]]:fpr64 = FADDDrr [[FADDDrr12]], [[PHI8]], implicit $fpcr
113  ; CHECK-NEXT:   [[FADDDrr14:%[0-9]+]]:fpr64 = FADDDrr [[FADDDrr13]], [[PHI8]], implicit $fpcr
114  ; CHECK-NEXT:   Bcc 1, %bb.1, implicit $nzcv
115  ; CHECK-NEXT:   B %bb.2
116  ; CHECK-NEXT: {{  $}}
117  ; CHECK-NEXT: bb.2:
118  ; CHECK-NEXT:   [[PHI9:%[0-9]+]]:fpr64 = PHI [[FADDDrr12]], %bb.1, [[FADDDrr8]], %bb.6
119  ; CHECK-NEXT:   [[PHI10:%[0-9]+]]:fpr64 = PHI [[FADDDrr14]], %bb.1, [[FADDDrr11]], %bb.6
120  ; CHECK-NEXT:   [[FMULDrr:%[0-9]+]]:fpr64 = FMULDrr [[PHI9]], [[PHI10]], implicit $fpcr
121  ; CHECK-NEXT:   $d0 = COPY [[FMULDrr]]
122  ; CHECK-NEXT:   RET_ReallyLR implicit $d0
123  bb.0.entry:
124    liveins: $x0, $x1
    ; Capture the two incoming arguments in virtual registers (%10 from $x0,
    ; %11 from $x1) and define the FP value %20 that seeds the loop below.
125    %10:gpr64 = COPY $x0
126    %11:gpr64 = COPY $x1
127    %20:fpr64 = FMOVDi 1
128
  ; Single-block loop: bb.1 branches back to itself. It carries two
  ; recurrences through PHIs:
  ;   %12 - integer value, starts at %11 and is advanced by %11 (giving %13).
  ;   %24 - FP value, starts at %20 and is replaced by %21 = %20 + %24.
129  bb.1:
130    %12:gpr64 = PHI %11, %bb.0, %13, %bb.1
131    %24:fpr64 = PHI %20, %bb.0, %21, %bb.1
132    %13:gpr64 = ADDXrr %12, %11
    ; Compare %10 with the updated integer value %13; the subtraction result
    ; is discarded into $xzr and only the NZCV flags are kept for the branch.
133    dead $xzr = SUBSXrr %10, %13, implicit-def $nzcv
    ; Chain of three dependent FP adds (%21 -> %22 -> %23); every link also
    ; reads the loop-carried value %24.
134    %21:fpr64 = FADDDrr %20, %24, implicit $fpcr
135    %22:fpr64 = FADDDrr %21, %24, implicit $fpcr
136    %23:fpr64 = FADDDrr %22, %24, implicit $fpcr
    ; Take the back edge when condition code 1 holds for the flags set by the
    ; SUBSXrr above; otherwise leave the loop.
137    Bcc 1, %bb.1, implicit $nzcv
138    B %bb.2
139
  ; Loop exit: multiply two values defined inside the loop (%21 and %23) and
  ; return the product in $d0, so both are live out of bb.1.
140  bb.2:
141    %25:fpr64 = FMULDrr %21, %23, implicit $fpcr
142    $d0 = COPY %25
143    RET_ReallyLR implicit $d0
144...
145