xref: /llvm-project/llvm/test/CodeGen/AArch64/sms-mve6.mir (revision 0c5319e546321d7a766999e49e0ccf801ff2b3dc)
1# NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py UTC_ARGS: --version 4
2# RUN: llc --verify-machineinstrs -mtriple=aarch64 -o - %s -run-pass pipeliner -aarch64-enable-pipeliner -pipeliner-mve-cg -pipeliner-force-ii=3 -mcpu=neoverse-n1 2>&1 | FileCheck %s
3
4# test pipeliner code generation by MVE algorithm
5# #stages: 2, unroll count: 3
6
7...
8---
9name:            func
10tracksRegLiveness: true
11body:             |
12  ; CHECK-LABEL: name: func
13  ; CHECK: bb.0.entry:
14  ; CHECK-NEXT:   successors: %bb.3(0x80000000)
15  ; CHECK-NEXT:   liveins: $x0, $x1
16  ; CHECK-NEXT: {{  $}}
17  ; CHECK-NEXT:   [[COPY:%[0-9]+]]:gpr64 = COPY $x0
18  ; CHECK-NEXT:   [[COPY1:%[0-9]+]]:gpr64 = COPY $x1
19  ; CHECK-NEXT:   [[FMOVDi:%[0-9]+]]:fpr64 = FMOVDi 1
20  ; CHECK-NEXT:   B %bb.3
21  ; CHECK-NEXT: {{  $}}
22  ; CHECK-NEXT: bb.3:
23  ; CHECK-NEXT:   successors: %bb.4(0x40000000), %bb.7(0x40000000)
24  ; CHECK-NEXT: {{  $}}
25  ; CHECK-NEXT:   dead $xzr = SUBSXrr [[COPY]], [[COPY1]], implicit-def $nzcv
26  ; CHECK-NEXT:   [[CSINCXr:%[0-9]+]]:gpr64common = CSINCXr $xzr, $xzr, 1, implicit $nzcv
27  ; CHECK-NEXT:   [[ADDXrr:%[0-9]+]]:gpr64 = ADDXrr [[COPY1]], [[COPY1]]
28  ; CHECK-NEXT:   dead $xzr = SUBSXrr [[COPY]], [[ADDXrr]], implicit-def $nzcv
29  ; CHECK-NEXT:   [[CSINCXr1:%[0-9]+]]:gpr64common = CSINCXr [[CSINCXr]], [[CSINCXr]], 1, implicit $nzcv
30  ; CHECK-NEXT:   [[ADDXrr1:%[0-9]+]]:gpr64 = ADDXrr [[ADDXrr]], [[COPY1]]
31  ; CHECK-NEXT:   dead $xzr = SUBSXrr [[COPY]], [[ADDXrr1]], implicit-def $nzcv
32  ; CHECK-NEXT:   [[CSINCXr2:%[0-9]+]]:gpr64common = CSINCXr [[CSINCXr1]], [[CSINCXr1]], 1, implicit $nzcv
33  ; CHECK-NEXT:   [[ADDXrr2:%[0-9]+]]:gpr64 = ADDXrr [[ADDXrr1]], [[COPY1]]
34  ; CHECK-NEXT:   dead $xzr = SUBSXrr [[COPY]], [[ADDXrr2]], implicit-def $nzcv
35  ; CHECK-NEXT:   [[CSINCXr3:%[0-9]+]]:gpr64common = CSINCXr [[CSINCXr2]], [[CSINCXr2]], 1, implicit $nzcv
36  ; CHECK-NEXT:   dead $xzr = SUBSXri [[CSINCXr3]], 0, 0, implicit-def $nzcv
37  ; CHECK-NEXT:   Bcc 0, %bb.4, implicit $nzcv
38  ; CHECK-NEXT:   B %bb.7
39  ; CHECK-NEXT: {{  $}}
40  ; CHECK-NEXT: bb.4:
41  ; CHECK-NEXT:   successors: %bb.5(0x80000000)
42  ; CHECK-NEXT: {{  $}}
43  ; CHECK-NEXT:   dead $xzr = SUBSXrr [[COPY]], [[COPY1]], implicit-def $nzcv
44  ; CHECK-NEXT:   [[FADDDrr:%[0-9]+]]:fpr64 = FADDDrr [[FMOVDi]], [[FMOVDi]], implicit $fpcr
45  ; CHECK-NEXT:   [[ADDXrr3:%[0-9]+]]:gpr64 = ADDXrr [[COPY1]], [[COPY1]]
46  ; CHECK-NEXT:   [[FADDDrr1:%[0-9]+]]:fpr64 = FADDDrr [[FADDDrr]], [[FMOVDi]], implicit $fpcr
47  ; CHECK-NEXT: {{  $}}
48  ; CHECK-NEXT: bb.5:
49  ; CHECK-NEXT:   successors: %bb.5(0x40000000), %bb.6(0x40000000)
50  ; CHECK-NEXT: {{  $}}
51  ; CHECK-NEXT:   [[PHI:%[0-9]+]]:fpr64 = PHI [[FADDDrr5:%[0-9]+]], %bb.5, [[FMOVDi]], %bb.4
52  ; CHECK-NEXT:   [[PHI1:%[0-9]+]]:gpr64 = PHI [[ADDXrr5:%[0-9]+]], %bb.5, [[COPY1]], %bb.4
53  ; CHECK-NEXT:   [[PHI2:%[0-9]+]]:fpr64 = PHI [[FADDDrr8:%[0-9]+]], %bb.5, [[FADDDrr]], %bb.4
54  ; CHECK-NEXT:   [[PHI3:%[0-9]+]]:gpr64 = PHI [[ADDXrr6:%[0-9]+]], %bb.5, [[ADDXrr3]], %bb.4
55  ; CHECK-NEXT:   [[PHI4:%[0-9]+]]:fpr64 = PHI [[FADDDrr10:%[0-9]+]], %bb.5, [[FADDDrr1]], %bb.4
56  ; CHECK-NEXT:   dead $xzr = SUBSXrr [[COPY]], [[PHI3]], implicit-def $nzcv
57  ; CHECK-NEXT:   [[FADDDrr2:%[0-9]+]]:fpr64 = FADDDrr [[FMOVDi]], [[PHI2]], implicit $fpcr
58  ; CHECK-NEXT:   [[ADDXrr4:%[0-9]+]]:gpr64 = ADDXrr [[PHI3]], [[COPY1]]
59  ; CHECK-NEXT:   [[FADDDrr3:%[0-9]+]]:fpr64 = FADDDrr [[PHI4]], [[PHI]], implicit $fpcr
60  ; CHECK-NEXT:   [[FADDDrr4:%[0-9]+]]:fpr64 = FADDDrr [[FADDDrr2]], [[PHI2]], implicit $fpcr
61  ; CHECK-NEXT:   dead $xzr = SUBSXrr [[COPY]], [[ADDXrr4]], implicit-def $nzcv
62  ; CHECK-NEXT:   [[FADDDrr5]]:fpr64 = FADDDrr [[FMOVDi]], [[FADDDrr2]], implicit $fpcr
63  ; CHECK-NEXT:   [[ADDXrr5]]:gpr64 = ADDXrr [[ADDXrr4]], [[COPY1]]
64  ; CHECK-NEXT:   [[FADDDrr6:%[0-9]+]]:fpr64 = FADDDrr [[FADDDrr4]], [[PHI2]], implicit $fpcr
65  ; CHECK-NEXT:   [[FADDDrr7:%[0-9]+]]:fpr64 = FADDDrr [[FADDDrr5]], [[FADDDrr2]], implicit $fpcr
66  ; CHECK-NEXT:   dead $xzr = SUBSXrr [[COPY]], [[ADDXrr5]], implicit-def $nzcv
67  ; CHECK-NEXT:   [[FADDDrr8]]:fpr64 = FADDDrr [[FMOVDi]], [[FADDDrr5]], implicit $fpcr
68  ; CHECK-NEXT:   [[ADDXrr6]]:gpr64 = ADDXrr [[ADDXrr5]], [[COPY1]]
69  ; CHECK-NEXT:   [[FADDDrr9:%[0-9]+]]:fpr64 = FADDDrr [[FADDDrr7]], [[FADDDrr2]], implicit $fpcr
70  ; CHECK-NEXT:   [[FADDDrr10]]:fpr64 = FADDDrr [[FADDDrr8]], [[FADDDrr5]], implicit $fpcr
71  ; CHECK-NEXT:   [[CSINCXr4:%[0-9]+]]:gpr64common = CSINCXr $xzr, $xzr, 1, implicit $nzcv
72  ; CHECK-NEXT:   dead $xzr = SUBSXrr [[COPY]], [[ADDXrr6]], implicit-def $nzcv
73  ; CHECK-NEXT:   [[CSINCXr5:%[0-9]+]]:gpr64common = CSINCXr [[CSINCXr4]], [[CSINCXr4]], 1, implicit $nzcv
74  ; CHECK-NEXT:   [[ADDXrr7:%[0-9]+]]:gpr64 = ADDXrr [[ADDXrr6]], [[COPY1]]
75  ; CHECK-NEXT:   dead $xzr = SUBSXrr [[COPY]], [[ADDXrr7]], implicit-def $nzcv
76  ; CHECK-NEXT:   [[CSINCXr6:%[0-9]+]]:gpr64common = CSINCXr [[CSINCXr5]], [[CSINCXr5]], 1, implicit $nzcv
77  ; CHECK-NEXT:   dead $xzr = SUBSXri [[CSINCXr6]], 0, 0, implicit-def $nzcv
78  ; CHECK-NEXT:   Bcc 0, %bb.5, implicit $nzcv
79  ; CHECK-NEXT:   B %bb.6
80  ; CHECK-NEXT: {{  $}}
81  ; CHECK-NEXT: bb.6:
82  ; CHECK-NEXT:   successors: %bb.7(0x40000000), %bb.2(0x40000000)
83  ; CHECK-NEXT: {{  $}}
84  ; CHECK-NEXT:   [[FADDDrr11:%[0-9]+]]:fpr64 = FADDDrr [[FADDDrr10]], [[FADDDrr5]], implicit $fpcr
85  ; CHECK-NEXT:   dead $xzr = SUBSXrr [[COPY]], [[ADDXrr5]], implicit-def $nzcv
86  ; CHECK-NEXT:   [[CSINCXr7:%[0-9]+]]:gpr64common = CSINCXr $xzr, $xzr, 1, implicit $nzcv
87  ; CHECK-NEXT:   dead $xzr = SUBSXri [[CSINCXr7]], 0, 0, implicit-def $nzcv
88  ; CHECK-NEXT:   Bcc 0, %bb.7, implicit $nzcv
89  ; CHECK-NEXT:   B %bb.2
90  ; CHECK-NEXT: {{  $}}
91  ; CHECK-NEXT: bb.7:
92  ; CHECK-NEXT:   successors: %bb.1(0x80000000)
93  ; CHECK-NEXT: {{  $}}
94  ; CHECK-NEXT:   [[PHI5:%[0-9]+]]:fpr64 = PHI [[FMOVDi]], %bb.3, [[FADDDrr8]], %bb.6
95  ; CHECK-NEXT:   [[PHI6:%[0-9]+]]:gpr64 = PHI [[COPY1]], %bb.3, [[ADDXrr6]], %bb.6
96  ; CHECK-NEXT:   B %bb.1
97  ; CHECK-NEXT: {{  $}}
98  ; CHECK-NEXT: bb.1:
99  ; CHECK-NEXT:   successors: %bb.1(0x40000000), %bb.2(0x40000000)
100  ; CHECK-NEXT: {{  $}}
101  ; CHECK-NEXT:   [[PHI7:%[0-9]+]]:gpr64 = PHI [[PHI6]], %bb.7, [[ADDXrr8:%[0-9]+]], %bb.1
102  ; CHECK-NEXT:   [[PHI8:%[0-9]+]]:fpr64 = PHI [[PHI5]], %bb.7, [[FADDDrr12:%[0-9]+]], %bb.1
103  ; CHECK-NEXT:   dead $xzr = SUBSXrr [[COPY]], [[PHI7]], implicit-def $nzcv
104  ; CHECK-NEXT:   [[ADDXrr8]]:gpr64 = ADDXrr [[PHI7]], [[COPY1]]
105  ; CHECK-NEXT:   [[FADDDrr12]]:fpr64 = FADDDrr [[FMOVDi]], [[PHI8]], implicit $fpcr
106  ; CHECK-NEXT:   [[FADDDrr13:%[0-9]+]]:fpr64 = FADDDrr [[FADDDrr12]], [[PHI8]], implicit $fpcr
107  ; CHECK-NEXT:   [[FADDDrr14:%[0-9]+]]:fpr64 = FADDDrr [[FADDDrr13]], [[PHI8]], implicit $fpcr
108  ; CHECK-NEXT:   Bcc 1, %bb.1, implicit $nzcv
109  ; CHECK-NEXT:   B %bb.2
110  ; CHECK-NEXT: {{  $}}
111  ; CHECK-NEXT: bb.2:
112  ; CHECK-NEXT:   [[PHI9:%[0-9]+]]:fpr64 = PHI [[FADDDrr12]], %bb.1, [[FADDDrr8]], %bb.6
113  ; CHECK-NEXT:   [[PHI10:%[0-9]+]]:fpr64 = PHI [[FADDDrr14]], %bb.1, [[FADDDrr11]], %bb.6
114  ; CHECK-NEXT:   [[FMULDrr:%[0-9]+]]:fpr64 = FMULDrr [[PHI9]], [[PHI10]], implicit $fpcr
115  ; CHECK-NEXT:   $d0 = COPY [[FMULDrr]]
116  ; CHECK-NEXT:   RET_ReallyLR implicit $d0
117  bb.0.entry: ; Entry block: defines the values that are live into the single-block loop bb.1.
118    liveins: $x0, $x1
119    %10:gpr64 = COPY $x0 ; %10: the value the loop counter is compared against on every iteration
120    %11:gpr64 = COPY $x1 ; %11: both the counter's initial value and its per-iteration step
121    %20:fpr64 = FMOVDi 1 ; %20: loop-invariant FP operand and initial value of the %24 recurrence
122
123  bb.1: ; Loop the pipeliner is run on: an integer counter plus a dependent chain of three FADDs.
124    %12:gpr64 = PHI %11, %bb.0, %13, %bb.1 ; counter: %11 on entry, %13 on the back edge
125    %24:fpr64 = PHI %20, %bb.0, %21, %bb.1 ; FP recurrence: %20 on entry, %21 on the back edge
126    dead $xzr = SUBSXrr %10, %12, implicit-def $nzcv ; compare only: result is discarded, $nzcv feeds the Bcc below
127    %13:gpr64 = ADDXrr %12, %11 ; next counter value
128    %21:fpr64 = FADDDrr %20, %24, implicit $fpcr ; loop-carried through %24 and also read in bb.2
129    %22:fpr64 = FADDDrr %21, %24, implicit $fpcr
130    %23:fpr64 = FADDDrr %22, %24, implicit $fpcr ; end of the FADD chain; read in bb.2
131    Bcc 1, %bb.1, implicit $nzcv ; back edge, decided by the $nzcv written by the SUBSXrr above
132    B %bb.2
133
134  bb.2: ; Exit block: multiplies two values defined inside the loop and returns the product in $d0.
135    %25:fpr64 = FMULDrr %21, %23, implicit $fpcr
136    $d0 = COPY %25
137    RET_ReallyLR implicit $d0
138...
139