# NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py UTC_ARGS: --version 4
# RUN: llc --verify-machineinstrs -mtriple=aarch64 -o - %s -run-pass pipeliner -aarch64-enable-pipeliner -pipeliner-mve-cg -pipeliner-force-ii=3 -mcpu=neoverse-n1 2>&1 | FileCheck %s

# Test pipeliner code generation by the MVE algorithm.
# #stages: 2, unroll count: 3
#
# Input: a single-block loop (bb.1) that advances an integer counter by the
# value of $x1 on every iteration, compares it against the value of $x0, and
# carries a chain of three dependent FADDDrr operations. The exit block (bb.2)
# returns the product of the first and the last FADDDrr result in $d0.
#
# The pass is invoked with -pipeliner-mve-cg and -pipeliner-force-ii=3. In the
# expected output the original loop is still present as bb.1 (reached through
# bb.7), next to the newly generated blocks bb.3 through bb.6; bb.5 is the
# generated loop and contains three copies of the counter update.
#
# The assertions below are autogenerated; regenerate them with
# utils/update_mir_test_checks.py instead of editing them by hand.

# The calculation result can be checked as follows (driver code written in C):
#   for (i=2; i<N; i++)
#     func_noswp(i, 1) == func(i, 1)

...
---
name:            func
tracksRegLiveness: true
body:             |
  ; CHECK-LABEL: name: func
  ; CHECK: bb.0.entry:
  ; CHECK-NEXT:   successors: %bb.3(0x80000000)
  ; CHECK-NEXT:   liveins: $x0, $x1
  ; CHECK-NEXT: {{ $}}
  ; CHECK-NEXT:   [[COPY:%[0-9]+]]:gpr64 = COPY $x0
  ; CHECK-NEXT:   [[COPY1:%[0-9]+]]:gpr64 = COPY $x1
  ; CHECK-NEXT:   [[FMOVDi:%[0-9]+]]:fpr64 = FMOVDi 1
  ; CHECK-NEXT:   B %bb.3
  ; CHECK-NEXT: {{ $}}
  ; CHECK-NEXT: bb.3:
  ; CHECK-NEXT:   successors: %bb.4(0x40000000), %bb.7(0x40000000)
  ; CHECK-NEXT: {{ $}}
  ; CHECK-NEXT:   [[ADDXrr:%[0-9]+]]:gpr64 = ADDXrr [[COPY1]], [[COPY1]]
  ; CHECK-NEXT:   dead $xzr = SUBSXrr [[COPY]], [[ADDXrr]], implicit-def $nzcv
  ; CHECK-NEXT:   [[CSINCXr:%[0-9]+]]:gpr64common = CSINCXr $xzr, $xzr, 1, implicit $nzcv
  ; CHECK-NEXT:   [[ADDXrr1:%[0-9]+]]:gpr64 = ADDXrr [[ADDXrr]], [[COPY1]]
  ; CHECK-NEXT:   dead $xzr = SUBSXrr [[COPY]], [[ADDXrr1]], implicit-def $nzcv
  ; CHECK-NEXT:   [[CSINCXr1:%[0-9]+]]:gpr64common = CSINCXr [[CSINCXr]], [[CSINCXr]], 1, implicit $nzcv
  ; CHECK-NEXT:   [[ADDXrr2:%[0-9]+]]:gpr64 = ADDXrr [[ADDXrr1]], [[COPY1]]
  ; CHECK-NEXT:   dead $xzr = SUBSXrr [[COPY]], [[ADDXrr2]], implicit-def $nzcv
  ; CHECK-NEXT:   [[CSINCXr2:%[0-9]+]]:gpr64common = CSINCXr [[CSINCXr1]], [[CSINCXr1]], 1, implicit $nzcv
  ; CHECK-NEXT:   [[ADDXrr3:%[0-9]+]]:gpr64 = ADDXrr [[ADDXrr2]], [[COPY1]]
  ; CHECK-NEXT:   dead $xzr = SUBSXrr [[COPY]], [[ADDXrr3]], implicit-def $nzcv
  ; CHECK-NEXT:   [[CSINCXr3:%[0-9]+]]:gpr64common = CSINCXr [[CSINCXr2]], [[CSINCXr2]], 1, implicit $nzcv
  ; CHECK-NEXT:   dead $xzr = SUBSXri [[CSINCXr3]], 0, 0, implicit-def $nzcv
  ; CHECK-NEXT:   Bcc 0, %bb.4, implicit $nzcv
  ; CHECK-NEXT:   B %bb.7
  ; CHECK-NEXT: {{ $}}
  ; CHECK-NEXT: bb.4:
  ; CHECK-NEXT:   successors: %bb.5(0x80000000)
  ; CHECK-NEXT: {{ $}}
  ; CHECK-NEXT:   [[FADDDrr:%[0-9]+]]:fpr64 = FADDDrr [[FMOVDi]], [[FMOVDi]], implicit $fpcr
  ; CHECK-NEXT:   [[ADDXrr4:%[0-9]+]]:gpr64 = ADDXrr [[COPY1]], [[COPY1]]
  ; CHECK-NEXT:   dead $xzr = SUBSXrr [[COPY]], [[ADDXrr4]], implicit-def $nzcv
  ; CHECK-NEXT:   [[FADDDrr1:%[0-9]+]]:fpr64 = FADDDrr [[FADDDrr]], [[FMOVDi]], implicit $fpcr
  ; CHECK-NEXT: {{ $}}
  ; CHECK-NEXT: bb.5:
  ; CHECK-NEXT:   successors: %bb.5(0x40000000), %bb.6(0x40000000)
  ; CHECK-NEXT: {{ $}}
  ; CHECK-NEXT:   [[PHI:%[0-9]+]]:fpr64 = PHI [[FADDDrr5:%[0-9]+]], %bb.5, [[FMOVDi]], %bb.4
  ; CHECK-NEXT:   [[PHI1:%[0-9]+]]:gpr64 = PHI [[ADDXrr6:%[0-9]+]], %bb.5, [[COPY1]], %bb.4
  ; CHECK-NEXT:   [[PHI2:%[0-9]+]]:fpr64 = PHI [[FADDDrr8:%[0-9]+]], %bb.5, [[FADDDrr]], %bb.4
  ; CHECK-NEXT:   [[PHI3:%[0-9]+]]:gpr64 = PHI [[ADDXrr7:%[0-9]+]], %bb.5, [[ADDXrr4]], %bb.4
  ; CHECK-NEXT:   [[PHI4:%[0-9]+]]:fpr64 = PHI [[FADDDrr10:%[0-9]+]], %bb.5, [[FADDDrr1]], %bb.4
  ; CHECK-NEXT:   [[FADDDrr2:%[0-9]+]]:fpr64 = FADDDrr [[FMOVDi]], [[PHI2]], implicit $fpcr
  ; CHECK-NEXT:   [[ADDXrr5:%[0-9]+]]:gpr64 = ADDXrr [[PHI3]], [[COPY1]]
  ; CHECK-NEXT:   [[FADDDrr3:%[0-9]+]]:fpr64 = FADDDrr [[PHI4]], [[PHI]], implicit $fpcr
  ; CHECK-NEXT:   dead $xzr = SUBSXrr [[COPY]], [[ADDXrr5]], implicit-def $nzcv
  ; CHECK-NEXT:   [[FADDDrr4:%[0-9]+]]:fpr64 = FADDDrr [[FADDDrr2]], [[PHI2]], implicit $fpcr
  ; CHECK-NEXT:   [[FADDDrr5]]:fpr64 = FADDDrr [[FMOVDi]], [[FADDDrr2]], implicit $fpcr
  ; CHECK-NEXT:   [[ADDXrr6]]:gpr64 = ADDXrr [[ADDXrr5]], [[COPY1]]
  ; CHECK-NEXT:   [[FADDDrr6:%[0-9]+]]:fpr64 = FADDDrr [[FADDDrr4]], [[PHI2]], implicit $fpcr
  ; CHECK-NEXT:   dead $xzr = SUBSXrr [[COPY]], [[ADDXrr6]], implicit-def $nzcv
  ; CHECK-NEXT:   [[FADDDrr7:%[0-9]+]]:fpr64 = FADDDrr [[FADDDrr5]], [[FADDDrr2]], implicit $fpcr
  ; CHECK-NEXT:   [[FADDDrr8]]:fpr64 = FADDDrr [[FMOVDi]], [[FADDDrr5]], implicit $fpcr
  ; CHECK-NEXT:   [[ADDXrr7]]:gpr64 = ADDXrr [[ADDXrr6]], [[COPY1]]
  ; CHECK-NEXT:   [[FADDDrr9:%[0-9]+]]:fpr64 = FADDDrr [[FADDDrr7]], [[FADDDrr2]], implicit $fpcr
  ; CHECK-NEXT:   dead $xzr = SUBSXrr [[COPY]], [[ADDXrr7]], implicit-def $nzcv
  ; CHECK-NEXT:   [[FADDDrr10]]:fpr64 = FADDDrr [[FADDDrr8]], [[FADDDrr5]], implicit $fpcr
  ; CHECK-NEXT:   [[CSINCXr4:%[0-9]+]]:gpr64common = CSINCXr $xzr, $xzr, 1, implicit $nzcv
  ; CHECK-NEXT:   [[ADDXrr8:%[0-9]+]]:gpr64 = ADDXrr [[ADDXrr7]], [[COPY1]]
  ; CHECK-NEXT:   dead $xzr = SUBSXrr [[COPY]], [[ADDXrr8]], implicit-def $nzcv
  ; CHECK-NEXT:   [[CSINCXr5:%[0-9]+]]:gpr64common = CSINCXr [[CSINCXr4]], [[CSINCXr4]], 1, implicit $nzcv
  ; CHECK-NEXT:   [[ADDXrr9:%[0-9]+]]:gpr64 = ADDXrr [[ADDXrr8]], [[COPY1]]
  ; CHECK-NEXT:   dead $xzr = SUBSXrr [[COPY]], [[ADDXrr9]], implicit-def $nzcv
  ; CHECK-NEXT:   [[CSINCXr6:%[0-9]+]]:gpr64common = CSINCXr [[CSINCXr5]], [[CSINCXr5]], 1, implicit $nzcv
  ; CHECK-NEXT:   dead $xzr = SUBSXri [[CSINCXr6]], 0, 0, implicit-def $nzcv
  ; CHECK-NEXT:   Bcc 0, %bb.5, implicit $nzcv
  ; CHECK-NEXT:   B %bb.6
  ; CHECK-NEXT: {{ $}}
  ; CHECK-NEXT: bb.6:
  ; CHECK-NEXT:   successors: %bb.7(0x40000000), %bb.2(0x40000000)
  ; CHECK-NEXT: {{ $}}
  ; CHECK-NEXT:   [[FADDDrr11:%[0-9]+]]:fpr64 = FADDDrr [[FADDDrr10]], [[FADDDrr5]], implicit $fpcr
  ; CHECK-NEXT:   dead $xzr = SUBSXrr [[COPY]], [[ADDXrr7]], implicit-def $nzcv
  ; CHECK-NEXT:   [[CSINCXr7:%[0-9]+]]:gpr64common = CSINCXr $xzr, $xzr, 1, implicit $nzcv
  ; CHECK-NEXT:   dead $xzr = SUBSXri [[CSINCXr7]], 0, 0, implicit-def $nzcv
  ; CHECK-NEXT:   Bcc 0, %bb.7, implicit $nzcv
  ; CHECK-NEXT:   B %bb.2
  ; CHECK-NEXT: {{ $}}
  ; CHECK-NEXT: bb.7:
  ; CHECK-NEXT:   successors: %bb.1(0x80000000)
  ; CHECK-NEXT: {{ $}}
  ; CHECK-NEXT:   [[PHI5:%[0-9]+]]:fpr64 = PHI [[FMOVDi]], %bb.3, [[FADDDrr8]], %bb.6
  ; CHECK-NEXT:   [[PHI6:%[0-9]+]]:gpr64 = PHI [[COPY1]], %bb.3, [[ADDXrr7]], %bb.6
  ; CHECK-NEXT:   B %bb.1
  ; CHECK-NEXT: {{ $}}
  ; CHECK-NEXT: bb.1:
  ; CHECK-NEXT:   successors: %bb.1(0x40000000), %bb.2(0x40000000)
  ; CHECK-NEXT: {{ $}}
  ; CHECK-NEXT:   [[PHI7:%[0-9]+]]:gpr64 = PHI [[PHI6]], %bb.7, [[ADDXrr10:%[0-9]+]], %bb.1
  ; CHECK-NEXT:   [[PHI8:%[0-9]+]]:fpr64 = PHI [[PHI5]], %bb.7, [[FADDDrr12:%[0-9]+]], %bb.1
  ; CHECK-NEXT:   [[ADDXrr10]]:gpr64 = ADDXrr [[PHI7]], [[COPY1]]
  ; CHECK-NEXT:   dead $xzr = SUBSXrr [[COPY]], [[ADDXrr10]], implicit-def $nzcv
  ; CHECK-NEXT:   [[FADDDrr12]]:fpr64 = FADDDrr [[FMOVDi]], [[PHI8]], implicit $fpcr
  ; CHECK-NEXT:   [[FADDDrr13:%[0-9]+]]:fpr64 = FADDDrr [[FADDDrr12]], [[PHI8]], implicit $fpcr
  ; CHECK-NEXT:   [[FADDDrr14:%[0-9]+]]:fpr64 = FADDDrr [[FADDDrr13]], [[PHI8]], implicit $fpcr
  ; CHECK-NEXT:   Bcc 1, %bb.1, implicit $nzcv
  ; CHECK-NEXT:   B %bb.2
  ; CHECK-NEXT: {{ $}}
  ; CHECK-NEXT: bb.2:
  ; CHECK-NEXT:   [[PHI9:%[0-9]+]]:fpr64 = PHI [[FADDDrr12]], %bb.1, [[FADDDrr8]], %bb.6
  ; CHECK-NEXT:   [[PHI10:%[0-9]+]]:fpr64 = PHI [[FADDDrr14]], %bb.1, [[FADDDrr11]], %bb.6
  ; CHECK-NEXT:   [[FMULDrr:%[0-9]+]]:fpr64 = FMULDrr [[PHI9]], [[PHI10]], implicit $fpcr
  ; CHECK-NEXT:   $d0 = COPY [[FMULDrr]]
  ; CHECK-NEXT:   RET_ReallyLR implicit $d0
  bb.0.entry:
    liveins: $x0, $x1
    ; %10 is the value the loop counter is compared against in bb.1.
    ; %11 is both the counter's initial value and its per-iteration increment.
    ; %20 seeds the floating-point recurrence and is also an operand of its
    ; first add in every iteration.
    %10:gpr64 = COPY $x0
    %11:gpr64 = COPY $x1
    %20:fpr64 = FMOVDi 1

  bb.1:
    ; Loop-carried values: the counter (%12 -> %13) and %24, which takes the
    ; previous iteration's %21.
    %12:gpr64 = PHI %11, %bb.0, %13, %bb.1
    %24:fpr64 = PHI %20, %bb.0, %21, %bb.1
    %13:gpr64 = ADDXrr %12, %11
    ; Sets $nzcv for the loop branch at the end of the block.
    dead $xzr = SUBSXrr %10, %13, implicit-def $nzcv
    ; Chain of three dependent adds; only %21 is carried to the next iteration.
    %21:fpr64 = FADDDrr %20, %24, implicit $fpcr
    %22:fpr64 = FADDDrr %21, %24, implicit $fpcr
    %23:fpr64 = FADDDrr %22, %24, implicit $fpcr
    Bcc 1, %bb.1, implicit $nzcv
    B %bb.2

  bb.2:
    ; The result combines the first (%21) and last (%23) value of the add chain
    ; from the final iteration.
    %25:fpr64 = FMULDrr %21, %23, implicit $fpcr
    $d0 = COPY %25
    RET_ReallyLR implicit $d0
...