1# NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py 2# RUN: llc -mtriple=amdgcn-mesa-mesa3d -mcpu=hawaii -run-pass=legalizer -verify-machineinstrs -o - %s | FileCheck -check-prefix=GFX7 %s 3 4--- | 5 6 define <2 x i16> @and_v2i16(<2 x i16> %a, <2 x i16> %b) #0 { 7 %and = and <2 x i16> %a, %b 8 ret <2 x i16> %and 9 } 10 11 define <3 x i16> @add_v3i16(<3 x i16> %a, <3 x i16> %b) #0 { 12 %add = add <3 x i16> %a, %b 13 ret <3 x i16> %add 14 } 15 16 define <3 x i16> @shl_v3i16(<3 x i16> %a, <3 x i16> %b) #0 { 17 %shl = shl <3 x i16> %a, %b 18 ret <3 x i16> %shl 19 } 20 21 define <4 x half> @fma_v4f16(<4 x half> %a, <4 x half> %b, <4 x half> %c) { 22 %fma = call <4 x half> @llvm.fma.v4f16(<4 x half> %a, <4 x half> %b, <4 x half> %c) 23 ret <4 x half> %fma 24 } 25 26 define amdgpu_ps <5 x half> @maxnum_v5i16(<5 x half> %a, <5 x half> %b) { 27 %fma = call <5 x half> @llvm.maxnum.v5f16(<5 x half> %a, <5 x half> %b) 28 ret <5 x half> %fma 29 } 30 31 declare <4 x half> @llvm.fma.v4f16(<4 x half>, <4 x half>, <4 x half>) 32 declare <5 x half> @llvm.maxnum.v5f16(<5 x half>, <5 x half>) 33... 34 35--- 36name: and_v2i16 37body: | 38 bb.1: 39 liveins: $vgpr0, $vgpr1, $vgpr2, $vgpr3 40 41 ; GFX7-LABEL: name: and_v2i16 42 ; GFX7: liveins: $vgpr0, $vgpr1, $vgpr2, $vgpr3 43 ; GFX7-NEXT: {{ $}} 44 ; GFX7-NEXT: [[COPY:%[0-9]+]]:_(s32) = COPY $vgpr0 45 ; GFX7-NEXT: [[COPY1:%[0-9]+]]:_(s32) = COPY $vgpr1 46 ; GFX7-NEXT: [[BUILD_VECTOR:%[0-9]+]]:_(<2 x s32>) = G_BUILD_VECTOR [[COPY]](s32), [[COPY1]](s32) 47 ; GFX7-NEXT: [[TRUNC:%[0-9]+]]:_(<2 x s16>) = G_TRUNC [[BUILD_VECTOR]](<2 x s32>) 48 ; GFX7-NEXT: [[COPY2:%[0-9]+]]:_(s32) = COPY $vgpr2 49 ; GFX7-NEXT: [[COPY3:%[0-9]+]]:_(s32) = COPY $vgpr3 50 ; GFX7-NEXT: [[BUILD_VECTOR1:%[0-9]+]]:_(<2 x s32>) = G_BUILD_VECTOR [[COPY2]](s32), [[COPY3]](s32) 51 ; GFX7-NEXT: [[TRUNC1:%[0-9]+]]:_(<2 x s16>) = G_TRUNC [[BUILD_VECTOR1]](<2 x s32>) 52 ; GFX7-NEXT: [[AND:%[0-9]+]]:_(<2 x s16>) = G_AND [[TRUNC]], [[TRUNC1]] 53 ; GFX7-NEXT: [[BITCAST:%[0-9]+]]:_(s32) = G_BITCAST [[AND]](<2 x s16>) 54 ; GFX7-NEXT: [[C:%[0-9]+]]:_(s32) = G_CONSTANT i32 16 55 ; GFX7-NEXT: [[LSHR:%[0-9]+]]:_(s32) = G_LSHR [[BITCAST]], [[C]](s32) 56 ; GFX7-NEXT: $vgpr0 = COPY [[BITCAST]](s32) 57 ; GFX7-NEXT: $vgpr1 = COPY [[LSHR]](s32) 58 ; GFX7-NEXT: SI_RETURN implicit $vgpr0, implicit $vgpr1 59 %3:_(s32) = COPY $vgpr0 60 %4:_(s32) = COPY $vgpr1 61 %5:_(<2 x s32>) = G_BUILD_VECTOR %3(s32), %4(s32) 62 %0:_(<2 x s16>) = G_TRUNC %5(<2 x s32>) 63 %6:_(s32) = COPY $vgpr2 64 %7:_(s32) = COPY $vgpr3 65 %8:_(<2 x s32>) = G_BUILD_VECTOR %6(s32), %7(s32) 66 %1:_(<2 x s16>) = G_TRUNC %8(<2 x s32>) 67 %9:_(<2 x s16>) = G_AND %0, %1 68 %13:_(s16), %14:_(s16) = G_UNMERGE_VALUES %9(<2 x s16>) 69 %11:_(s32) = G_ANYEXT %13(s16) 70 %12:_(s32) = G_ANYEXT %14(s16) 71 $vgpr0 = COPY %11(s32) 72 $vgpr1 = COPY %12(s32) 73 SI_RETURN implicit $vgpr0, implicit $vgpr1 74 75... 76 77--- 78name: add_v3i16 79body: | 80 bb.1: 81 liveins: $vgpr0, $vgpr1, $vgpr2, $vgpr3, $vgpr4, $vgpr5 82 83 ; GFX7-LABEL: name: add_v3i16 84 ; GFX7: liveins: $vgpr0, $vgpr1, $vgpr2, $vgpr3, $vgpr4, $vgpr5 85 ; GFX7-NEXT: {{ $}} 86 ; GFX7-NEXT: [[COPY:%[0-9]+]]:_(s32) = COPY $vgpr0 87 ; GFX7-NEXT: [[COPY1:%[0-9]+]]:_(s32) = COPY $vgpr1 88 ; GFX7-NEXT: [[COPY2:%[0-9]+]]:_(s32) = COPY $vgpr2 89 ; GFX7-NEXT: [[COPY3:%[0-9]+]]:_(s32) = COPY $vgpr3 90 ; GFX7-NEXT: [[COPY4:%[0-9]+]]:_(s32) = COPY $vgpr4 91 ; GFX7-NEXT: [[COPY5:%[0-9]+]]:_(s32) = COPY $vgpr5 92 ; GFX7-NEXT: [[ADD:%[0-9]+]]:_(s32) = G_ADD [[COPY]], [[COPY3]] 93 ; GFX7-NEXT: [[ADD1:%[0-9]+]]:_(s32) = G_ADD [[COPY1]], [[COPY4]] 94 ; GFX7-NEXT: [[ADD2:%[0-9]+]]:_(s32) = G_ADD [[COPY2]], [[COPY5]] 95 ; GFX7-NEXT: $vgpr0 = COPY [[ADD]](s32) 96 ; GFX7-NEXT: $vgpr1 = COPY [[ADD1]](s32) 97 ; GFX7-NEXT: $vgpr2 = COPY [[ADD2]](s32) 98 ; GFX7-NEXT: SI_RETURN implicit $vgpr0, implicit $vgpr1, implicit $vgpr2 99 %3:_(s32) = COPY $vgpr0 100 %4:_(s32) = COPY $vgpr1 101 %5:_(s32) = COPY $vgpr2 102 %6:_(<3 x s32>) = G_BUILD_VECTOR %3(s32), %4(s32), %5(s32) 103 %0:_(<3 x s16>) = G_TRUNC %6(<3 x s32>) 104 %7:_(s32) = COPY $vgpr3 105 %8:_(s32) = COPY $vgpr4 106 %9:_(s32) = COPY $vgpr5 107 %10:_(<3 x s32>) = G_BUILD_VECTOR %7(s32), %8(s32), %9(s32) 108 %1:_(<3 x s16>) = G_TRUNC %10(<3 x s32>) 109 %11:_(<3 x s16>) = G_ADD %0, %1 110 %16:_(s16), %17:_(s16), %18:_(s16) = G_UNMERGE_VALUES %11(<3 x s16>) 111 %13:_(s32) = G_ANYEXT %16(s16) 112 %14:_(s32) = G_ANYEXT %17(s16) 113 %15:_(s32) = G_ANYEXT %18(s16) 114 $vgpr0 = COPY %13(s32) 115 $vgpr1 = COPY %14(s32) 116 $vgpr2 = COPY %15(s32) 117 SI_RETURN implicit $vgpr0, implicit $vgpr1, implicit $vgpr2 118 119... 120 121--- 122name: shl_v3i16 123body: | 124 bb.1: 125 liveins: $vgpr0, $vgpr1, $vgpr2, $vgpr3, $vgpr4, $vgpr5 126 127 ; GFX7-LABEL: name: shl_v3i16 128 ; GFX7: liveins: $vgpr0, $vgpr1, $vgpr2, $vgpr3, $vgpr4, $vgpr5 129 ; GFX7-NEXT: {{ $}} 130 ; GFX7-NEXT: [[COPY:%[0-9]+]]:_(s32) = COPY $vgpr0 131 ; GFX7-NEXT: [[COPY1:%[0-9]+]]:_(s32) = COPY $vgpr1 132 ; GFX7-NEXT: [[COPY2:%[0-9]+]]:_(s32) = COPY $vgpr2 133 ; GFX7-NEXT: [[COPY3:%[0-9]+]]:_(s32) = COPY $vgpr3 134 ; GFX7-NEXT: [[COPY4:%[0-9]+]]:_(s32) = COPY $vgpr4 135 ; GFX7-NEXT: [[COPY5:%[0-9]+]]:_(s32) = COPY $vgpr5 136 ; GFX7-NEXT: [[C:%[0-9]+]]:_(s32) = G_CONSTANT i32 65535 137 ; GFX7-NEXT: [[AND:%[0-9]+]]:_(s32) = G_AND [[COPY3]], [[C]] 138 ; GFX7-NEXT: [[SHL:%[0-9]+]]:_(s32) = G_SHL [[COPY]], [[AND]](s32) 139 ; GFX7-NEXT: [[AND1:%[0-9]+]]:_(s32) = G_AND [[COPY4]], [[C]] 140 ; GFX7-NEXT: [[SHL1:%[0-9]+]]:_(s32) = G_SHL [[COPY1]], [[AND1]](s32) 141 ; GFX7-NEXT: [[AND2:%[0-9]+]]:_(s32) = G_AND [[COPY5]], [[C]] 142 ; GFX7-NEXT: [[SHL2:%[0-9]+]]:_(s32) = G_SHL [[COPY2]], [[AND2]](s32) 143 ; GFX7-NEXT: $vgpr0 = COPY [[SHL]](s32) 144 ; GFX7-NEXT: $vgpr1 = COPY [[SHL1]](s32) 145 ; GFX7-NEXT: $vgpr2 = COPY [[SHL2]](s32) 146 ; GFX7-NEXT: SI_RETURN implicit $vgpr0, implicit $vgpr1, implicit $vgpr2 147 %3:_(s32) = COPY $vgpr0 148 %4:_(s32) = COPY $vgpr1 149 %5:_(s32) = COPY $vgpr2 150 %6:_(<3 x s32>) = G_BUILD_VECTOR %3(s32), %4(s32), %5(s32) 151 %0:_(<3 x s16>) = G_TRUNC %6(<3 x s32>) 152 %7:_(s32) = COPY $vgpr3 153 %8:_(s32) = COPY $vgpr4 154 %9:_(s32) = COPY $vgpr5 155 %10:_(<3 x s32>) = G_BUILD_VECTOR %7(s32), %8(s32), %9(s32) 156 %1:_(<3 x s16>) = G_TRUNC %10(<3 x s32>) 157 %11:_(<3 x s16>) = G_SHL %0, %1(<3 x s16>) 158 %16:_(s16), %17:_(s16), %18:_(s16) = G_UNMERGE_VALUES %11(<3 x s16>) 159 %13:_(s32) = G_ANYEXT %16(s16) 160 %14:_(s32) = G_ANYEXT %17(s16) 161 %15:_(s32) = G_ANYEXT %18(s16) 162 $vgpr0 = COPY %13(s32) 163 $vgpr1 = COPY %14(s32) 164 $vgpr2 = COPY %15(s32) 165 SI_RETURN implicit $vgpr0, implicit $vgpr1, implicit $vgpr2 166 167... 168 169--- 170name: fma_v4f16 171body: | 172 bb.1: 173 liveins: $vgpr0, $vgpr1, $vgpr2, $vgpr3, $vgpr4, $vgpr5, $vgpr6, $vgpr7, $vgpr8, $vgpr9, $vgpr10, $vgpr11 174 175 ; GFX7-LABEL: name: fma_v4f16 176 ; GFX7: liveins: $vgpr0, $vgpr1, $vgpr2, $vgpr3, $vgpr4, $vgpr5, $vgpr6, $vgpr7, $vgpr8, $vgpr9, $vgpr10, $vgpr11 177 ; GFX7-NEXT: {{ $}} 178 ; GFX7-NEXT: [[COPY:%[0-9]+]]:_(s32) = COPY $vgpr0 179 ; GFX7-NEXT: [[COPY1:%[0-9]+]]:_(s32) = COPY $vgpr1 180 ; GFX7-NEXT: [[COPY2:%[0-9]+]]:_(s32) = COPY $vgpr2 181 ; GFX7-NEXT: [[COPY3:%[0-9]+]]:_(s32) = COPY $vgpr3 182 ; GFX7-NEXT: [[COPY4:%[0-9]+]]:_(s32) = COPY $vgpr4 183 ; GFX7-NEXT: [[COPY5:%[0-9]+]]:_(s32) = COPY $vgpr5 184 ; GFX7-NEXT: [[COPY6:%[0-9]+]]:_(s32) = COPY $vgpr6 185 ; GFX7-NEXT: [[COPY7:%[0-9]+]]:_(s32) = COPY $vgpr7 186 ; GFX7-NEXT: [[COPY8:%[0-9]+]]:_(s32) = COPY $vgpr8 187 ; GFX7-NEXT: [[COPY9:%[0-9]+]]:_(s32) = COPY $vgpr9 188 ; GFX7-NEXT: [[COPY10:%[0-9]+]]:_(s32) = COPY $vgpr10 189 ; GFX7-NEXT: [[COPY11:%[0-9]+]]:_(s32) = COPY $vgpr11 190 ; GFX7-NEXT: [[TRUNC:%[0-9]+]]:_(s16) = G_TRUNC [[COPY]](s32) 191 ; GFX7-NEXT: [[TRUNC1:%[0-9]+]]:_(s16) = G_TRUNC [[COPY1]](s32) 192 ; GFX7-NEXT: [[TRUNC2:%[0-9]+]]:_(s16) = G_TRUNC [[COPY2]](s32) 193 ; GFX7-NEXT: [[TRUNC3:%[0-9]+]]:_(s16) = G_TRUNC [[COPY3]](s32) 194 ; GFX7-NEXT: [[TRUNC4:%[0-9]+]]:_(s16) = G_TRUNC [[COPY4]](s32) 195 ; GFX7-NEXT: [[TRUNC5:%[0-9]+]]:_(s16) = G_TRUNC [[COPY5]](s32) 196 ; GFX7-NEXT: [[TRUNC6:%[0-9]+]]:_(s16) = G_TRUNC [[COPY6]](s32) 197 ; GFX7-NEXT: [[TRUNC7:%[0-9]+]]:_(s16) = G_TRUNC [[COPY7]](s32) 198 ; GFX7-NEXT: [[TRUNC8:%[0-9]+]]:_(s16) = G_TRUNC [[COPY8]](s32) 199 ; GFX7-NEXT: [[TRUNC9:%[0-9]+]]:_(s16) = G_TRUNC [[COPY9]](s32) 200 ; GFX7-NEXT: [[TRUNC10:%[0-9]+]]:_(s16) = G_TRUNC [[COPY10]](s32) 201 ; GFX7-NEXT: [[TRUNC11:%[0-9]+]]:_(s16) = G_TRUNC [[COPY11]](s32) 202 ; GFX7-NEXT: [[FPEXT:%[0-9]+]]:_(s32) = G_FPEXT [[TRUNC]](s16) 203 ; GFX7-NEXT: [[FPEXT1:%[0-9]+]]:_(s32) = G_FPEXT [[TRUNC4]](s16) 204 ; GFX7-NEXT: [[FPEXT2:%[0-9]+]]:_(s32) = G_FPEXT [[TRUNC8]](s16) 205 ; GFX7-NEXT: [[FMA:%[0-9]+]]:_(s32) = G_FMA [[FPEXT]], [[FPEXT1]], [[FPEXT2]] 206 ; GFX7-NEXT: [[FPTRUNC:%[0-9]+]]:_(s16) = G_FPTRUNC [[FMA]](s32) 207 ; GFX7-NEXT: [[FPEXT3:%[0-9]+]]:_(s32) = G_FPEXT [[TRUNC1]](s16) 208 ; GFX7-NEXT: [[FPEXT4:%[0-9]+]]:_(s32) = G_FPEXT [[TRUNC5]](s16) 209 ; GFX7-NEXT: [[FPEXT5:%[0-9]+]]:_(s32) = G_FPEXT [[TRUNC9]](s16) 210 ; GFX7-NEXT: [[FMA1:%[0-9]+]]:_(s32) = G_FMA [[FPEXT3]], [[FPEXT4]], [[FPEXT5]] 211 ; GFX7-NEXT: [[FPTRUNC1:%[0-9]+]]:_(s16) = G_FPTRUNC [[FMA1]](s32) 212 ; GFX7-NEXT: [[FPEXT6:%[0-9]+]]:_(s32) = G_FPEXT [[TRUNC2]](s16) 213 ; GFX7-NEXT: [[FPEXT7:%[0-9]+]]:_(s32) = G_FPEXT [[TRUNC6]](s16) 214 ; GFX7-NEXT: [[FPEXT8:%[0-9]+]]:_(s32) = G_FPEXT [[TRUNC10]](s16) 215 ; GFX7-NEXT: [[FMA2:%[0-9]+]]:_(s32) = G_FMA [[FPEXT6]], [[FPEXT7]], [[FPEXT8]] 216 ; GFX7-NEXT: [[FPTRUNC2:%[0-9]+]]:_(s16) = G_FPTRUNC [[FMA2]](s32) 217 ; GFX7-NEXT: [[FPEXT9:%[0-9]+]]:_(s32) = G_FPEXT [[TRUNC3]](s16) 218 ; GFX7-NEXT: [[FPEXT10:%[0-9]+]]:_(s32) = G_FPEXT [[TRUNC7]](s16) 219 ; GFX7-NEXT: [[FPEXT11:%[0-9]+]]:_(s32) = G_FPEXT [[TRUNC11]](s16) 220 ; GFX7-NEXT: [[FMA3:%[0-9]+]]:_(s32) = G_FMA [[FPEXT9]], [[FPEXT10]], [[FPEXT11]] 221 ; GFX7-NEXT: [[FPTRUNC3:%[0-9]+]]:_(s16) = G_FPTRUNC [[FMA3]](s32) 222 ; GFX7-NEXT: [[ANYEXT:%[0-9]+]]:_(s32) = G_ANYEXT [[FPTRUNC]](s16) 223 ; GFX7-NEXT: [[ANYEXT1:%[0-9]+]]:_(s32) = G_ANYEXT [[FPTRUNC1]](s16) 224 ; GFX7-NEXT: [[ANYEXT2:%[0-9]+]]:_(s32) = G_ANYEXT [[FPTRUNC2]](s16) 225 ; GFX7-NEXT: [[ANYEXT3:%[0-9]+]]:_(s32) = G_ANYEXT [[FPTRUNC3]](s16) 226 ; GFX7-NEXT: $vgpr0 = COPY [[ANYEXT]](s32) 227 ; GFX7-NEXT: $vgpr1 = COPY [[ANYEXT1]](s32) 228 ; GFX7-NEXT: $vgpr2 = COPY [[ANYEXT2]](s32) 229 ; GFX7-NEXT: $vgpr3 = COPY [[ANYEXT3]](s32) 230 ; GFX7-NEXT: SI_RETURN implicit $vgpr0, implicit $vgpr1, implicit $vgpr2, implicit $vgpr3 231 %4:_(s32) = COPY $vgpr0 232 %5:_(s32) = COPY $vgpr1 233 %6:_(s32) = COPY $vgpr2 234 %7:_(s32) = COPY $vgpr3 235 %8:_(<4 x s32>) = G_BUILD_VECTOR %4(s32), %5(s32), %6(s32), %7(s32) 236 %0:_(<4 x s16>) = G_TRUNC %8(<4 x s32>) 237 %9:_(s32) = COPY $vgpr4 238 %10:_(s32) = COPY $vgpr5 239 %11:_(s32) = COPY $vgpr6 240 %12:_(s32) = COPY $vgpr7 241 %13:_(<4 x s32>) = G_BUILD_VECTOR %9(s32), %10(s32), %11(s32), %12(s32) 242 %1:_(<4 x s16>) = G_TRUNC %13(<4 x s32>) 243 %14:_(s32) = COPY $vgpr8 244 %15:_(s32) = COPY $vgpr9 245 %16:_(s32) = COPY $vgpr10 246 %17:_(s32) = COPY $vgpr11 247 %18:_(<4 x s32>) = G_BUILD_VECTOR %14(s32), %15(s32), %16(s32), %17(s32) 248 %2:_(<4 x s16>) = G_TRUNC %18(<4 x s32>) 249 %19:_(<4 x s16>) = G_FMA %0, %1, %2 250 %25:_(s16), %26:_(s16), %27:_(s16), %28:_(s16) = G_UNMERGE_VALUES %19(<4 x s16>) 251 %21:_(s32) = G_ANYEXT %25(s16) 252 %22:_(s32) = G_ANYEXT %26(s16) 253 %23:_(s32) = G_ANYEXT %27(s16) 254 %24:_(s32) = G_ANYEXT %28(s16) 255 $vgpr0 = COPY %21(s32) 256 $vgpr1 = COPY %22(s32) 257 $vgpr2 = COPY %23(s32) 258 $vgpr3 = COPY %24(s32) 259 SI_RETURN implicit $vgpr0, implicit $vgpr1, implicit $vgpr2, implicit $vgpr3 260... 261 262--- 263name: maxnum_v5i16 264body: | 265 bb.1: 266 liveins: $vgpr0, $vgpr1, $vgpr2, $vgpr3, $vgpr4, $vgpr5, $vgpr6, $vgpr7, $vgpr8, $vgpr9 267 268 ; GFX7-LABEL: name: maxnum_v5i16 269 ; GFX7: liveins: $vgpr0, $vgpr1, $vgpr2, $vgpr3, $vgpr4, $vgpr5, $vgpr6, $vgpr7, $vgpr8, $vgpr9 270 ; GFX7-NEXT: {{ $}} 271 ; GFX7-NEXT: [[COPY:%[0-9]+]]:_(s32) = COPY $vgpr0 272 ; GFX7-NEXT: [[COPY1:%[0-9]+]]:_(s32) = COPY $vgpr1 273 ; GFX7-NEXT: [[COPY2:%[0-9]+]]:_(s32) = COPY $vgpr2 274 ; GFX7-NEXT: [[COPY3:%[0-9]+]]:_(s32) = COPY $vgpr3 275 ; GFX7-NEXT: [[COPY4:%[0-9]+]]:_(s32) = COPY $vgpr4 276 ; GFX7-NEXT: [[COPY5:%[0-9]+]]:_(s32) = COPY $vgpr5 277 ; GFX7-NEXT: [[COPY6:%[0-9]+]]:_(s32) = COPY $vgpr6 278 ; GFX7-NEXT: [[COPY7:%[0-9]+]]:_(s32) = COPY $vgpr7 279 ; GFX7-NEXT: [[COPY8:%[0-9]+]]:_(s32) = COPY $vgpr8 280 ; GFX7-NEXT: [[COPY9:%[0-9]+]]:_(s32) = COPY $vgpr9 281 ; GFX7-NEXT: [[TRUNC:%[0-9]+]]:_(s16) = G_TRUNC [[COPY]](s32) 282 ; GFX7-NEXT: [[TRUNC1:%[0-9]+]]:_(s16) = G_TRUNC [[COPY1]](s32) 283 ; GFX7-NEXT: [[TRUNC2:%[0-9]+]]:_(s16) = G_TRUNC [[COPY2]](s32) 284 ; GFX7-NEXT: [[TRUNC3:%[0-9]+]]:_(s16) = G_TRUNC [[COPY3]](s32) 285 ; GFX7-NEXT: [[TRUNC4:%[0-9]+]]:_(s16) = G_TRUNC [[COPY4]](s32) 286 ; GFX7-NEXT: [[TRUNC5:%[0-9]+]]:_(s16) = G_TRUNC [[COPY5]](s32) 287 ; GFX7-NEXT: [[TRUNC6:%[0-9]+]]:_(s16) = G_TRUNC [[COPY6]](s32) 288 ; GFX7-NEXT: [[TRUNC7:%[0-9]+]]:_(s16) = G_TRUNC [[COPY7]](s32) 289 ; GFX7-NEXT: [[TRUNC8:%[0-9]+]]:_(s16) = G_TRUNC [[COPY8]](s32) 290 ; GFX7-NEXT: [[TRUNC9:%[0-9]+]]:_(s16) = G_TRUNC [[COPY9]](s32) 291 ; GFX7-NEXT: [[FPEXT:%[0-9]+]]:_(s32) = G_FPEXT [[TRUNC]](s16) 292 ; GFX7-NEXT: [[FPEXT1:%[0-9]+]]:_(s32) = G_FPEXT [[TRUNC5]](s16) 293 ; GFX7-NEXT: [[FMAXNUM_IEEE:%[0-9]+]]:_(s32) = G_FMAXNUM_IEEE [[FPEXT]], [[FPEXT1]] 294 ; GFX7-NEXT: [[FPTRUNC:%[0-9]+]]:_(s16) = G_FPTRUNC [[FMAXNUM_IEEE]](s32) 295 ; GFX7-NEXT: [[FPEXT2:%[0-9]+]]:_(s32) = G_FPEXT [[TRUNC1]](s16) 296 ; GFX7-NEXT: [[FPEXT3:%[0-9]+]]:_(s32) = G_FPEXT [[TRUNC6]](s16) 297 ; GFX7-NEXT: [[FMAXNUM_IEEE1:%[0-9]+]]:_(s32) = G_FMAXNUM_IEEE [[FPEXT2]], [[FPEXT3]] 298 ; GFX7-NEXT: [[FPTRUNC1:%[0-9]+]]:_(s16) = G_FPTRUNC [[FMAXNUM_IEEE1]](s32) 299 ; GFX7-NEXT: [[FPEXT4:%[0-9]+]]:_(s32) = G_FPEXT [[TRUNC2]](s16) 300 ; GFX7-NEXT: [[FPEXT5:%[0-9]+]]:_(s32) = G_FPEXT [[TRUNC7]](s16) 301 ; GFX7-NEXT: [[FMAXNUM_IEEE2:%[0-9]+]]:_(s32) = G_FMAXNUM_IEEE [[FPEXT4]], [[FPEXT5]] 302 ; GFX7-NEXT: [[FPTRUNC2:%[0-9]+]]:_(s16) = G_FPTRUNC [[FMAXNUM_IEEE2]](s32) 303 ; GFX7-NEXT: [[FPEXT6:%[0-9]+]]:_(s32) = G_FPEXT [[TRUNC3]](s16) 304 ; GFX7-NEXT: [[FPEXT7:%[0-9]+]]:_(s32) = G_FPEXT [[TRUNC8]](s16) 305 ; GFX7-NEXT: [[FMAXNUM_IEEE3:%[0-9]+]]:_(s32) = G_FMAXNUM_IEEE [[FPEXT6]], [[FPEXT7]] 306 ; GFX7-NEXT: [[FPTRUNC3:%[0-9]+]]:_(s16) = G_FPTRUNC [[FMAXNUM_IEEE3]](s32) 307 ; GFX7-NEXT: [[FPEXT8:%[0-9]+]]:_(s32) = G_FPEXT [[TRUNC4]](s16) 308 ; GFX7-NEXT: [[FPEXT9:%[0-9]+]]:_(s32) = G_FPEXT [[TRUNC9]](s16) 309 ; GFX7-NEXT: [[FMAXNUM_IEEE4:%[0-9]+]]:_(s32) = G_FMAXNUM_IEEE [[FPEXT8]], [[FPEXT9]] 310 ; GFX7-NEXT: [[FPTRUNC4:%[0-9]+]]:_(s16) = G_FPTRUNC [[FMAXNUM_IEEE4]](s32) 311 ; GFX7-NEXT: [[ANYEXT:%[0-9]+]]:_(s32) = G_ANYEXT [[FPTRUNC]](s16) 312 ; GFX7-NEXT: [[ANYEXT1:%[0-9]+]]:_(s32) = G_ANYEXT [[FPTRUNC1]](s16) 313 ; GFX7-NEXT: [[ANYEXT2:%[0-9]+]]:_(s32) = G_ANYEXT [[FPTRUNC2]](s16) 314 ; GFX7-NEXT: [[ANYEXT3:%[0-9]+]]:_(s32) = G_ANYEXT [[FPTRUNC3]](s16) 315 ; GFX7-NEXT: [[ANYEXT4:%[0-9]+]]:_(s32) = G_ANYEXT [[FPTRUNC4]](s16) 316 ; GFX7-NEXT: $vgpr0 = COPY [[ANYEXT]](s32) 317 ; GFX7-NEXT: $vgpr1 = COPY [[ANYEXT1]](s32) 318 ; GFX7-NEXT: $vgpr2 = COPY [[ANYEXT2]](s32) 319 ; GFX7-NEXT: $vgpr3 = COPY [[ANYEXT3]](s32) 320 ; GFX7-NEXT: $vgpr4 = COPY [[ANYEXT4]](s32) 321 ; GFX7-NEXT: SI_RETURN_TO_EPILOG implicit $vgpr0, implicit $vgpr1, implicit $vgpr2, implicit $vgpr3, implicit $vgpr4 322 %2:_(s32) = COPY $vgpr0 323 %3:_(s32) = COPY $vgpr1 324 %4:_(s32) = COPY $vgpr2 325 %5:_(s32) = COPY $vgpr3 326 %6:_(s32) = COPY $vgpr4 327 %7:_(<5 x s32>) = G_BUILD_VECTOR %2(s32), %3(s32), %4(s32), %5(s32), %6(s32) 328 %0:_(<5 x s16>) = G_TRUNC %7(<5 x s32>) 329 %8:_(s32) = COPY $vgpr5 330 %9:_(s32) = COPY $vgpr6 331 %10:_(s32) = COPY $vgpr7 332 %11:_(s32) = COPY $vgpr8 333 %12:_(s32) = COPY $vgpr9 334 %13:_(<5 x s32>) = G_BUILD_VECTOR %8(s32), %9(s32), %10(s32), %11(s32), %12(s32) 335 %1:_(<5 x s16>) = G_TRUNC %13(<5 x s32>) 336 %15:_(<5 x s16>) = G_FMAXNUM %0, %1 337 %21:_(s16), %22:_(s16), %23:_(s16), %24:_(s16), %25:_(s16) = G_UNMERGE_VALUES %15(<5 x s16>) 338 %16:_(s32) = G_ANYEXT %21(s16) 339 %17:_(s32) = G_ANYEXT %22(s16) 340 %18:_(s32) = G_ANYEXT %23(s16) 341 %19:_(s32) = G_ANYEXT %24(s16) 342 %20:_(s32) = G_ANYEXT %25(s16) 343 $vgpr0 = COPY %16(s32) 344 $vgpr1 = COPY %17(s32) 345 $vgpr2 = COPY %18(s32) 346 $vgpr3 = COPY %19(s32) 347 $vgpr4 = COPY %20(s32) 348 SI_RETURN_TO_EPILOG implicit $vgpr0, implicit $vgpr1, implicit $vgpr2, implicit $vgpr3, implicit $vgpr4 349... 350