1 #include "ARMBaseInstrInfo.h" 2 #include "ARMSubtarget.h" 3 #include "ARMTargetMachine.h" 4 #include "llvm/Support/TargetRegistry.h" 5 #include "llvm/Support/TargetSelect.h" 6 #include "llvm/Target/TargetMachine.h" 7 #include "llvm/Target/TargetOptions.h" 8 9 #include "gtest/gtest.h" 10 11 using namespace llvm; 12 13 // Test for instructions that aren't immediately obviously valid within a 14 // tail-predicated loop. This should be marked up in their tablegen 15 // descriptions. Currently we, conservatively, disallow: 16 // - cross beat carries. 17 // - narrowing of results. 18 // - top/bottom operations. 19 // - complex operations. 20 // - horizontal operations. 21 // - byte swapping. 22 // - interleaved memory instructions. 23 // TODO: Add to this list once we can handle them safely. 24 TEST(MachineInstrValidTailPredication, IsCorrect) { 25 26 using namespace ARM; 27 28 auto IsValidTPOpcode = [](unsigned Opcode) { 29 switch (Opcode) { 30 default: 31 return false; 32 case MVE_ASRLi: 33 case MVE_ASRLr: 34 case MVE_LSRL: 35 case MVE_SQRSHR: 36 case MVE_SQSHL: 37 case MVE_SRSHR: 38 case MVE_UQRSHL: 39 case MVE_UQSHL: 40 case MVE_URSHR: 41 case MVE_VABDf16: 42 case MVE_VABDf32: 43 case MVE_VABDs16: 44 case MVE_VABDs32: 45 case MVE_VABDs8: 46 case MVE_VABDu16: 47 case MVE_VABDu32: 48 case MVE_VABDu8: 49 case MVE_VABSf16: 50 case MVE_VABSf32: 51 case MVE_VABSs16: 52 case MVE_VABSs32: 53 case MVE_VABSs8: 54 case MVE_VADD_qr_f16: 55 case MVE_VADD_qr_f32: 56 case MVE_VADD_qr_i16: 57 case MVE_VADD_qr_i32: 58 case MVE_VADD_qr_i8: 59 case MVE_VADDf16: 60 case MVE_VADDf32: 61 case MVE_VADDi16: 62 case MVE_VADDi32: 63 case MVE_VADDi8: 64 case MVE_VAND: 65 case MVE_VBIC: 66 case MVE_VBICIZ0v4i32: 67 case MVE_VBICIZ0v8i16: 68 case MVE_VBICIZ16v4i32: 69 case MVE_VBICIZ24v4i32: 70 case MVE_VBICIZ8v4i32: 71 case MVE_VBICIZ8v8i16: 72 case MVE_VBRSR16: 73 case MVE_VBRSR32: 74 case MVE_VBRSR8: 75 case MVE_VCLSs16: 76 case MVE_VCLSs32: 77 case MVE_VCLSs8: 78 case MVE_VCLZs16: 79 case MVE_VCLZs32: 80 case MVE_VCLZs8: 81 case MVE_VCMPf16: 82 case MVE_VCMPf16r: 83 case MVE_VCMPf32: 84 case MVE_VCMPf32r: 85 case MVE_VCMPi16: 86 case MVE_VCMPi16r: 87 case MVE_VCMPi32: 88 case MVE_VCMPi32r: 89 case MVE_VCMPi8: 90 case MVE_VCMPi8r: 91 case MVE_VCMPs16: 92 case MVE_VCMPs16r: 93 case MVE_VCMPs32: 94 case MVE_VCMPs32r: 95 case MVE_VCMPs8: 96 case MVE_VCMPs8r: 97 case MVE_VCMPu16: 98 case MVE_VCMPu16r: 99 case MVE_VCMPu32: 100 case MVE_VCMPu32r: 101 case MVE_VCMPu8: 102 case MVE_VCMPu8r: 103 case MVE_VCTP16: 104 case MVE_VCTP32: 105 case MVE_VCTP64: 106 case MVE_VCTP8: 107 case MVE_VCVTf16s16_fix: 108 case MVE_VCVTf16s16n: 109 case MVE_VCVTf16u16_fix: 110 case MVE_VCVTf16u16n: 111 case MVE_VCVTf32s32_fix: 112 case MVE_VCVTf32s32n: 113 case MVE_VCVTf32u32_fix: 114 case MVE_VCVTf32u32n: 115 case MVE_VCVTs16f16_fix: 116 case MVE_VCVTs16f16a: 117 case MVE_VCVTs16f16m: 118 case MVE_VCVTs16f16n: 119 case MVE_VCVTs16f16p: 120 case MVE_VCVTs16f16z: 121 case MVE_VCVTs32f32_fix: 122 case MVE_VCVTs32f32a: 123 case MVE_VCVTs32f32m: 124 case MVE_VCVTs32f32n: 125 case MVE_VCVTs32f32p: 126 case MVE_VCVTs32f32z: 127 case MVE_VCVTu16f16_fix: 128 case MVE_VCVTu16f16a: 129 case MVE_VCVTu16f16m: 130 case MVE_VCVTu16f16n: 131 case MVE_VCVTu16f16p: 132 case MVE_VCVTu16f16z: 133 case MVE_VCVTu32f32_fix: 134 case MVE_VCVTu32f32a: 135 case MVE_VCVTu32f32m: 136 case MVE_VCVTu32f32n: 137 case MVE_VCVTu32f32p: 138 case MVE_VCVTu32f32z: 139 case MVE_VDDUPu16: 140 case MVE_VDDUPu32: 141 case MVE_VDDUPu8: 142 case MVE_VDUP16: 143 case MVE_VDUP32: 144 case MVE_VDUP8: 145 case MVE_VDWDUPu16: 146 case MVE_VDWDUPu32: 147 case MVE_VDWDUPu8: 148 case MVE_VEOR: 149 case MVE_VFMA_qr_Sf16: 150 case MVE_VFMA_qr_Sf32: 151 case MVE_VFMA_qr_f16: 152 case MVE_VFMA_qr_f32: 153 case MVE_VMLAS_qr_s16: 154 case MVE_VMLAS_qr_s32: 155 case MVE_VMLAS_qr_s8: 156 case MVE_VMLAS_qr_u16: 157 case MVE_VMLAS_qr_u32: 158 case MVE_VMLAS_qr_u8: 159 case MVE_VMLA_qr_s16: 160 case MVE_VMLA_qr_s32: 161 case MVE_VMLA_qr_s8: 162 case MVE_VMLA_qr_u16: 163 case MVE_VMLA_qr_u32: 164 case MVE_VMLA_qr_u8: 165 case MVE_VHADD_qr_s16: 166 case MVE_VHADD_qr_s32: 167 case MVE_VHADD_qr_s8: 168 case MVE_VHADD_qr_u16: 169 case MVE_VHADD_qr_u32: 170 case MVE_VHADD_qr_u8: 171 case MVE_VHADDs16: 172 case MVE_VHADDs32: 173 case MVE_VHADDs8: 174 case MVE_VHADDu16: 175 case MVE_VHADDu32: 176 case MVE_VHADDu8: 177 case MVE_VHSUB_qr_s16: 178 case MVE_VHSUB_qr_s32: 179 case MVE_VHSUB_qr_s8: 180 case MVE_VHSUB_qr_u16: 181 case MVE_VHSUB_qr_u32: 182 case MVE_VHSUB_qr_u8: 183 case MVE_VHSUBs16: 184 case MVE_VHSUBs32: 185 case MVE_VHSUBs8: 186 case MVE_VHSUBu16: 187 case MVE_VHSUBu32: 188 case MVE_VHSUBu8: 189 case MVE_VIDUPu16: 190 case MVE_VIDUPu32: 191 case MVE_VIDUPu8: 192 case MVE_VIWDUPu16: 193 case MVE_VIWDUPu32: 194 case MVE_VIWDUPu8: 195 case MVE_VLDRBS16: 196 case MVE_VLDRBS16_post: 197 case MVE_VLDRBS16_pre: 198 case MVE_VLDRBS16_rq: 199 case MVE_VLDRBS32: 200 case MVE_VLDRBS32_post: 201 case MVE_VLDRBS32_pre: 202 case MVE_VLDRBS32_rq: 203 case MVE_VLDRBU16: 204 case MVE_VLDRBU16_post: 205 case MVE_VLDRBU16_pre: 206 case MVE_VLDRBU16_rq: 207 case MVE_VLDRBU32: 208 case MVE_VLDRBU32_post: 209 case MVE_VLDRBU32_pre: 210 case MVE_VLDRBU32_rq: 211 case MVE_VLDRBU8: 212 case MVE_VLDRBU8_post: 213 case MVE_VLDRBU8_pre: 214 case MVE_VLDRBU8_rq: 215 case MVE_VLDRDU64_qi: 216 case MVE_VLDRDU64_qi_pre: 217 case MVE_VLDRDU64_rq: 218 case MVE_VLDRDU64_rq_u: 219 case MVE_VLDRHS32: 220 case MVE_VLDRHS32_post: 221 case MVE_VLDRHS32_pre: 222 case MVE_VLDRHS32_rq: 223 case MVE_VLDRHS32_rq_u: 224 case MVE_VLDRHU16: 225 case MVE_VLDRHU16_post: 226 case MVE_VLDRHU16_pre: 227 case MVE_VLDRHU16_rq: 228 case MVE_VLDRHU16_rq_u: 229 case MVE_VLDRHU32: 230 case MVE_VLDRHU32_post: 231 case MVE_VLDRHU32_pre: 232 case MVE_VLDRHU32_rq: 233 case MVE_VLDRHU32_rq_u: 234 case MVE_VLDRWU32: 235 case MVE_VLDRWU32_post: 236 case MVE_VLDRWU32_pre: 237 case MVE_VLDRWU32_qi: 238 case MVE_VLDRWU32_qi_pre: 239 case MVE_VLDRWU32_rq: 240 case MVE_VLDRWU32_rq_u: 241 case MVE_VMOVimmf32: 242 case MVE_VMOVimmi16: 243 case MVE_VMOVimmi32: 244 case MVE_VMOVimmi64: 245 case MVE_VMOVimmi8: 246 case MVE_VMUL_qr_f16: 247 case MVE_VMUL_qr_f32: 248 case MVE_VMUL_qr_i16: 249 case MVE_VMUL_qr_i32: 250 case MVE_VMUL_qr_i8: 251 case MVE_VMULf16: 252 case MVE_VMULf32: 253 case MVE_VMVN: 254 case MVE_VMVNimmi16: 255 case MVE_VMVNimmi32: 256 case MVE_VNEGf16: 257 case MVE_VNEGf32: 258 case MVE_VNEGs16: 259 case MVE_VNEGs32: 260 case MVE_VNEGs8: 261 case MVE_VORN: 262 case MVE_VORR: 263 case MVE_VORRIZ0v4i32: 264 case MVE_VORRIZ0v8i16: 265 case MVE_VORRIZ16v4i32: 266 case MVE_VORRIZ24v4i32: 267 case MVE_VORRIZ8v4i32: 268 case MVE_VORRIZ8v8i16: 269 case MVE_VPNOT: 270 case MVE_VPSEL: 271 case MVE_VPST: 272 case MVE_VPTv16i8: 273 case MVE_VPTv16i8r: 274 case MVE_VPTv16s8: 275 case MVE_VPTv16s8r: 276 case MVE_VPTv16u8: 277 case MVE_VPTv16u8r: 278 case MVE_VPTv4f32: 279 case MVE_VPTv4f32r: 280 case MVE_VPTv4i32: 281 case MVE_VPTv4i32r: 282 case MVE_VPTv4s32: 283 case MVE_VPTv4s32r: 284 case MVE_VPTv4u32: 285 case MVE_VPTv4u32r: 286 case MVE_VPTv8f16: 287 case MVE_VPTv8f16r: 288 case MVE_VPTv8i16: 289 case MVE_VPTv8i16r: 290 case MVE_VPTv8s16: 291 case MVE_VPTv8s16r: 292 case MVE_VPTv8u16: 293 case MVE_VPTv8u16r: 294 case MVE_VQABSs16: 295 case MVE_VQABSs32: 296 case MVE_VQABSs8: 297 case MVE_VQADD_qr_s16: 298 case MVE_VQADD_qr_s32: 299 case MVE_VQADD_qr_s8: 300 case MVE_VQADD_qr_u16: 301 case MVE_VQADD_qr_u32: 302 case MVE_VQADD_qr_u8: 303 case MVE_VQADDs16: 304 case MVE_VQADDs32: 305 case MVE_VQADDs8: 306 case MVE_VQADDu16: 307 case MVE_VQADDu32: 308 case MVE_VQADDu8: 309 case MVE_VQNEGs16: 310 case MVE_VQNEGs32: 311 case MVE_VQNEGs8: 312 case MVE_VQRSHL_by_vecs16: 313 case MVE_VQRSHL_by_vecs32: 314 case MVE_VQRSHL_by_vecs8: 315 case MVE_VQRSHL_by_vecu16: 316 case MVE_VQRSHL_by_vecu32: 317 case MVE_VQRSHL_by_vecu8: 318 case MVE_VQRSHL_qrs16: 319 case MVE_VQRSHL_qrs32: 320 case MVE_VQRSHL_qrs8: 321 case MVE_VQRSHL_qru16: 322 case MVE_VQRSHL_qru8: 323 case MVE_VQRSHL_qru32: 324 case MVE_VQSHLU_imms16: 325 case MVE_VQSHLU_imms32: 326 case MVE_VQSHLU_imms8: 327 case MVE_VQSHL_by_vecs16: 328 case MVE_VQSHL_by_vecs32: 329 case MVE_VQSHL_by_vecs8: 330 case MVE_VQSHL_by_vecu16: 331 case MVE_VQSHL_by_vecu32: 332 case MVE_VQSHL_by_vecu8: 333 case MVE_VQSHL_qrs16: 334 case MVE_VQSHL_qrs32: 335 case MVE_VQSHL_qrs8: 336 case MVE_VQSHL_qru16: 337 case MVE_VQSHL_qru32: 338 case MVE_VQSHL_qru8: 339 case MVE_VQSUB_qr_s16: 340 case MVE_VQSUB_qr_s32: 341 case MVE_VQSUB_qr_s8: 342 case MVE_VQSUB_qr_u16: 343 case MVE_VQSUB_qr_u32: 344 case MVE_VQSUB_qr_u8: 345 case MVE_VQSUBs16: 346 case MVE_VQSUBs32: 347 case MVE_VQSUBs8: 348 case MVE_VQSUBu16: 349 case MVE_VQSUBu32: 350 case MVE_VQSUBu8: 351 case MVE_VRHADDs16: 352 case MVE_VRHADDs32: 353 case MVE_VRHADDs8: 354 case MVE_VRHADDu16: 355 case MVE_VRHADDu32: 356 case MVE_VRHADDu8: 357 case MVE_VRINTf16A: 358 case MVE_VRINTf16M: 359 case MVE_VRINTf16N: 360 case MVE_VRINTf16P: 361 case MVE_VRINTf16X: 362 case MVE_VRINTf16Z: 363 case MVE_VRINTf32A: 364 case MVE_VRINTf32M: 365 case MVE_VRINTf32N: 366 case MVE_VRINTf32P: 367 case MVE_VRINTf32X: 368 case MVE_VRINTf32Z: 369 case MVE_VRSHL_by_vecs16: 370 case MVE_VRSHL_by_vecs32: 371 case MVE_VRSHL_by_vecs8: 372 case MVE_VRSHL_by_vecu16: 373 case MVE_VRSHL_by_vecu32: 374 case MVE_VRSHL_by_vecu8: 375 case MVE_VRSHL_qrs16: 376 case MVE_VRSHL_qrs32: 377 case MVE_VRSHL_qrs8: 378 case MVE_VRSHL_qru16: 379 case MVE_VRSHL_qru32: 380 case MVE_VRSHL_qru8: 381 case MVE_VRSHR_imms16: 382 case MVE_VRSHR_imms32: 383 case MVE_VRSHR_imms8: 384 case MVE_VRSHR_immu16: 385 case MVE_VRSHR_immu32: 386 case MVE_VRSHR_immu8: 387 case MVE_VSHL_by_vecs16: 388 case MVE_VSHL_by_vecs32: 389 case MVE_VSHL_by_vecs8: 390 case MVE_VSHL_by_vecu16: 391 case MVE_VSHL_by_vecu32: 392 case MVE_VSHL_by_vecu8: 393 case MVE_VSHL_immi16: 394 case MVE_VSHL_immi32: 395 case MVE_VSHL_immi8: 396 case MVE_VSHL_qrs16: 397 case MVE_VSHL_qrs32: 398 case MVE_VSHL_qrs8: 399 case MVE_VSHL_qru16: 400 case MVE_VSHL_qru32: 401 case MVE_VSHL_qru8: 402 case MVE_VSHR_imms16: 403 case MVE_VSHR_imms32: 404 case MVE_VSHR_imms8: 405 case MVE_VSHR_immu16: 406 case MVE_VSHR_immu32: 407 case MVE_VSHR_immu8: 408 case MVE_VSLIimm16: 409 case MVE_VSLIimm32: 410 case MVE_VSLIimm8: 411 case MVE_VSLIimms16: 412 case MVE_VSLIimms32: 413 case MVE_VSLIimms8: 414 case MVE_VSLIimmu16: 415 case MVE_VSLIimmu32: 416 case MVE_VSLIimmu8: 417 case MVE_VSRIimm16: 418 case MVE_VSRIimm32: 419 case MVE_VSRIimm8: 420 case MVE_VSTRB16: 421 case MVE_VSTRB16_post: 422 case MVE_VSTRB16_pre: 423 case MVE_VSTRB16_rq: 424 case MVE_VSTRB32: 425 case MVE_VSTRB32_post: 426 case MVE_VSTRB32_pre: 427 case MVE_VSTRB32_rq: 428 case MVE_VSTRB8_rq: 429 case MVE_VSTRBU8: 430 case MVE_VSTRBU8_post: 431 case MVE_VSTRBU8_pre: 432 case MVE_VSTRD64_qi: 433 case MVE_VSTRD64_qi_pre: 434 case MVE_VSTRD64_rq: 435 case MVE_VSTRD64_rq_u: 436 case MVE_VSTRH16_rq: 437 case MVE_VSTRH16_rq_u: 438 case MVE_VSTRH32: 439 case MVE_VSTRH32_post: 440 case MVE_VSTRH32_pre: 441 case MVE_VSTRH32_rq: 442 case MVE_VSTRH32_rq_u: 443 case MVE_VSTRHU16: 444 case MVE_VSTRHU16_post: 445 case MVE_VSTRHU16_pre: 446 case MVE_VSTRW32_qi: 447 case MVE_VSTRW32_qi_pre: 448 case MVE_VSTRW32_rq: 449 case MVE_VSTRW32_rq_u: 450 case MVE_VSTRWU32: 451 case MVE_VSTRWU32_post: 452 case MVE_VSTRWU32_pre: 453 case MVE_VSUB_qr_f16: 454 case MVE_VSUB_qr_f32: 455 case MVE_VSUB_qr_i16: 456 case MVE_VSUB_qr_i32: 457 case MVE_VSUB_qr_i8: 458 case MVE_VSUBf16: 459 case MVE_VSUBf32: 460 case MVE_VSUBi16: 461 case MVE_VSUBi32: 462 case MVE_VSUBi8: 463 return true; 464 } 465 }; 466 467 LLVMInitializeARMTargetInfo(); 468 LLVMInitializeARMTarget(); 469 LLVMInitializeARMTargetMC(); 470 471 auto TT(Triple::normalize("thumbv8.1m.main-arm-none-eabi")); 472 std::string Error; 473 const Target *T = TargetRegistry::lookupTarget(TT, Error); 474 if (!T) { 475 dbgs() << Error; 476 return; 477 } 478 479 TargetOptions Options; 480 auto TM = std::unique_ptr<LLVMTargetMachine>( 481 static_cast<LLVMTargetMachine*>( 482 T->createTargetMachine(TT, "generic", "", Options, None, None, 483 CodeGenOpt::Default))); 484 ARMSubtarget ST(TM->getTargetTriple(), TM->getTargetCPU(), 485 TM->getTargetFeatureString(), 486 *static_cast<const ARMBaseTargetMachine*>(TM.get()), false); 487 const ARMBaseInstrInfo *TII = ST.getInstrInfo(); 488 auto MII = TM->getMCInstrInfo(); 489 490 for (unsigned i = 0; i < ARM::INSTRUCTION_LIST_END; ++i) { 491 const MCInstrDesc &Desc = TII->get(i); 492 493 for (auto &Op : Desc.operands()) { 494 // Only check instructions that access the MQPR regs. 495 if ((Op.OperandType & MCOI::OPERAND_REGISTER) == 0 || 496 Op.RegClass != ARM::MQPRRegClassID) 497 continue; 498 499 uint64_t Flags = MII->get(i).TSFlags; 500 bool Valid = (Flags & ARMII::ValidForTailPredication) != 0; 501 ASSERT_EQ(IsValidTPOpcode(i), Valid) 502 << MII->getName(i) 503 << ": mismatched expectation for tail-predicated safety\n"; 504 break; 505 } 506 } 507 } 508