xref: /llvm-project/llvm/unittests/Target/ARM/MachineInstrTest.cpp (revision ce39278f2575cc0b6481924e02a0fd8632b74aa8)
1 #include "ARMBaseInstrInfo.h"
2 #include "ARMSubtarget.h"
3 #include "ARMTargetMachine.h"
4 #include "llvm/Support/TargetRegistry.h"
5 #include "llvm/Support/TargetSelect.h"
6 #include "llvm/Target/TargetMachine.h"
7 #include "llvm/Target/TargetOptions.h"
8 
9 #include "gtest/gtest.h"
10 
11 using namespace llvm;
12 
13 // Test for instructions that aren't immediately obviously valid within a
14 // tail-predicated loop. This should be marked up in their tablegen
15 // descriptions. Currently we, conservatively, disallow:
16 // - cross beat carries.
17 // - narrowing of results.
18 // - top/bottom operations.
19 // - complex operations.
20 // - horizontal operations.
21 // - byte swapping.
22 // - interleaved memory instructions.
23 // TODO: Add to this list once we can handle them safely.
24 TEST(MachineInstrValidTailPredication, IsCorrect) {
25 
26   using namespace ARM;
27 
28   auto IsValidTPOpcode = [](unsigned Opcode) {
29     switch (Opcode) {
30     default:
31       return false;
32     case MVE_ASRLi:
33     case MVE_ASRLr:
34     case MVE_LSRL:
35     case MVE_SQRSHR:
36     case MVE_SQSHL:
37     case MVE_SRSHR:
38     case MVE_UQRSHL:
39     case MVE_UQSHL:
40     case MVE_URSHR:
41     case MVE_VABDf16:
42     case MVE_VABDf32:
43     case MVE_VABDs16:
44     case MVE_VABDs32:
45     case MVE_VABDs8:
46     case MVE_VABDu16:
47     case MVE_VABDu32:
48     case MVE_VABDu8:
49     case MVE_VABSf16:
50     case MVE_VABSf32:
51     case MVE_VABSs16:
52     case MVE_VABSs32:
53     case MVE_VABSs8:
54     case MVE_VADD_qr_f16:
55     case MVE_VADD_qr_f32:
56     case MVE_VADD_qr_i16:
57     case MVE_VADD_qr_i32:
58     case MVE_VADD_qr_i8:
59     case MVE_VADDf16:
60     case MVE_VADDf32:
61     case MVE_VADDi16:
62     case MVE_VADDi32:
63     case MVE_VADDi8:
64     case MVE_VAND:
65     case MVE_VBIC:
66     case MVE_VBICIZ0v4i32:
67     case MVE_VBICIZ0v8i16:
68     case MVE_VBICIZ16v4i32:
69     case MVE_VBICIZ24v4i32:
70     case MVE_VBICIZ8v4i32:
71     case MVE_VBICIZ8v8i16:
72     case MVE_VBRSR16:
73     case MVE_VBRSR32:
74     case MVE_VBRSR8:
75     case MVE_VCLSs16:
76     case MVE_VCLSs32:
77     case MVE_VCLSs8:
78     case MVE_VCLZs16:
79     case MVE_VCLZs32:
80     case MVE_VCLZs8:
81     case MVE_VCMPf16:
82     case MVE_VCMPf16r:
83     case MVE_VCMPf32:
84     case MVE_VCMPf32r:
85     case MVE_VCMPi16:
86     case MVE_VCMPi16r:
87     case MVE_VCMPi32:
88     case MVE_VCMPi32r:
89     case MVE_VCMPi8:
90     case MVE_VCMPi8r:
91     case MVE_VCMPs16:
92     case MVE_VCMPs16r:
93     case MVE_VCMPs32:
94     case MVE_VCMPs32r:
95     case MVE_VCMPs8:
96     case MVE_VCMPs8r:
97     case MVE_VCMPu16:
98     case MVE_VCMPu16r:
99     case MVE_VCMPu32:
100     case MVE_VCMPu32r:
101     case MVE_VCMPu8:
102     case MVE_VCMPu8r:
103     case MVE_VCTP16:
104     case MVE_VCTP32:
105     case MVE_VCTP64:
106     case MVE_VCTP8:
107     case MVE_VCVTf16s16_fix:
108     case MVE_VCVTf16s16n:
109     case MVE_VCVTf16u16_fix:
110     case MVE_VCVTf16u16n:
111     case MVE_VCVTf32s32_fix:
112     case MVE_VCVTf32s32n:
113     case MVE_VCVTf32u32_fix:
114     case MVE_VCVTf32u32n:
115     case MVE_VCVTs16f16_fix:
116     case MVE_VCVTs16f16a:
117     case MVE_VCVTs16f16m:
118     case MVE_VCVTs16f16n:
119     case MVE_VCVTs16f16p:
120     case MVE_VCVTs16f16z:
121     case MVE_VCVTs32f32_fix:
122     case MVE_VCVTs32f32a:
123     case MVE_VCVTs32f32m:
124     case MVE_VCVTs32f32n:
125     case MVE_VCVTs32f32p:
126     case MVE_VCVTs32f32z:
127     case MVE_VCVTu16f16_fix:
128     case MVE_VCVTu16f16a:
129     case MVE_VCVTu16f16m:
130     case MVE_VCVTu16f16n:
131     case MVE_VCVTu16f16p:
132     case MVE_VCVTu16f16z:
133     case MVE_VCVTu32f32_fix:
134     case MVE_VCVTu32f32a:
135     case MVE_VCVTu32f32m:
136     case MVE_VCVTu32f32n:
137     case MVE_VCVTu32f32p:
138     case MVE_VCVTu32f32z:
139     case MVE_VDDUPu16:
140     case MVE_VDDUPu32:
141     case MVE_VDDUPu8:
142     case MVE_VDUP16:
143     case MVE_VDUP32:
144     case MVE_VDUP8:
145     case MVE_VDWDUPu16:
146     case MVE_VDWDUPu32:
147     case MVE_VDWDUPu8:
148     case MVE_VEOR:
149     case MVE_VFMA_qr_Sf16:
150     case MVE_VFMA_qr_Sf32:
151     case MVE_VFMA_qr_f16:
152     case MVE_VFMA_qr_f32:
153     case MVE_VMLAS_qr_s16:
154     case MVE_VMLAS_qr_s32:
155     case MVE_VMLAS_qr_s8:
156     case MVE_VMLAS_qr_u16:
157     case MVE_VMLAS_qr_u32:
158     case MVE_VMLAS_qr_u8:
159     case MVE_VMLA_qr_s16:
160     case MVE_VMLA_qr_s32:
161     case MVE_VMLA_qr_s8:
162     case MVE_VMLA_qr_u16:
163     case MVE_VMLA_qr_u32:
164     case MVE_VMLA_qr_u8:
165     case MVE_VHADD_qr_s16:
166     case MVE_VHADD_qr_s32:
167     case MVE_VHADD_qr_s8:
168     case MVE_VHADD_qr_u16:
169     case MVE_VHADD_qr_u32:
170     case MVE_VHADD_qr_u8:
171     case MVE_VHADDs16:
172     case MVE_VHADDs32:
173     case MVE_VHADDs8:
174     case MVE_VHADDu16:
175     case MVE_VHADDu32:
176     case MVE_VHADDu8:
177     case MVE_VHSUB_qr_s16:
178     case MVE_VHSUB_qr_s32:
179     case MVE_VHSUB_qr_s8:
180     case MVE_VHSUB_qr_u16:
181     case MVE_VHSUB_qr_u32:
182     case MVE_VHSUB_qr_u8:
183     case MVE_VHSUBs16:
184     case MVE_VHSUBs32:
185     case MVE_VHSUBs8:
186     case MVE_VHSUBu16:
187     case MVE_VHSUBu32:
188     case MVE_VHSUBu8:
189     case MVE_VIDUPu16:
190     case MVE_VIDUPu32:
191     case MVE_VIDUPu8:
192     case MVE_VIWDUPu16:
193     case MVE_VIWDUPu32:
194     case MVE_VIWDUPu8:
195     case MVE_VLDRBS16:
196     case MVE_VLDRBS16_post:
197     case MVE_VLDRBS16_pre:
198     case MVE_VLDRBS16_rq:
199     case MVE_VLDRBS32:
200     case MVE_VLDRBS32_post:
201     case MVE_VLDRBS32_pre:
202     case MVE_VLDRBS32_rq:
203     case MVE_VLDRBU16:
204     case MVE_VLDRBU16_post:
205     case MVE_VLDRBU16_pre:
206     case MVE_VLDRBU16_rq:
207     case MVE_VLDRBU32:
208     case MVE_VLDRBU32_post:
209     case MVE_VLDRBU32_pre:
210     case MVE_VLDRBU32_rq:
211     case MVE_VLDRBU8:
212     case MVE_VLDRBU8_post:
213     case MVE_VLDRBU8_pre:
214     case MVE_VLDRBU8_rq:
215     case MVE_VLDRDU64_qi:
216     case MVE_VLDRDU64_qi_pre:
217     case MVE_VLDRDU64_rq:
218     case MVE_VLDRDU64_rq_u:
219     case MVE_VLDRHS32:
220     case MVE_VLDRHS32_post:
221     case MVE_VLDRHS32_pre:
222     case MVE_VLDRHS32_rq:
223     case MVE_VLDRHS32_rq_u:
224     case MVE_VLDRHU16:
225     case MVE_VLDRHU16_post:
226     case MVE_VLDRHU16_pre:
227     case MVE_VLDRHU16_rq:
228     case MVE_VLDRHU16_rq_u:
229     case MVE_VLDRHU32:
230     case MVE_VLDRHU32_post:
231     case MVE_VLDRHU32_pre:
232     case MVE_VLDRHU32_rq:
233     case MVE_VLDRHU32_rq_u:
234     case MVE_VLDRWU32:
235     case MVE_VLDRWU32_post:
236     case MVE_VLDRWU32_pre:
237     case MVE_VLDRWU32_qi:
238     case MVE_VLDRWU32_qi_pre:
239     case MVE_VLDRWU32_rq:
240     case MVE_VLDRWU32_rq_u:
241     case MVE_VMOVimmf32:
242     case MVE_VMOVimmi16:
243     case MVE_VMOVimmi32:
244     case MVE_VMOVimmi64:
245     case MVE_VMOVimmi8:
246     case MVE_VMUL_qr_f16:
247     case MVE_VMUL_qr_f32:
248     case MVE_VMUL_qr_i16:
249     case MVE_VMUL_qr_i32:
250     case MVE_VMUL_qr_i8:
251     case MVE_VMULf16:
252     case MVE_VMULf32:
253     case MVE_VMVN:
254     case MVE_VMVNimmi16:
255     case MVE_VMVNimmi32:
256     case MVE_VNEGf16:
257     case MVE_VNEGf32:
258     case MVE_VNEGs16:
259     case MVE_VNEGs32:
260     case MVE_VNEGs8:
261     case MVE_VORN:
262     case MVE_VORR:
263     case MVE_VORRIZ0v4i32:
264     case MVE_VORRIZ0v8i16:
265     case MVE_VORRIZ16v4i32:
266     case MVE_VORRIZ24v4i32:
267     case MVE_VORRIZ8v4i32:
268     case MVE_VORRIZ8v8i16:
269     case MVE_VPNOT:
270     case MVE_VPSEL:
271     case MVE_VPST:
272     case MVE_VPTv16i8:
273     case MVE_VPTv16i8r:
274     case MVE_VPTv16s8:
275     case MVE_VPTv16s8r:
276     case MVE_VPTv16u8:
277     case MVE_VPTv16u8r:
278     case MVE_VPTv4f32:
279     case MVE_VPTv4f32r:
280     case MVE_VPTv4i32:
281     case MVE_VPTv4i32r:
282     case MVE_VPTv4s32:
283     case MVE_VPTv4s32r:
284     case MVE_VPTv4u32:
285     case MVE_VPTv4u32r:
286     case MVE_VPTv8f16:
287     case MVE_VPTv8f16r:
288     case MVE_VPTv8i16:
289     case MVE_VPTv8i16r:
290     case MVE_VPTv8s16:
291     case MVE_VPTv8s16r:
292     case MVE_VPTv8u16:
293     case MVE_VPTv8u16r:
294     case MVE_VQABSs16:
295     case MVE_VQABSs32:
296     case MVE_VQABSs8:
297     case MVE_VQADD_qr_s16:
298     case MVE_VQADD_qr_s32:
299     case MVE_VQADD_qr_s8:
300     case MVE_VQADD_qr_u16:
301     case MVE_VQADD_qr_u32:
302     case MVE_VQADD_qr_u8:
303     case MVE_VQADDs16:
304     case MVE_VQADDs32:
305     case MVE_VQADDs8:
306     case MVE_VQADDu16:
307     case MVE_VQADDu32:
308     case MVE_VQADDu8:
309     case MVE_VQNEGs16:
310     case MVE_VQNEGs32:
311     case MVE_VQNEGs8:
312     case MVE_VQRSHL_by_vecs16:
313     case MVE_VQRSHL_by_vecs32:
314     case MVE_VQRSHL_by_vecs8:
315     case MVE_VQRSHL_by_vecu16:
316     case MVE_VQRSHL_by_vecu32:
317     case MVE_VQRSHL_by_vecu8:
318     case MVE_VQRSHL_qrs16:
319     case MVE_VQRSHL_qrs32:
320     case MVE_VQRSHL_qrs8:
321     case MVE_VQRSHL_qru16:
322     case MVE_VQRSHL_qru8:
323     case MVE_VQRSHL_qru32:
324     case MVE_VQSHLU_imms16:
325     case MVE_VQSHLU_imms32:
326     case MVE_VQSHLU_imms8:
327     case MVE_VQSHL_by_vecs16:
328     case MVE_VQSHL_by_vecs32:
329     case MVE_VQSHL_by_vecs8:
330     case MVE_VQSHL_by_vecu16:
331     case MVE_VQSHL_by_vecu32:
332     case MVE_VQSHL_by_vecu8:
333     case MVE_VQSHL_qrs16:
334     case MVE_VQSHL_qrs32:
335     case MVE_VQSHL_qrs8:
336     case MVE_VQSHL_qru16:
337     case MVE_VQSHL_qru32:
338     case MVE_VQSHL_qru8:
339     case MVE_VQSUB_qr_s16:
340     case MVE_VQSUB_qr_s32:
341     case MVE_VQSUB_qr_s8:
342     case MVE_VQSUB_qr_u16:
343     case MVE_VQSUB_qr_u32:
344     case MVE_VQSUB_qr_u8:
345     case MVE_VQSUBs16:
346     case MVE_VQSUBs32:
347     case MVE_VQSUBs8:
348     case MVE_VQSUBu16:
349     case MVE_VQSUBu32:
350     case MVE_VQSUBu8:
351     case MVE_VRHADDs16:
352     case MVE_VRHADDs32:
353     case MVE_VRHADDs8:
354     case MVE_VRHADDu16:
355     case MVE_VRHADDu32:
356     case MVE_VRHADDu8:
357     case MVE_VRINTf16A:
358     case MVE_VRINTf16M:
359     case MVE_VRINTf16N:
360     case MVE_VRINTf16P:
361     case MVE_VRINTf16X:
362     case MVE_VRINTf16Z:
363     case MVE_VRINTf32A:
364     case MVE_VRINTf32M:
365     case MVE_VRINTf32N:
366     case MVE_VRINTf32P:
367     case MVE_VRINTf32X:
368     case MVE_VRINTf32Z:
369     case MVE_VRSHL_by_vecs16:
370     case MVE_VRSHL_by_vecs32:
371     case MVE_VRSHL_by_vecs8:
372     case MVE_VRSHL_by_vecu16:
373     case MVE_VRSHL_by_vecu32:
374     case MVE_VRSHL_by_vecu8:
375     case MVE_VRSHL_qrs16:
376     case MVE_VRSHL_qrs32:
377     case MVE_VRSHL_qrs8:
378     case MVE_VRSHL_qru16:
379     case MVE_VRSHL_qru32:
380     case MVE_VRSHL_qru8:
381     case MVE_VRSHR_imms16:
382     case MVE_VRSHR_imms32:
383     case MVE_VRSHR_imms8:
384     case MVE_VRSHR_immu16:
385     case MVE_VRSHR_immu32:
386     case MVE_VRSHR_immu8:
387     case MVE_VSHL_by_vecs16:
388     case MVE_VSHL_by_vecs32:
389     case MVE_VSHL_by_vecs8:
390     case MVE_VSHL_by_vecu16:
391     case MVE_VSHL_by_vecu32:
392     case MVE_VSHL_by_vecu8:
393     case MVE_VSHL_immi16:
394     case MVE_VSHL_immi32:
395     case MVE_VSHL_immi8:
396     case MVE_VSHL_qrs16:
397     case MVE_VSHL_qrs32:
398     case MVE_VSHL_qrs8:
399     case MVE_VSHL_qru16:
400     case MVE_VSHL_qru32:
401     case MVE_VSHL_qru8:
402     case MVE_VSHR_imms16:
403     case MVE_VSHR_imms32:
404     case MVE_VSHR_imms8:
405     case MVE_VSHR_immu16:
406     case MVE_VSHR_immu32:
407     case MVE_VSHR_immu8:
408     case MVE_VSLIimm16:
409     case MVE_VSLIimm32:
410     case MVE_VSLIimm8:
411     case MVE_VSLIimms16:
412     case MVE_VSLIimms32:
413     case MVE_VSLIimms8:
414     case MVE_VSLIimmu16:
415     case MVE_VSLIimmu32:
416     case MVE_VSLIimmu8:
417     case MVE_VSRIimm16:
418     case MVE_VSRIimm32:
419     case MVE_VSRIimm8:
420     case MVE_VSTRB16:
421     case MVE_VSTRB16_post:
422     case MVE_VSTRB16_pre:
423     case MVE_VSTRB16_rq:
424     case MVE_VSTRB32:
425     case MVE_VSTRB32_post:
426     case MVE_VSTRB32_pre:
427     case MVE_VSTRB32_rq:
428     case MVE_VSTRB8_rq:
429     case MVE_VSTRBU8:
430     case MVE_VSTRBU8_post:
431     case MVE_VSTRBU8_pre:
432     case MVE_VSTRD64_qi:
433     case MVE_VSTRD64_qi_pre:
434     case MVE_VSTRD64_rq:
435     case MVE_VSTRD64_rq_u:
436     case MVE_VSTRH16_rq:
437     case MVE_VSTRH16_rq_u:
438     case MVE_VSTRH32:
439     case MVE_VSTRH32_post:
440     case MVE_VSTRH32_pre:
441     case MVE_VSTRH32_rq:
442     case MVE_VSTRH32_rq_u:
443     case MVE_VSTRHU16:
444     case MVE_VSTRHU16_post:
445     case MVE_VSTRHU16_pre:
446     case MVE_VSTRW32_qi:
447     case MVE_VSTRW32_qi_pre:
448     case MVE_VSTRW32_rq:
449     case MVE_VSTRW32_rq_u:
450     case MVE_VSTRWU32:
451     case MVE_VSTRWU32_post:
452     case MVE_VSTRWU32_pre:
453     case MVE_VSUB_qr_f16:
454     case MVE_VSUB_qr_f32:
455     case MVE_VSUB_qr_i16:
456     case MVE_VSUB_qr_i32:
457     case MVE_VSUB_qr_i8:
458     case MVE_VSUBf16:
459     case MVE_VSUBf32:
460     case MVE_VSUBi16:
461     case MVE_VSUBi32:
462     case MVE_VSUBi8:
463       return true;
464     }
465   };
466 
467   LLVMInitializeARMTargetInfo();
468   LLVMInitializeARMTarget();
469   LLVMInitializeARMTargetMC();
470 
471   auto TT(Triple::normalize("thumbv8.1m.main-arm-none-eabi"));
472   std::string Error;
473   const Target *T = TargetRegistry::lookupTarget(TT, Error);
474   if (!T) {
475     dbgs() << Error;
476     return;
477   }
478 
479   TargetOptions Options;
480   auto TM = std::unique_ptr<LLVMTargetMachine>(
481     static_cast<LLVMTargetMachine*>(
482       T->createTargetMachine(TT, "generic", "", Options, None, None,
483                              CodeGenOpt::Default)));
484   ARMSubtarget ST(TM->getTargetTriple(), TM->getTargetCPU(),
485                   TM->getTargetFeatureString(),
486                   *static_cast<const ARMBaseTargetMachine*>(TM.get()), false);
487   const ARMBaseInstrInfo *TII = ST.getInstrInfo();
488   auto MII = TM->getMCInstrInfo();
489 
490   for (unsigned i = 0; i < ARM::INSTRUCTION_LIST_END; ++i) {
491     const MCInstrDesc &Desc = TII->get(i);
492 
493     for (auto &Op : Desc.operands()) {
494       // Only check instructions that access the MQPR regs.
495       if ((Op.OperandType & MCOI::OPERAND_REGISTER) == 0 ||
496           Op.RegClass != ARM::MQPRRegClassID)
497         continue;
498 
499       uint64_t Flags = MII->get(i).TSFlags;
500       bool Valid = (Flags & ARMII::ValidForTailPredication) != 0;
501       ASSERT_EQ(IsValidTPOpcode(i), Valid)
502                 << MII->getName(i)
503                 << ": mismatched expectation for tail-predicated safety\n";
504       break;
505     }
506   }
507 }
508