1 //===-- GCNHazardRecognizers.h - GCN Hazard Recognizers ---------*- C++ -*-===// 2 // 3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4 // See https://llvm.org/LICENSE.txt for license information. 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6 // 7 //===----------------------------------------------------------------------===// 8 // 9 // This file defines hazard recognizers for scheduling on GCN processors. 10 // 11 //===----------------------------------------------------------------------===// 12 13 #ifndef LLVM_LIB_TARGET_AMDGPUHAZARDRECOGNIZERS_H 14 #define LLVM_LIB_TARGET_AMDGPUHAZARDRECOGNIZERS_H 15 16 #include "llvm/ADT/BitVector.h" 17 #include "llvm/ADT/STLExtras.h" 18 #include "llvm/CodeGen/ScheduleHazardRecognizer.h" 19 #include "llvm/CodeGen/TargetSchedule.h" 20 #include <list> 21 22 namespace llvm { 23 24 class MachineFunction; 25 class MachineInstr; 26 class MachineOperand; 27 class MachineRegisterInfo; 28 class SIInstrInfo; 29 class SIRegisterInfo; 30 class GCNSubtarget; 31 32 class GCNHazardRecognizer final : public ScheduleHazardRecognizer { 33 public: 34 typedef function_ref<bool(const MachineInstr &)> IsHazardFn; 35 36 private: 37 // Distinguish if we are called from scheduler or hazard recognizer 38 bool IsHazardRecognizerMode; 39 40 // This variable stores the instruction that has been emitted this cycle. It 41 // will be added to EmittedInstrs, when AdvanceCycle() or RecedeCycle() is 42 // called. 43 MachineInstr *CurrCycleInstr; 44 std::list<MachineInstr*> EmittedInstrs; 45 const MachineFunction &MF; 46 const GCNSubtarget &ST; 47 const SIInstrInfo &TII; 48 const SIRegisterInfo &TRI; 49 TargetSchedModel TSchedModel; 50 bool RunLdsBranchVmemWARHazardFixup; 51 52 /// RegUnits of uses in the current soft memory clause. 53 BitVector ClauseUses; 54 55 /// RegUnits of defs in the current soft memory clause. 56 BitVector ClauseDefs; 57 58 void resetClause() { 59 ClauseUses.reset(); 60 ClauseDefs.reset(); 61 } 62 63 void addClauseInst(const MachineInstr &MI); 64 65 /// \returns the number of wait states before another MFMA instruction can be 66 /// issued after \p MI. 67 unsigned getMFMAPipelineWaitStates(const MachineInstr &MI) const; 68 69 // Advance over a MachineInstr bundle. Look for hazards in the bundled 70 // instructions. 71 void processBundle(); 72 73 int getWaitStatesSince(IsHazardFn IsHazard, int Limit); 74 int getWaitStatesSinceDef(unsigned Reg, IsHazardFn IsHazardDef, int Limit); 75 int getWaitStatesSinceSetReg(IsHazardFn IsHazard, int Limit); 76 77 int checkSoftClauseHazards(MachineInstr *SMEM); 78 int checkSMRDHazards(MachineInstr *SMRD); 79 int checkVMEMHazards(MachineInstr* VMEM); 80 int checkDPPHazards(MachineInstr *DPP); 81 int checkDivFMasHazards(MachineInstr *DivFMas); 82 int checkGetRegHazards(MachineInstr *GetRegInstr); 83 int checkSetRegHazards(MachineInstr *SetRegInstr); 84 int createsVALUHazard(const MachineInstr &MI); 85 int checkVALUHazards(MachineInstr *VALU); 86 int checkVALUHazardsHelper(const MachineOperand &Def, const MachineRegisterInfo &MRI); 87 int checkRWLaneHazards(MachineInstr *RWLane); 88 int checkRFEHazards(MachineInstr *RFE); 89 int checkInlineAsmHazards(MachineInstr *IA); 90 int checkReadM0Hazards(MachineInstr *SMovRel); 91 int checkNSAtoVMEMHazard(MachineInstr *MI); 92 int checkFPAtomicToDenormModeHazard(MachineInstr *MI); 93 void fixHazards(MachineInstr *MI); 94 bool fixVcmpxPermlaneHazards(MachineInstr *MI); 95 bool fixVMEMtoScalarWriteHazards(MachineInstr *MI); 96 bool fixSMEMtoVectorWriteHazards(MachineInstr *MI); 97 bool fixVcmpxExecWARHazard(MachineInstr *MI); 98 bool fixLdsBranchVmemWARHazard(MachineInstr *MI); 99 bool fixVALUPartialForwardingHazard(MachineInstr *MI); 100 bool fixVALUTransUseHazard(MachineInstr *MI); 101 102 int checkMAIHazards(MachineInstr *MI); 103 int checkMAIHazards908(MachineInstr *MI); 104 int checkMAIHazards90A(MachineInstr *MI); 105 /// Pad the latency between neighboring MFMA instructions with s_nops. The 106 /// percentage of wait states to fill with s_nops is specified by the command 107 /// line option '-amdgpu-mfma-padding-ratio'. 108 /// 109 /// For example, with '-amdgpu-mfma-padding-ratio=100': 110 /// 111 /// 2 pass MFMA instructions have a latency of 2 wait states. Therefore, a 112 /// 'S_NOP 1' will be added between sequential MFMA instructions. 113 /// 114 /// V_MFMA_F32_4X4X1F32 115 /// V_MFMA_F32_4X4X1F32 116 ///--> 117 /// V_MFMA_F32_4X4X1F32 118 /// S_NOP 1 119 /// V_MFMA_F32_4X4X1F32 120 int checkMFMAPadding(MachineInstr *MI); 121 int checkMAIVALUHazards(MachineInstr *MI); 122 int checkMAILdStHazards(MachineInstr *MI); 123 124 public: 125 GCNHazardRecognizer(const MachineFunction &MF); 126 // We can only issue one instruction per cycle. 127 bool atIssueLimit() const override { return true; } 128 void EmitInstruction(SUnit *SU) override; 129 void EmitInstruction(MachineInstr *MI) override; 130 HazardType getHazardType(SUnit *SU, int Stalls) override; 131 void EmitNoop() override; 132 unsigned PreEmitNoops(MachineInstr *) override; 133 unsigned PreEmitNoopsCommon(MachineInstr *); 134 void AdvanceCycle() override; 135 void RecedeCycle() override; 136 bool ShouldPreferAnother(SUnit *SU) override; 137 void Reset() override; 138 }; 139 140 } // end namespace llvm 141 142 #endif //LLVM_LIB_TARGET_AMDGPUHAZARDRECOGNIZERS_H 143