xref: /freebsd-src/contrib/llvm-project/llvm/lib/Target/AMDGPU/AMDGPUPreLegalizerCombiner.cpp (revision 5ffd83dbcc34f10e07f6d3e968ae6365869615f4)
1*5ffd83dbSDimitry Andric //=== lib/CodeGen/GlobalISel/AMDGPUPreLegalizerCombiner.cpp ---------------===//
2*5ffd83dbSDimitry Andric //
3*5ffd83dbSDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4*5ffd83dbSDimitry Andric // See https://llvm.org/LICENSE.txt for license information.
5*5ffd83dbSDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6*5ffd83dbSDimitry Andric //
7*5ffd83dbSDimitry Andric //===----------------------------------------------------------------------===//
8*5ffd83dbSDimitry Andric //
9*5ffd83dbSDimitry Andric // This pass does combining of machine instructions at the generic MI level,
10*5ffd83dbSDimitry Andric // before the legalizer.
11*5ffd83dbSDimitry Andric //
12*5ffd83dbSDimitry Andric //===----------------------------------------------------------------------===//
13*5ffd83dbSDimitry Andric 
14*5ffd83dbSDimitry Andric #include "AMDGPUTargetMachine.h"
15*5ffd83dbSDimitry Andric #include "llvm/CodeGen/GlobalISel/Combiner.h"
16*5ffd83dbSDimitry Andric #include "llvm/CodeGen/GlobalISel/CombinerHelper.h"
17*5ffd83dbSDimitry Andric #include "llvm/CodeGen/GlobalISel/CombinerInfo.h"
18*5ffd83dbSDimitry Andric #include "llvm/CodeGen/GlobalISel/GISelKnownBits.h"
19*5ffd83dbSDimitry Andric #include "llvm/CodeGen/GlobalISel/MIPatternMatch.h"
20*5ffd83dbSDimitry Andric #include "llvm/CodeGen/MachineDominators.h"
21*5ffd83dbSDimitry Andric #include "llvm/CodeGen/MachineFunctionPass.h"
22*5ffd83dbSDimitry Andric #include "llvm/CodeGen/TargetPassConfig.h"
23*5ffd83dbSDimitry Andric #include "llvm/Support/Debug.h"
24*5ffd83dbSDimitry Andric #include "MCTargetDesc/AMDGPUMCTargetDesc.h"
25*5ffd83dbSDimitry Andric 
26*5ffd83dbSDimitry Andric #define DEBUG_TYPE "amdgpu-prelegalizer-combiner"
27*5ffd83dbSDimitry Andric 
28*5ffd83dbSDimitry Andric using namespace llvm;
29*5ffd83dbSDimitry Andric using namespace MIPatternMatch;
30*5ffd83dbSDimitry Andric 
31*5ffd83dbSDimitry Andric #define AMDGPUPRELEGALIZERCOMBINERHELPER_GENCOMBINERHELPER_DEPS
32*5ffd83dbSDimitry Andric #include "AMDGPUGenPreLegalizeGICombiner.inc"
33*5ffd83dbSDimitry Andric #undef AMDGPUPRELEGALIZERCOMBINERHELPER_GENCOMBINERHELPER_DEPS
34*5ffd83dbSDimitry Andric 
35*5ffd83dbSDimitry Andric namespace {
36*5ffd83dbSDimitry Andric #define AMDGPUPRELEGALIZERCOMBINERHELPER_GENCOMBINERHELPER_H
37*5ffd83dbSDimitry Andric #include "AMDGPUGenPreLegalizeGICombiner.inc"
38*5ffd83dbSDimitry Andric #undef AMDGPUPRELEGALIZERCOMBINERHELPER_GENCOMBINERHELPER_H
39*5ffd83dbSDimitry Andric 
40*5ffd83dbSDimitry Andric class AMDGPUPreLegalizerCombinerInfo : public CombinerInfo {
41*5ffd83dbSDimitry Andric   GISelKnownBits *KB;
42*5ffd83dbSDimitry Andric   MachineDominatorTree *MDT;
43*5ffd83dbSDimitry Andric 
44*5ffd83dbSDimitry Andric public:
45*5ffd83dbSDimitry Andric   AMDGPUGenPreLegalizerCombinerHelperRuleConfig GeneratedRuleCfg;
46*5ffd83dbSDimitry Andric 
47*5ffd83dbSDimitry Andric   AMDGPUPreLegalizerCombinerInfo(bool EnableOpt, bool OptSize, bool MinSize,
48*5ffd83dbSDimitry Andric                                   GISelKnownBits *KB, MachineDominatorTree *MDT)
49*5ffd83dbSDimitry Andric       : CombinerInfo(/*AllowIllegalOps*/ true, /*ShouldLegalizeIllegal*/ false,
50*5ffd83dbSDimitry Andric                      /*LegalizerInfo*/ nullptr, EnableOpt, OptSize, MinSize),
51*5ffd83dbSDimitry Andric         KB(KB), MDT(MDT) {
52*5ffd83dbSDimitry Andric     if (!GeneratedRuleCfg.parseCommandLineOption())
53*5ffd83dbSDimitry Andric       report_fatal_error("Invalid rule identifier");
54*5ffd83dbSDimitry Andric   }
55*5ffd83dbSDimitry Andric 
56*5ffd83dbSDimitry Andric   virtual bool combine(GISelChangeObserver &Observer, MachineInstr &MI,
57*5ffd83dbSDimitry Andric                        MachineIRBuilder &B) const override;
58*5ffd83dbSDimitry Andric };
59*5ffd83dbSDimitry Andric 
60*5ffd83dbSDimitry Andric bool AMDGPUPreLegalizerCombinerInfo::combine(GISelChangeObserver &Observer,
61*5ffd83dbSDimitry Andric                                               MachineInstr &MI,
62*5ffd83dbSDimitry Andric                                               MachineIRBuilder &B) const {
63*5ffd83dbSDimitry Andric   CombinerHelper Helper(Observer, B, KB, MDT);
64*5ffd83dbSDimitry Andric   AMDGPUGenPreLegalizerCombinerHelper Generated(GeneratedRuleCfg);
65*5ffd83dbSDimitry Andric 
66*5ffd83dbSDimitry Andric   if (Generated.tryCombineAll(Observer, MI, B, Helper))
67*5ffd83dbSDimitry Andric     return true;
68*5ffd83dbSDimitry Andric 
69*5ffd83dbSDimitry Andric   switch (MI.getOpcode()) {
70*5ffd83dbSDimitry Andric   case TargetOpcode::G_CONCAT_VECTORS:
71*5ffd83dbSDimitry Andric     return Helper.tryCombineConcatVectors(MI);
72*5ffd83dbSDimitry Andric   case TargetOpcode::G_SHUFFLE_VECTOR:
73*5ffd83dbSDimitry Andric     return Helper.tryCombineShuffleVector(MI);
74*5ffd83dbSDimitry Andric   }
75*5ffd83dbSDimitry Andric 
76*5ffd83dbSDimitry Andric   return false;
77*5ffd83dbSDimitry Andric }
78*5ffd83dbSDimitry Andric 
79*5ffd83dbSDimitry Andric #define AMDGPUPRELEGALIZERCOMBINERHELPER_GENCOMBINERHELPER_CPP
80*5ffd83dbSDimitry Andric #include "AMDGPUGenPreLegalizeGICombiner.inc"
81*5ffd83dbSDimitry Andric #undef AMDGPUPRELEGALIZERCOMBINERHELPER_GENCOMBINERHELPER_CPP
82*5ffd83dbSDimitry Andric 
83*5ffd83dbSDimitry Andric // Pass boilerplate
84*5ffd83dbSDimitry Andric // ================
85*5ffd83dbSDimitry Andric 
86*5ffd83dbSDimitry Andric class AMDGPUPreLegalizerCombiner : public MachineFunctionPass {
87*5ffd83dbSDimitry Andric public:
88*5ffd83dbSDimitry Andric   static char ID;
89*5ffd83dbSDimitry Andric 
90*5ffd83dbSDimitry Andric   AMDGPUPreLegalizerCombiner(bool IsOptNone = false);
91*5ffd83dbSDimitry Andric 
92*5ffd83dbSDimitry Andric   StringRef getPassName() const override {
93*5ffd83dbSDimitry Andric     return "AMDGPUPreLegalizerCombiner";
94*5ffd83dbSDimitry Andric   }
95*5ffd83dbSDimitry Andric 
96*5ffd83dbSDimitry Andric   bool runOnMachineFunction(MachineFunction &MF) override;
97*5ffd83dbSDimitry Andric 
98*5ffd83dbSDimitry Andric   void getAnalysisUsage(AnalysisUsage &AU) const override;
99*5ffd83dbSDimitry Andric private:
100*5ffd83dbSDimitry Andric   bool IsOptNone;
101*5ffd83dbSDimitry Andric };
102*5ffd83dbSDimitry Andric } // end anonymous namespace
103*5ffd83dbSDimitry Andric 
104*5ffd83dbSDimitry Andric void AMDGPUPreLegalizerCombiner::getAnalysisUsage(AnalysisUsage &AU) const {
105*5ffd83dbSDimitry Andric   AU.addRequired<TargetPassConfig>();
106*5ffd83dbSDimitry Andric   AU.setPreservesCFG();
107*5ffd83dbSDimitry Andric   getSelectionDAGFallbackAnalysisUsage(AU);
108*5ffd83dbSDimitry Andric   AU.addRequired<GISelKnownBitsAnalysis>();
109*5ffd83dbSDimitry Andric   AU.addPreserved<GISelKnownBitsAnalysis>();
110*5ffd83dbSDimitry Andric   if (!IsOptNone) {
111*5ffd83dbSDimitry Andric     AU.addRequired<MachineDominatorTree>();
112*5ffd83dbSDimitry Andric     AU.addPreserved<MachineDominatorTree>();
113*5ffd83dbSDimitry Andric   }
114*5ffd83dbSDimitry Andric   MachineFunctionPass::getAnalysisUsage(AU);
115*5ffd83dbSDimitry Andric }
116*5ffd83dbSDimitry Andric 
117*5ffd83dbSDimitry Andric AMDGPUPreLegalizerCombiner::AMDGPUPreLegalizerCombiner(bool IsOptNone)
118*5ffd83dbSDimitry Andric   : MachineFunctionPass(ID), IsOptNone(IsOptNone) {
119*5ffd83dbSDimitry Andric   initializeAMDGPUPreLegalizerCombinerPass(*PassRegistry::getPassRegistry());
120*5ffd83dbSDimitry Andric }
121*5ffd83dbSDimitry Andric 
122*5ffd83dbSDimitry Andric bool AMDGPUPreLegalizerCombiner::runOnMachineFunction(MachineFunction &MF) {
123*5ffd83dbSDimitry Andric   if (MF.getProperties().hasProperty(
124*5ffd83dbSDimitry Andric           MachineFunctionProperties::Property::FailedISel))
125*5ffd83dbSDimitry Andric     return false;
126*5ffd83dbSDimitry Andric   auto *TPC = &getAnalysis<TargetPassConfig>();
127*5ffd83dbSDimitry Andric   const Function &F = MF.getFunction();
128*5ffd83dbSDimitry Andric   bool EnableOpt =
129*5ffd83dbSDimitry Andric       MF.getTarget().getOptLevel() != CodeGenOpt::None && !skipFunction(F);
130*5ffd83dbSDimitry Andric   GISelKnownBits *KB = &getAnalysis<GISelKnownBitsAnalysis>().get(MF);
131*5ffd83dbSDimitry Andric   MachineDominatorTree *MDT =
132*5ffd83dbSDimitry Andric       IsOptNone ? nullptr : &getAnalysis<MachineDominatorTree>();
133*5ffd83dbSDimitry Andric   AMDGPUPreLegalizerCombinerInfo PCInfo(EnableOpt, F.hasOptSize(),
134*5ffd83dbSDimitry Andric                                         F.hasMinSize(), KB, MDT);
135*5ffd83dbSDimitry Andric   Combiner C(PCInfo, TPC);
136*5ffd83dbSDimitry Andric   return C.combineMachineInstrs(MF, /*CSEInfo*/ nullptr);
137*5ffd83dbSDimitry Andric }
138*5ffd83dbSDimitry Andric 
139*5ffd83dbSDimitry Andric char AMDGPUPreLegalizerCombiner::ID = 0;
140*5ffd83dbSDimitry Andric INITIALIZE_PASS_BEGIN(AMDGPUPreLegalizerCombiner, DEBUG_TYPE,
141*5ffd83dbSDimitry Andric                       "Combine AMDGPU machine instrs before legalization",
142*5ffd83dbSDimitry Andric                       false, false)
143*5ffd83dbSDimitry Andric INITIALIZE_PASS_DEPENDENCY(TargetPassConfig)
144*5ffd83dbSDimitry Andric INITIALIZE_PASS_DEPENDENCY(GISelKnownBitsAnalysis)
145*5ffd83dbSDimitry Andric INITIALIZE_PASS_END(AMDGPUPreLegalizerCombiner, DEBUG_TYPE,
146*5ffd83dbSDimitry Andric                     "Combine AMDGPU machine instrs before legalization", false,
147*5ffd83dbSDimitry Andric                     false)
148*5ffd83dbSDimitry Andric 
149*5ffd83dbSDimitry Andric namespace llvm {
150*5ffd83dbSDimitry Andric FunctionPass *createAMDGPUPreLegalizeCombiner(bool IsOptNone) {
151*5ffd83dbSDimitry Andric   return new AMDGPUPreLegalizerCombiner(IsOptNone);
152*5ffd83dbSDimitry Andric }
153*5ffd83dbSDimitry Andric } // end namespace llvm
154