17330f729Sjoerg //===------- HexagonCopyToCombine.cpp - Hexagon Copy-To-Combine Pass ------===//
27330f729Sjoerg //
37330f729Sjoerg // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
47330f729Sjoerg // See https://llvm.org/LICENSE.txt for license information.
57330f729Sjoerg // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
67330f729Sjoerg //
77330f729Sjoerg //===----------------------------------------------------------------------===//
87330f729Sjoerg // This pass replaces transfer instructions by combine instructions.
97330f729Sjoerg // We walk along a basic block and look for two combinable instructions and try
107330f729Sjoerg // to move them together. If we can move them next to each other we do so and
117330f729Sjoerg // replace them with a combine instruction.
127330f729Sjoerg //===----------------------------------------------------------------------===//
13*82d56013Sjoerg
147330f729Sjoerg #include "HexagonInstrInfo.h"
157330f729Sjoerg #include "HexagonSubtarget.h"
167330f729Sjoerg #include "llvm/ADT/DenseMap.h"
177330f729Sjoerg #include "llvm/ADT/DenseSet.h"
187330f729Sjoerg #include "llvm/CodeGen/MachineBasicBlock.h"
197330f729Sjoerg #include "llvm/CodeGen/MachineFunction.h"
207330f729Sjoerg #include "llvm/CodeGen/MachineFunctionPass.h"
217330f729Sjoerg #include "llvm/CodeGen/MachineInstr.h"
227330f729Sjoerg #include "llvm/CodeGen/MachineInstrBuilder.h"
237330f729Sjoerg #include "llvm/CodeGen/Passes.h"
247330f729Sjoerg #include "llvm/CodeGen/TargetRegisterInfo.h"
25*82d56013Sjoerg #include "llvm/Pass.h"
267330f729Sjoerg #include "llvm/Support/CodeGen.h"
277330f729Sjoerg #include "llvm/Support/CommandLine.h"
287330f729Sjoerg #include "llvm/Support/Debug.h"
297330f729Sjoerg #include "llvm/Support/raw_ostream.h"
30*82d56013Sjoerg #include "llvm/Target/TargetMachine.h"
317330f729Sjoerg
327330f729Sjoerg using namespace llvm;
337330f729Sjoerg
347330f729Sjoerg #define DEBUG_TYPE "hexagon-copy-combine"
357330f729Sjoerg
367330f729Sjoerg static
377330f729Sjoerg cl::opt<bool> IsCombinesDisabled("disable-merge-into-combines",
387330f729Sjoerg cl::Hidden, cl::ZeroOrMore,
397330f729Sjoerg cl::init(false),
407330f729Sjoerg cl::desc("Disable merging into combines"));
417330f729Sjoerg static
427330f729Sjoerg cl::opt<bool> IsConst64Disabled("disable-const64",
437330f729Sjoerg cl::Hidden, cl::ZeroOrMore,
447330f729Sjoerg cl::init(false),
457330f729Sjoerg cl::desc("Disable generation of const64"));
467330f729Sjoerg static
477330f729Sjoerg cl::opt<unsigned>
487330f729Sjoerg MaxNumOfInstsBetweenNewValueStoreAndTFR("max-num-inst-between-tfr-and-nv-store",
497330f729Sjoerg cl::Hidden, cl::init(4),
507330f729Sjoerg cl::desc("Maximum distance between a tfr feeding a store we "
517330f729Sjoerg "consider the store still to be newifiable"));
527330f729Sjoerg
537330f729Sjoerg namespace llvm {
547330f729Sjoerg FunctionPass *createHexagonCopyToCombine();
557330f729Sjoerg void initializeHexagonCopyToCombinePass(PassRegistry&);
567330f729Sjoerg }
577330f729Sjoerg
587330f729Sjoerg
597330f729Sjoerg namespace {
607330f729Sjoerg
617330f729Sjoerg class HexagonCopyToCombine : public MachineFunctionPass {
627330f729Sjoerg const HexagonInstrInfo *TII;
637330f729Sjoerg const TargetRegisterInfo *TRI;
647330f729Sjoerg const HexagonSubtarget *ST;
657330f729Sjoerg bool ShouldCombineAggressively;
667330f729Sjoerg
677330f729Sjoerg DenseSet<MachineInstr *> PotentiallyNewifiableTFR;
687330f729Sjoerg SmallVector<MachineInstr *, 8> DbgMItoMove;
697330f729Sjoerg
707330f729Sjoerg public:
717330f729Sjoerg static char ID;
727330f729Sjoerg
HexagonCopyToCombine()737330f729Sjoerg HexagonCopyToCombine() : MachineFunctionPass(ID) {
747330f729Sjoerg initializeHexagonCopyToCombinePass(*PassRegistry::getPassRegistry());
757330f729Sjoerg }
767330f729Sjoerg
getAnalysisUsage(AnalysisUsage & AU) const777330f729Sjoerg void getAnalysisUsage(AnalysisUsage &AU) const override {
787330f729Sjoerg MachineFunctionPass::getAnalysisUsage(AU);
797330f729Sjoerg }
807330f729Sjoerg
getPassName() const817330f729Sjoerg StringRef getPassName() const override {
827330f729Sjoerg return "Hexagon Copy-To-Combine Pass";
837330f729Sjoerg }
847330f729Sjoerg
857330f729Sjoerg bool runOnMachineFunction(MachineFunction &Fn) override;
867330f729Sjoerg
getRequiredProperties() const877330f729Sjoerg MachineFunctionProperties getRequiredProperties() const override {
887330f729Sjoerg return MachineFunctionProperties().set(
897330f729Sjoerg MachineFunctionProperties::Property::NoVRegs);
907330f729Sjoerg }
917330f729Sjoerg
927330f729Sjoerg private:
937330f729Sjoerg MachineInstr *findPairable(MachineInstr &I1, bool &DoInsertAtI1,
947330f729Sjoerg bool AllowC64);
957330f729Sjoerg
967330f729Sjoerg void findPotentialNewifiableTFRs(MachineBasicBlock &);
977330f729Sjoerg
987330f729Sjoerg void combine(MachineInstr &I1, MachineInstr &I2,
997330f729Sjoerg MachineBasicBlock::iterator &MI, bool DoInsertAtI1,
1007330f729Sjoerg bool OptForSize);
1017330f729Sjoerg
1027330f729Sjoerg bool isSafeToMoveTogether(MachineInstr &I1, MachineInstr &I2,
1037330f729Sjoerg unsigned I1DestReg, unsigned I2DestReg,
1047330f729Sjoerg bool &DoInsertAtI1);
1057330f729Sjoerg
1067330f729Sjoerg void emitCombineRR(MachineBasicBlock::iterator &Before, unsigned DestReg,
1077330f729Sjoerg MachineOperand &HiOperand, MachineOperand &LoOperand);
1087330f729Sjoerg
1097330f729Sjoerg void emitCombineRI(MachineBasicBlock::iterator &Before, unsigned DestReg,
1107330f729Sjoerg MachineOperand &HiOperand, MachineOperand &LoOperand);
1117330f729Sjoerg
1127330f729Sjoerg void emitCombineIR(MachineBasicBlock::iterator &Before, unsigned DestReg,
1137330f729Sjoerg MachineOperand &HiOperand, MachineOperand &LoOperand);
1147330f729Sjoerg
1157330f729Sjoerg void emitCombineII(MachineBasicBlock::iterator &Before, unsigned DestReg,
1167330f729Sjoerg MachineOperand &HiOperand, MachineOperand &LoOperand);
1177330f729Sjoerg
1187330f729Sjoerg void emitConst64(MachineBasicBlock::iterator &Before, unsigned DestReg,
1197330f729Sjoerg MachineOperand &HiOperand, MachineOperand &LoOperand);
1207330f729Sjoerg };
1217330f729Sjoerg
1227330f729Sjoerg } // End anonymous namespace.
1237330f729Sjoerg
1247330f729Sjoerg char HexagonCopyToCombine::ID = 0;
1257330f729Sjoerg
1267330f729Sjoerg INITIALIZE_PASS(HexagonCopyToCombine, "hexagon-copy-combine",
1277330f729Sjoerg "Hexagon Copy-To-Combine Pass", false, false)
1287330f729Sjoerg
isCombinableInstType(MachineInstr & MI,const HexagonInstrInfo * TII,bool ShouldCombineAggressively)1297330f729Sjoerg static bool isCombinableInstType(MachineInstr &MI, const HexagonInstrInfo *TII,
1307330f729Sjoerg bool ShouldCombineAggressively) {
1317330f729Sjoerg switch (MI.getOpcode()) {
1327330f729Sjoerg case Hexagon::A2_tfr: {
1337330f729Sjoerg // A COPY instruction can be combined if its arguments are IntRegs (32bit).
1347330f729Sjoerg const MachineOperand &Op0 = MI.getOperand(0);
1357330f729Sjoerg const MachineOperand &Op1 = MI.getOperand(1);
1367330f729Sjoerg assert(Op0.isReg() && Op1.isReg());
1377330f729Sjoerg
1387330f729Sjoerg Register DestReg = Op0.getReg();
1397330f729Sjoerg Register SrcReg = Op1.getReg();
1407330f729Sjoerg return Hexagon::IntRegsRegClass.contains(DestReg) &&
1417330f729Sjoerg Hexagon::IntRegsRegClass.contains(SrcReg);
1427330f729Sjoerg }
1437330f729Sjoerg
1447330f729Sjoerg case Hexagon::A2_tfrsi: {
1457330f729Sjoerg // A transfer-immediate can be combined if its argument is a signed 8bit
1467330f729Sjoerg // value.
1477330f729Sjoerg const MachineOperand &Op0 = MI.getOperand(0);
1487330f729Sjoerg const MachineOperand &Op1 = MI.getOperand(1);
1497330f729Sjoerg assert(Op0.isReg());
1507330f729Sjoerg
1517330f729Sjoerg Register DestReg = Op0.getReg();
1527330f729Sjoerg // Ensure that TargetFlags are MO_NO_FLAG for a global. This is a
1537330f729Sjoerg // workaround for an ABI bug that prevents GOT relocations on combine
1547330f729Sjoerg // instructions
1557330f729Sjoerg if (!Op1.isImm() && Op1.getTargetFlags() != HexagonII::MO_NO_FLAG)
1567330f729Sjoerg return false;
1577330f729Sjoerg
1587330f729Sjoerg // Only combine constant extended A2_tfrsi if we are in aggressive mode.
1597330f729Sjoerg bool NotExt = Op1.isImm() && isInt<8>(Op1.getImm());
1607330f729Sjoerg return Hexagon::IntRegsRegClass.contains(DestReg) &&
1617330f729Sjoerg (ShouldCombineAggressively || NotExt);
1627330f729Sjoerg }
1637330f729Sjoerg
1647330f729Sjoerg case Hexagon::V6_vassign:
1657330f729Sjoerg return true;
1667330f729Sjoerg
1677330f729Sjoerg default:
1687330f729Sjoerg break;
1697330f729Sjoerg }
1707330f729Sjoerg
1717330f729Sjoerg return false;
1727330f729Sjoerg }
1737330f729Sjoerg
isGreaterThanNBitTFRI(const MachineInstr & I)1747330f729Sjoerg template <unsigned N> static bool isGreaterThanNBitTFRI(const MachineInstr &I) {
1757330f729Sjoerg if (I.getOpcode() == Hexagon::TFRI64_V4 ||
1767330f729Sjoerg I.getOpcode() == Hexagon::A2_tfrsi) {
1777330f729Sjoerg const MachineOperand &Op = I.getOperand(1);
1787330f729Sjoerg return !Op.isImm() || !isInt<N>(Op.getImm());
1797330f729Sjoerg }
1807330f729Sjoerg return false;
1817330f729Sjoerg }
1827330f729Sjoerg
1837330f729Sjoerg /// areCombinableOperations - Returns true if the two instruction can be merge
1847330f729Sjoerg /// into a combine (ignoring register constraints).
areCombinableOperations(const TargetRegisterInfo * TRI,MachineInstr & HighRegInst,MachineInstr & LowRegInst,bool AllowC64)1857330f729Sjoerg static bool areCombinableOperations(const TargetRegisterInfo *TRI,
1867330f729Sjoerg MachineInstr &HighRegInst,
1877330f729Sjoerg MachineInstr &LowRegInst, bool AllowC64) {
1887330f729Sjoerg unsigned HiOpc = HighRegInst.getOpcode();
1897330f729Sjoerg unsigned LoOpc = LowRegInst.getOpcode();
1907330f729Sjoerg
1917330f729Sjoerg auto verifyOpc = [](unsigned Opc) -> void {
1927330f729Sjoerg switch (Opc) {
1937330f729Sjoerg case Hexagon::A2_tfr:
1947330f729Sjoerg case Hexagon::A2_tfrsi:
1957330f729Sjoerg case Hexagon::V6_vassign:
1967330f729Sjoerg break;
1977330f729Sjoerg default:
1987330f729Sjoerg llvm_unreachable("Unexpected opcode");
1997330f729Sjoerg }
2007330f729Sjoerg };
2017330f729Sjoerg verifyOpc(HiOpc);
2027330f729Sjoerg verifyOpc(LoOpc);
2037330f729Sjoerg
2047330f729Sjoerg if (HiOpc == Hexagon::V6_vassign || LoOpc == Hexagon::V6_vassign)
2057330f729Sjoerg return HiOpc == LoOpc;
2067330f729Sjoerg
2077330f729Sjoerg if (!AllowC64) {
2087330f729Sjoerg // There is no combine of two constant extended values.
2097330f729Sjoerg if (isGreaterThanNBitTFRI<8>(HighRegInst) &&
2107330f729Sjoerg isGreaterThanNBitTFRI<6>(LowRegInst))
2117330f729Sjoerg return false;
2127330f729Sjoerg }
2137330f729Sjoerg
2147330f729Sjoerg // There is a combine of two constant extended values into CONST64,
2157330f729Sjoerg // provided both constants are true immediates.
2167330f729Sjoerg if (isGreaterThanNBitTFRI<16>(HighRegInst) &&
217*82d56013Sjoerg isGreaterThanNBitTFRI<16>(LowRegInst) && !IsConst64Disabled)
2187330f729Sjoerg return (HighRegInst.getOperand(1).isImm() &&
2197330f729Sjoerg LowRegInst.getOperand(1).isImm());
2207330f729Sjoerg
2217330f729Sjoerg // There is no combine of two constant extended values, unless handled above
2227330f729Sjoerg // Make both 8-bit size checks to allow both combine (#,##) and combine(##,#)
2237330f729Sjoerg if (isGreaterThanNBitTFRI<8>(HighRegInst) &&
2247330f729Sjoerg isGreaterThanNBitTFRI<8>(LowRegInst))
2257330f729Sjoerg return false;
2267330f729Sjoerg
2277330f729Sjoerg return true;
2287330f729Sjoerg }
2297330f729Sjoerg
isEvenReg(unsigned Reg)2307330f729Sjoerg static bool isEvenReg(unsigned Reg) {
2317330f729Sjoerg assert(Register::isPhysicalRegister(Reg));
2327330f729Sjoerg if (Hexagon::IntRegsRegClass.contains(Reg))
2337330f729Sjoerg return (Reg - Hexagon::R0) % 2 == 0;
2347330f729Sjoerg if (Hexagon::HvxVRRegClass.contains(Reg))
2357330f729Sjoerg return (Reg - Hexagon::V0) % 2 == 0;
2367330f729Sjoerg llvm_unreachable("Invalid register");
2377330f729Sjoerg }
2387330f729Sjoerg
removeKillInfo(MachineInstr & MI,unsigned RegNotKilled)2397330f729Sjoerg static void removeKillInfo(MachineInstr &MI, unsigned RegNotKilled) {
2407330f729Sjoerg for (unsigned I = 0, E = MI.getNumOperands(); I != E; ++I) {
2417330f729Sjoerg MachineOperand &Op = MI.getOperand(I);
2427330f729Sjoerg if (!Op.isReg() || Op.getReg() != RegNotKilled || !Op.isKill())
2437330f729Sjoerg continue;
2447330f729Sjoerg Op.setIsKill(false);
2457330f729Sjoerg }
2467330f729Sjoerg }
2477330f729Sjoerg
2487330f729Sjoerg /// Returns true if it is unsafe to move a copy instruction from \p UseReg to
2497330f729Sjoerg /// \p DestReg over the instruction \p MI.
isUnsafeToMoveAcross(MachineInstr & MI,unsigned UseReg,unsigned DestReg,const TargetRegisterInfo * TRI)2507330f729Sjoerg static bool isUnsafeToMoveAcross(MachineInstr &MI, unsigned UseReg,
2517330f729Sjoerg unsigned DestReg,
2527330f729Sjoerg const TargetRegisterInfo *TRI) {
2537330f729Sjoerg return (UseReg && (MI.modifiesRegister(UseReg, TRI))) ||
2547330f729Sjoerg MI.modifiesRegister(DestReg, TRI) || MI.readsRegister(DestReg, TRI) ||
2557330f729Sjoerg MI.hasUnmodeledSideEffects() || MI.isInlineAsm() ||
2567330f729Sjoerg MI.isMetaInstruction();
2577330f729Sjoerg }
2587330f729Sjoerg
UseReg(const MachineOperand & MO)2597330f729Sjoerg static Register UseReg(const MachineOperand& MO) {
2607330f729Sjoerg return MO.isReg() ? MO.getReg() : Register();
2617330f729Sjoerg }
2627330f729Sjoerg
2637330f729Sjoerg /// isSafeToMoveTogether - Returns true if it is safe to move I1 next to I2 such
2647330f729Sjoerg /// that the two instructions can be paired in a combine.
isSafeToMoveTogether(MachineInstr & I1,MachineInstr & I2,unsigned I1DestReg,unsigned I2DestReg,bool & DoInsertAtI1)2657330f729Sjoerg bool HexagonCopyToCombine::isSafeToMoveTogether(MachineInstr &I1,
2667330f729Sjoerg MachineInstr &I2,
2677330f729Sjoerg unsigned I1DestReg,
2687330f729Sjoerg unsigned I2DestReg,
2697330f729Sjoerg bool &DoInsertAtI1) {
2707330f729Sjoerg Register I2UseReg = UseReg(I2.getOperand(1));
2717330f729Sjoerg
2727330f729Sjoerg // It is not safe to move I1 and I2 into one combine if I2 has a true
2737330f729Sjoerg // dependence on I1.
2747330f729Sjoerg if (I2UseReg && I1.modifiesRegister(I2UseReg, TRI))
2757330f729Sjoerg return false;
2767330f729Sjoerg
2777330f729Sjoerg bool isSafe = true;
2787330f729Sjoerg
2797330f729Sjoerg // First try to move I2 towards I1.
2807330f729Sjoerg {
2817330f729Sjoerg // A reverse_iterator instantiated like below starts before I2, and I1
2827330f729Sjoerg // respectively.
2837330f729Sjoerg // Look at instructions I in between I2 and (excluding) I1.
284*82d56013Sjoerg MachineBasicBlock::reverse_iterator I = ++I2.getIterator().getReverse();
285*82d56013Sjoerg MachineBasicBlock::reverse_iterator End = I1.getIterator().getReverse();
2867330f729Sjoerg // At 03 we got better results (dhrystone!) by being more conservative.
2877330f729Sjoerg if (!ShouldCombineAggressively)
288*82d56013Sjoerg End = ++I1.getIterator().getReverse();
2897330f729Sjoerg // If I2 kills its operand and we move I2 over an instruction that also
2907330f729Sjoerg // uses I2's use reg we need to modify that (first) instruction to now kill
2917330f729Sjoerg // this reg.
2927330f729Sjoerg unsigned KilledOperand = 0;
2937330f729Sjoerg if (I2.killsRegister(I2UseReg))
2947330f729Sjoerg KilledOperand = I2UseReg;
2957330f729Sjoerg MachineInstr *KillingInstr = nullptr;
2967330f729Sjoerg
2977330f729Sjoerg for (; I != End; ++I) {
2987330f729Sjoerg // If the intervening instruction I:
2997330f729Sjoerg // * modifies I2's use reg
3007330f729Sjoerg // * modifies I2's def reg
3017330f729Sjoerg // * reads I2's def reg
3027330f729Sjoerg // * or has unmodelled side effects
3037330f729Sjoerg // we can't move I2 across it.
3047330f729Sjoerg if (I->isDebugInstr())
3057330f729Sjoerg continue;
3067330f729Sjoerg
3077330f729Sjoerg if (isUnsafeToMoveAcross(*I, I2UseReg, I2DestReg, TRI)) {
3087330f729Sjoerg isSafe = false;
3097330f729Sjoerg break;
3107330f729Sjoerg }
3117330f729Sjoerg
3127330f729Sjoerg // Update first use of the killed operand.
3137330f729Sjoerg if (!KillingInstr && KilledOperand &&
3147330f729Sjoerg I->readsRegister(KilledOperand, TRI))
3157330f729Sjoerg KillingInstr = &*I;
3167330f729Sjoerg }
3177330f729Sjoerg if (isSafe) {
3187330f729Sjoerg // Update the intermediate instruction to with the kill flag.
3197330f729Sjoerg if (KillingInstr) {
3207330f729Sjoerg bool Added = KillingInstr->addRegisterKilled(KilledOperand, TRI, true);
3217330f729Sjoerg (void)Added; // suppress compiler warning
3227330f729Sjoerg assert(Added && "Must successfully update kill flag");
3237330f729Sjoerg removeKillInfo(I2, KilledOperand);
3247330f729Sjoerg }
3257330f729Sjoerg DoInsertAtI1 = true;
3267330f729Sjoerg return true;
3277330f729Sjoerg }
3287330f729Sjoerg }
3297330f729Sjoerg
3307330f729Sjoerg // Try to move I1 towards I2.
3317330f729Sjoerg {
3327330f729Sjoerg // Look at instructions I in between I1 and (excluding) I2.
3337330f729Sjoerg MachineBasicBlock::iterator I(I1), End(I2);
3347330f729Sjoerg // At O3 we got better results (dhrystone) by being more conservative here.
3357330f729Sjoerg if (!ShouldCombineAggressively)
3367330f729Sjoerg End = std::next(MachineBasicBlock::iterator(I2));
3377330f729Sjoerg Register I1UseReg = UseReg(I1.getOperand(1));
3387330f729Sjoerg // Track killed operands. If we move across an instruction that kills our
3397330f729Sjoerg // operand, we need to update the kill information on the moved I1. It kills
3407330f729Sjoerg // the operand now.
3417330f729Sjoerg MachineInstr *KillingInstr = nullptr;
3427330f729Sjoerg unsigned KilledOperand = 0;
3437330f729Sjoerg
3447330f729Sjoerg while(++I != End) {
3457330f729Sjoerg MachineInstr &MI = *I;
3467330f729Sjoerg // If the intervening instruction MI:
3477330f729Sjoerg // * modifies I1's use reg
3487330f729Sjoerg // * modifies I1's def reg
3497330f729Sjoerg // * reads I1's def reg
3507330f729Sjoerg // * or has unmodelled side effects
3517330f729Sjoerg // We introduce this special case because llvm has no api to remove a
3527330f729Sjoerg // kill flag for a register (a removeRegisterKilled() analogous to
3537330f729Sjoerg // addRegisterKilled) that handles aliased register correctly.
3547330f729Sjoerg // * or has a killed aliased register use of I1's use reg
3557330f729Sjoerg // %d4 = A2_tfrpi 16
3567330f729Sjoerg // %r6 = A2_tfr %r9
3577330f729Sjoerg // %r8 = KILL %r8, implicit killed %d4
3587330f729Sjoerg // If we want to move R6 = across the KILL instruction we would have
3597330f729Sjoerg // to remove the implicit killed %d4 operand. For now, we are
3607330f729Sjoerg // conservative and disallow the move.
3617330f729Sjoerg // we can't move I1 across it.
3627330f729Sjoerg if (MI.isDebugInstr()) {
3637330f729Sjoerg if (MI.readsRegister(I1DestReg, TRI)) // Move this instruction after I2.
3647330f729Sjoerg DbgMItoMove.push_back(&MI);
3657330f729Sjoerg continue;
3667330f729Sjoerg }
3677330f729Sjoerg
3687330f729Sjoerg if (isUnsafeToMoveAcross(MI, I1UseReg, I1DestReg, TRI) ||
3697330f729Sjoerg // Check for an aliased register kill. Bail out if we see one.
3707330f729Sjoerg (!MI.killsRegister(I1UseReg) && MI.killsRegister(I1UseReg, TRI)))
3717330f729Sjoerg return false;
3727330f729Sjoerg
3737330f729Sjoerg // Check for an exact kill (registers match).
3747330f729Sjoerg if (I1UseReg && MI.killsRegister(I1UseReg)) {
3757330f729Sjoerg assert(!KillingInstr && "Should only see one killing instruction");
3767330f729Sjoerg KilledOperand = I1UseReg;
3777330f729Sjoerg KillingInstr = &MI;
3787330f729Sjoerg }
3797330f729Sjoerg }
3807330f729Sjoerg if (KillingInstr) {
3817330f729Sjoerg removeKillInfo(*KillingInstr, KilledOperand);
3827330f729Sjoerg // Update I1 to set the kill flag. This flag will later be picked up by
3837330f729Sjoerg // the new COMBINE instruction.
3847330f729Sjoerg bool Added = I1.addRegisterKilled(KilledOperand, TRI);
3857330f729Sjoerg (void)Added; // suppress compiler warning
3867330f729Sjoerg assert(Added && "Must successfully update kill flag");
3877330f729Sjoerg }
3887330f729Sjoerg DoInsertAtI1 = false;
3897330f729Sjoerg }
3907330f729Sjoerg
3917330f729Sjoerg return true;
3927330f729Sjoerg }
3937330f729Sjoerg
3947330f729Sjoerg /// findPotentialNewifiableTFRs - Finds tranfers that feed stores that could be
3957330f729Sjoerg /// newified. (A use of a 64 bit register define can not be newified)
3967330f729Sjoerg void
findPotentialNewifiableTFRs(MachineBasicBlock & BB)3977330f729Sjoerg HexagonCopyToCombine::findPotentialNewifiableTFRs(MachineBasicBlock &BB) {
3987330f729Sjoerg DenseMap<unsigned, MachineInstr *> LastDef;
3997330f729Sjoerg for (MachineInstr &MI : BB) {
4007330f729Sjoerg if (MI.isDebugInstr())
4017330f729Sjoerg continue;
4027330f729Sjoerg
4037330f729Sjoerg // Mark TFRs that feed a potential new value store as such.
4047330f729Sjoerg if (TII->mayBeNewStore(MI)) {
4057330f729Sjoerg // Look for uses of TFR instructions.
4067330f729Sjoerg for (unsigned OpdIdx = 0, OpdE = MI.getNumOperands(); OpdIdx != OpdE;
4077330f729Sjoerg ++OpdIdx) {
4087330f729Sjoerg MachineOperand &Op = MI.getOperand(OpdIdx);
4097330f729Sjoerg
4107330f729Sjoerg // Skip over anything except register uses.
4117330f729Sjoerg if (!Op.isReg() || !Op.isUse() || !Op.getReg())
4127330f729Sjoerg continue;
4137330f729Sjoerg
4147330f729Sjoerg // Look for the defining instruction.
4157330f729Sjoerg Register Reg = Op.getReg();
4167330f729Sjoerg MachineInstr *DefInst = LastDef[Reg];
4177330f729Sjoerg if (!DefInst)
4187330f729Sjoerg continue;
4197330f729Sjoerg if (!isCombinableInstType(*DefInst, TII, ShouldCombineAggressively))
4207330f729Sjoerg continue;
4217330f729Sjoerg
4227330f729Sjoerg // Only close newifiable stores should influence the decision.
4237330f729Sjoerg // Ignore the debug instructions in between.
4247330f729Sjoerg MachineBasicBlock::iterator It(DefInst);
4257330f729Sjoerg unsigned NumInstsToDef = 0;
4267330f729Sjoerg while (&*It != &MI) {
4277330f729Sjoerg if (!It->isDebugInstr())
4287330f729Sjoerg ++NumInstsToDef;
4297330f729Sjoerg ++It;
4307330f729Sjoerg }
4317330f729Sjoerg
4327330f729Sjoerg if (NumInstsToDef > MaxNumOfInstsBetweenNewValueStoreAndTFR)
4337330f729Sjoerg continue;
4347330f729Sjoerg
4357330f729Sjoerg PotentiallyNewifiableTFR.insert(DefInst);
4367330f729Sjoerg }
4377330f729Sjoerg // Skip to next instruction.
4387330f729Sjoerg continue;
4397330f729Sjoerg }
4407330f729Sjoerg
4417330f729Sjoerg // Put instructions that last defined integer or double registers into the
4427330f729Sjoerg // map.
4437330f729Sjoerg for (MachineOperand &Op : MI.operands()) {
4447330f729Sjoerg if (Op.isReg()) {
4457330f729Sjoerg if (!Op.isDef() || !Op.getReg())
4467330f729Sjoerg continue;
4477330f729Sjoerg Register Reg = Op.getReg();
4487330f729Sjoerg if (Hexagon::DoubleRegsRegClass.contains(Reg)) {
4497330f729Sjoerg for (MCSubRegIterator SubRegs(Reg, TRI); SubRegs.isValid(); ++SubRegs)
4507330f729Sjoerg LastDef[*SubRegs] = &MI;
4517330f729Sjoerg } else if (Hexagon::IntRegsRegClass.contains(Reg))
4527330f729Sjoerg LastDef[Reg] = &MI;
4537330f729Sjoerg } else if (Op.isRegMask()) {
4547330f729Sjoerg for (unsigned Reg : Hexagon::IntRegsRegClass)
4557330f729Sjoerg if (Op.clobbersPhysReg(Reg))
4567330f729Sjoerg LastDef[Reg] = &MI;
4577330f729Sjoerg }
4587330f729Sjoerg }
4597330f729Sjoerg }
4607330f729Sjoerg }
4617330f729Sjoerg
runOnMachineFunction(MachineFunction & MF)4627330f729Sjoerg bool HexagonCopyToCombine::runOnMachineFunction(MachineFunction &MF) {
4637330f729Sjoerg if (skipFunction(MF.getFunction()))
4647330f729Sjoerg return false;
4657330f729Sjoerg
4667330f729Sjoerg if (IsCombinesDisabled) return false;
4677330f729Sjoerg
4687330f729Sjoerg bool HasChanged = false;
4697330f729Sjoerg
4707330f729Sjoerg // Get target info.
4717330f729Sjoerg ST = &MF.getSubtarget<HexagonSubtarget>();
4727330f729Sjoerg TRI = ST->getRegisterInfo();
4737330f729Sjoerg TII = ST->getInstrInfo();
4747330f729Sjoerg
4757330f729Sjoerg const Function &F = MF.getFunction();
4767330f729Sjoerg bool OptForSize = F.hasFnAttribute(Attribute::OptimizeForSize);
4777330f729Sjoerg
4787330f729Sjoerg // Combine aggressively (for code size)
4797330f729Sjoerg ShouldCombineAggressively =
4807330f729Sjoerg MF.getTarget().getOptLevel() <= CodeGenOpt::Default;
4817330f729Sjoerg
482*82d56013Sjoerg // Disable CONST64 for tiny core since it takes a LD resource.
483*82d56013Sjoerg if (!OptForSize && ST->isTinyCore())
484*82d56013Sjoerg IsConst64Disabled = true;
485*82d56013Sjoerg
4867330f729Sjoerg // Traverse basic blocks.
4877330f729Sjoerg for (MachineFunction::iterator BI = MF.begin(), BE = MF.end(); BI != BE;
4887330f729Sjoerg ++BI) {
4897330f729Sjoerg PotentiallyNewifiableTFR.clear();
4907330f729Sjoerg findPotentialNewifiableTFRs(*BI);
4917330f729Sjoerg
4927330f729Sjoerg // Traverse instructions in basic block.
4937330f729Sjoerg for(MachineBasicBlock::iterator MI = BI->begin(), End = BI->end();
4947330f729Sjoerg MI != End;) {
4957330f729Sjoerg MachineInstr &I1 = *MI++;
4967330f729Sjoerg
4977330f729Sjoerg if (I1.isDebugInstr())
4987330f729Sjoerg continue;
4997330f729Sjoerg
5007330f729Sjoerg // Don't combine a TFR whose user could be newified (instructions that
5017330f729Sjoerg // define double registers can not be newified - Programmer's Ref Manual
5027330f729Sjoerg // 5.4.2 New-value stores).
5037330f729Sjoerg if (ShouldCombineAggressively && PotentiallyNewifiableTFR.count(&I1))
5047330f729Sjoerg continue;
5057330f729Sjoerg
5067330f729Sjoerg // Ignore instructions that are not combinable.
5077330f729Sjoerg if (!isCombinableInstType(I1, TII, ShouldCombineAggressively))
5087330f729Sjoerg continue;
5097330f729Sjoerg
5107330f729Sjoerg // Find a second instruction that can be merged into a combine
5117330f729Sjoerg // instruction. In addition, also find all the debug instructions that
5127330f729Sjoerg // need to be moved along with it.
5137330f729Sjoerg bool DoInsertAtI1 = false;
5147330f729Sjoerg DbgMItoMove.clear();
5157330f729Sjoerg MachineInstr *I2 = findPairable(I1, DoInsertAtI1, OptForSize);
5167330f729Sjoerg if (I2) {
5177330f729Sjoerg HasChanged = true;
5187330f729Sjoerg combine(I1, *I2, MI, DoInsertAtI1, OptForSize);
5197330f729Sjoerg }
5207330f729Sjoerg }
5217330f729Sjoerg }
5227330f729Sjoerg
5237330f729Sjoerg return HasChanged;
5247330f729Sjoerg }
5257330f729Sjoerg
5267330f729Sjoerg /// findPairable - Returns an instruction that can be merged with \p I1 into a
5277330f729Sjoerg /// COMBINE instruction or 0 if no such instruction can be found. Returns true
5287330f729Sjoerg /// in \p DoInsertAtI1 if the combine must be inserted at instruction \p I1
5297330f729Sjoerg /// false if the combine must be inserted at the returned instruction.
findPairable(MachineInstr & I1,bool & DoInsertAtI1,bool AllowC64)5307330f729Sjoerg MachineInstr *HexagonCopyToCombine::findPairable(MachineInstr &I1,
5317330f729Sjoerg bool &DoInsertAtI1,
5327330f729Sjoerg bool AllowC64) {
5337330f729Sjoerg MachineBasicBlock::iterator I2 = std::next(MachineBasicBlock::iterator(I1));
5347330f729Sjoerg while (I2 != I1.getParent()->end() && I2->isDebugInstr())
5357330f729Sjoerg ++I2;
5367330f729Sjoerg
5377330f729Sjoerg Register I1DestReg = I1.getOperand(0).getReg();
5387330f729Sjoerg
5397330f729Sjoerg for (MachineBasicBlock::iterator End = I1.getParent()->end(); I2 != End;
5407330f729Sjoerg ++I2) {
5417330f729Sjoerg // Bail out early if we see a second definition of I1DestReg.
5427330f729Sjoerg if (I2->modifiesRegister(I1DestReg, TRI))
5437330f729Sjoerg break;
5447330f729Sjoerg
5457330f729Sjoerg // Ignore non-combinable instructions.
5467330f729Sjoerg if (!isCombinableInstType(*I2, TII, ShouldCombineAggressively))
5477330f729Sjoerg continue;
5487330f729Sjoerg
5497330f729Sjoerg // Don't combine a TFR whose user could be newified.
5507330f729Sjoerg if (ShouldCombineAggressively && PotentiallyNewifiableTFR.count(&*I2))
5517330f729Sjoerg continue;
5527330f729Sjoerg
5537330f729Sjoerg Register I2DestReg = I2->getOperand(0).getReg();
5547330f729Sjoerg
5557330f729Sjoerg // Check that registers are adjacent and that the first destination register
5567330f729Sjoerg // is even.
5577330f729Sjoerg bool IsI1LowReg = (I2DestReg - I1DestReg) == 1;
5587330f729Sjoerg bool IsI2LowReg = (I1DestReg - I2DestReg) == 1;
5597330f729Sjoerg unsigned FirstRegIndex = IsI1LowReg ? I1DestReg : I2DestReg;
5607330f729Sjoerg if ((!IsI1LowReg && !IsI2LowReg) || !isEvenReg(FirstRegIndex))
5617330f729Sjoerg continue;
5627330f729Sjoerg
5637330f729Sjoerg // Check that the two instructions are combinable.
5647330f729Sjoerg // The order matters because in a A2_tfrsi we might can encode a int8 as
5657330f729Sjoerg // the hi reg operand but only a uint6 as the low reg operand.
5667330f729Sjoerg if ((IsI2LowReg && !areCombinableOperations(TRI, I1, *I2, AllowC64)) ||
5677330f729Sjoerg (IsI1LowReg && !areCombinableOperations(TRI, *I2, I1, AllowC64)))
5687330f729Sjoerg break;
5697330f729Sjoerg
5707330f729Sjoerg if (isSafeToMoveTogether(I1, *I2, I1DestReg, I2DestReg, DoInsertAtI1))
5717330f729Sjoerg return &*I2;
5727330f729Sjoerg
5737330f729Sjoerg // Not safe. Stop searching.
5747330f729Sjoerg break;
5757330f729Sjoerg }
5767330f729Sjoerg return nullptr;
5777330f729Sjoerg }
5787330f729Sjoerg
combine(MachineInstr & I1,MachineInstr & I2,MachineBasicBlock::iterator & MI,bool DoInsertAtI1,bool OptForSize)5797330f729Sjoerg void HexagonCopyToCombine::combine(MachineInstr &I1, MachineInstr &I2,
5807330f729Sjoerg MachineBasicBlock::iterator &MI,
5817330f729Sjoerg bool DoInsertAtI1, bool OptForSize) {
5827330f729Sjoerg // We are going to delete I2. If MI points to I2 advance it to the next
5837330f729Sjoerg // instruction.
5847330f729Sjoerg if (MI == I2.getIterator())
5857330f729Sjoerg ++MI;
5867330f729Sjoerg
5877330f729Sjoerg // Figure out whether I1 or I2 goes into the lowreg part.
5887330f729Sjoerg Register I1DestReg = I1.getOperand(0).getReg();
5897330f729Sjoerg Register I2DestReg = I2.getOperand(0).getReg();
5907330f729Sjoerg bool IsI1Loreg = (I2DestReg - I1DestReg) == 1;
5917330f729Sjoerg unsigned LoRegDef = IsI1Loreg ? I1DestReg : I2DestReg;
5927330f729Sjoerg unsigned SubLo;
5937330f729Sjoerg
5947330f729Sjoerg const TargetRegisterClass *SuperRC = nullptr;
5957330f729Sjoerg if (Hexagon::IntRegsRegClass.contains(LoRegDef)) {
5967330f729Sjoerg SuperRC = &Hexagon::DoubleRegsRegClass;
5977330f729Sjoerg SubLo = Hexagon::isub_lo;
5987330f729Sjoerg } else if (Hexagon::HvxVRRegClass.contains(LoRegDef)) {
5997330f729Sjoerg assert(ST->useHVXOps());
6007330f729Sjoerg SuperRC = &Hexagon::HvxWRRegClass;
6017330f729Sjoerg SubLo = Hexagon::vsub_lo;
6027330f729Sjoerg } else
6037330f729Sjoerg llvm_unreachable("Unexpected register class");
6047330f729Sjoerg
6057330f729Sjoerg // Get the double word register.
6067330f729Sjoerg unsigned DoubleRegDest = TRI->getMatchingSuperReg(LoRegDef, SubLo, SuperRC);
6077330f729Sjoerg assert(DoubleRegDest != 0 && "Expect a valid register");
6087330f729Sjoerg
6097330f729Sjoerg // Setup source operands.
6107330f729Sjoerg MachineOperand &LoOperand = IsI1Loreg ? I1.getOperand(1) : I2.getOperand(1);
6117330f729Sjoerg MachineOperand &HiOperand = IsI1Loreg ? I2.getOperand(1) : I1.getOperand(1);
6127330f729Sjoerg
6137330f729Sjoerg // Figure out which source is a register and which a constant.
6147330f729Sjoerg bool IsHiReg = HiOperand.isReg();
6157330f729Sjoerg bool IsLoReg = LoOperand.isReg();
6167330f729Sjoerg
6177330f729Sjoerg // There is a combine of two constant extended values into CONST64.
6187330f729Sjoerg bool IsC64 = OptForSize && LoOperand.isImm() && HiOperand.isImm() &&
6197330f729Sjoerg isGreaterThanNBitTFRI<16>(I1) && isGreaterThanNBitTFRI<16>(I2);
6207330f729Sjoerg
6217330f729Sjoerg MachineBasicBlock::iterator InsertPt(DoInsertAtI1 ? I1 : I2);
6227330f729Sjoerg // Emit combine.
6237330f729Sjoerg if (IsHiReg && IsLoReg)
6247330f729Sjoerg emitCombineRR(InsertPt, DoubleRegDest, HiOperand, LoOperand);
6257330f729Sjoerg else if (IsHiReg)
6267330f729Sjoerg emitCombineRI(InsertPt, DoubleRegDest, HiOperand, LoOperand);
6277330f729Sjoerg else if (IsLoReg)
6287330f729Sjoerg emitCombineIR(InsertPt, DoubleRegDest, HiOperand, LoOperand);
6297330f729Sjoerg else if (IsC64 && !IsConst64Disabled)
6307330f729Sjoerg emitConst64(InsertPt, DoubleRegDest, HiOperand, LoOperand);
6317330f729Sjoerg else
6327330f729Sjoerg emitCombineII(InsertPt, DoubleRegDest, HiOperand, LoOperand);
6337330f729Sjoerg
6347330f729Sjoerg // Move debug instructions along with I1 if it's being
6357330f729Sjoerg // moved towards I2.
6367330f729Sjoerg if (!DoInsertAtI1 && DbgMItoMove.size() != 0) {
6377330f729Sjoerg // Insert debug instructions at the new location before I2.
6387330f729Sjoerg MachineBasicBlock *BB = InsertPt->getParent();
6397330f729Sjoerg for (auto NewMI : DbgMItoMove) {
6407330f729Sjoerg // If iterator MI is pointing to DEBUG_VAL, make sure
6417330f729Sjoerg // MI now points to next relevant instruction.
6427330f729Sjoerg if (NewMI == MI)
6437330f729Sjoerg ++MI;
6447330f729Sjoerg BB->splice(InsertPt, BB, NewMI);
6457330f729Sjoerg }
6467330f729Sjoerg }
6477330f729Sjoerg
6487330f729Sjoerg I1.eraseFromParent();
6497330f729Sjoerg I2.eraseFromParent();
6507330f729Sjoerg }
6517330f729Sjoerg
emitConst64(MachineBasicBlock::iterator & InsertPt,unsigned DoubleDestReg,MachineOperand & HiOperand,MachineOperand & LoOperand)6527330f729Sjoerg void HexagonCopyToCombine::emitConst64(MachineBasicBlock::iterator &InsertPt,
6537330f729Sjoerg unsigned DoubleDestReg,
6547330f729Sjoerg MachineOperand &HiOperand,
6557330f729Sjoerg MachineOperand &LoOperand) {
6567330f729Sjoerg LLVM_DEBUG(dbgs() << "Found a CONST64\n");
6577330f729Sjoerg
6587330f729Sjoerg DebugLoc DL = InsertPt->getDebugLoc();
6597330f729Sjoerg MachineBasicBlock *BB = InsertPt->getParent();
6607330f729Sjoerg assert(LoOperand.isImm() && HiOperand.isImm() &&
6617330f729Sjoerg "Both operands must be immediate");
6627330f729Sjoerg
6637330f729Sjoerg int64_t V = HiOperand.getImm();
6647330f729Sjoerg V = (V << 32) | (0x0ffffffffLL & LoOperand.getImm());
6657330f729Sjoerg BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::CONST64), DoubleDestReg)
6667330f729Sjoerg .addImm(V);
6677330f729Sjoerg }
6687330f729Sjoerg
emitCombineII(MachineBasicBlock::iterator & InsertPt,unsigned DoubleDestReg,MachineOperand & HiOperand,MachineOperand & LoOperand)6697330f729Sjoerg void HexagonCopyToCombine::emitCombineII(MachineBasicBlock::iterator &InsertPt,
6707330f729Sjoerg unsigned DoubleDestReg,
6717330f729Sjoerg MachineOperand &HiOperand,
6727330f729Sjoerg MachineOperand &LoOperand) {
6737330f729Sjoerg DebugLoc DL = InsertPt->getDebugLoc();
6747330f729Sjoerg MachineBasicBlock *BB = InsertPt->getParent();
6757330f729Sjoerg
6767330f729Sjoerg // Handle globals.
6777330f729Sjoerg if (HiOperand.isGlobal()) {
6787330f729Sjoerg BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A2_combineii), DoubleDestReg)
6797330f729Sjoerg .addGlobalAddress(HiOperand.getGlobal(), HiOperand.getOffset(),
6807330f729Sjoerg HiOperand.getTargetFlags())
6817330f729Sjoerg .addImm(LoOperand.getImm());
6827330f729Sjoerg return;
6837330f729Sjoerg }
6847330f729Sjoerg if (LoOperand.isGlobal()) {
6857330f729Sjoerg BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineii), DoubleDestReg)
6867330f729Sjoerg .addImm(HiOperand.getImm())
6877330f729Sjoerg .addGlobalAddress(LoOperand.getGlobal(), LoOperand.getOffset(),
6887330f729Sjoerg LoOperand.getTargetFlags());
6897330f729Sjoerg return;
6907330f729Sjoerg }
6917330f729Sjoerg
6927330f729Sjoerg // Handle block addresses.
6937330f729Sjoerg if (HiOperand.isBlockAddress()) {
6947330f729Sjoerg BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A2_combineii), DoubleDestReg)
6957330f729Sjoerg .addBlockAddress(HiOperand.getBlockAddress(), HiOperand.getOffset(),
6967330f729Sjoerg HiOperand.getTargetFlags())
6977330f729Sjoerg .addImm(LoOperand.getImm());
6987330f729Sjoerg return;
6997330f729Sjoerg }
7007330f729Sjoerg if (LoOperand.isBlockAddress()) {
7017330f729Sjoerg BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineii), DoubleDestReg)
7027330f729Sjoerg .addImm(HiOperand.getImm())
7037330f729Sjoerg .addBlockAddress(LoOperand.getBlockAddress(), LoOperand.getOffset(),
7047330f729Sjoerg LoOperand.getTargetFlags());
7057330f729Sjoerg return;
7067330f729Sjoerg }
7077330f729Sjoerg
7087330f729Sjoerg // Handle jump tables.
7097330f729Sjoerg if (HiOperand.isJTI()) {
7107330f729Sjoerg BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A2_combineii), DoubleDestReg)
7117330f729Sjoerg .addJumpTableIndex(HiOperand.getIndex(), HiOperand.getTargetFlags())
7127330f729Sjoerg .addImm(LoOperand.getImm());
7137330f729Sjoerg return;
7147330f729Sjoerg }
7157330f729Sjoerg if (LoOperand.isJTI()) {
7167330f729Sjoerg BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineii), DoubleDestReg)
7177330f729Sjoerg .addImm(HiOperand.getImm())
7187330f729Sjoerg .addJumpTableIndex(LoOperand.getIndex(), LoOperand.getTargetFlags());
7197330f729Sjoerg return;
7207330f729Sjoerg }
7217330f729Sjoerg
7227330f729Sjoerg // Handle constant pools.
7237330f729Sjoerg if (HiOperand.isCPI()) {
7247330f729Sjoerg BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A2_combineii), DoubleDestReg)
7257330f729Sjoerg .addConstantPoolIndex(HiOperand.getIndex(), HiOperand.getOffset(),
7267330f729Sjoerg HiOperand.getTargetFlags())
7277330f729Sjoerg .addImm(LoOperand.getImm());
7287330f729Sjoerg return;
7297330f729Sjoerg }
7307330f729Sjoerg if (LoOperand.isCPI()) {
7317330f729Sjoerg BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineii), DoubleDestReg)
7327330f729Sjoerg .addImm(HiOperand.getImm())
7337330f729Sjoerg .addConstantPoolIndex(LoOperand.getIndex(), LoOperand.getOffset(),
7347330f729Sjoerg LoOperand.getTargetFlags());
7357330f729Sjoerg return;
7367330f729Sjoerg }
7377330f729Sjoerg
7387330f729Sjoerg // First preference should be given to Hexagon::A2_combineii instruction
7397330f729Sjoerg // as it can include U6 (in Hexagon::A4_combineii) as well.
7407330f729Sjoerg // In this instruction, HiOperand is const extended, if required.
7417330f729Sjoerg if (isInt<8>(LoOperand.getImm())) {
7427330f729Sjoerg BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A2_combineii), DoubleDestReg)
7437330f729Sjoerg .addImm(HiOperand.getImm())
7447330f729Sjoerg .addImm(LoOperand.getImm());
7457330f729Sjoerg return;
7467330f729Sjoerg }
7477330f729Sjoerg
7487330f729Sjoerg // In this instruction, LoOperand is const extended, if required.
7497330f729Sjoerg if (isInt<8>(HiOperand.getImm())) {
7507330f729Sjoerg BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineii), DoubleDestReg)
7517330f729Sjoerg .addImm(HiOperand.getImm())
7527330f729Sjoerg .addImm(LoOperand.getImm());
7537330f729Sjoerg return;
7547330f729Sjoerg }
7557330f729Sjoerg
7567330f729Sjoerg // Insert new combine instruction.
7577330f729Sjoerg // DoubleRegDest = combine #HiImm, #LoImm
7587330f729Sjoerg BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A2_combineii), DoubleDestReg)
7597330f729Sjoerg .addImm(HiOperand.getImm())
7607330f729Sjoerg .addImm(LoOperand.getImm());
7617330f729Sjoerg }
7627330f729Sjoerg
emitCombineIR(MachineBasicBlock::iterator & InsertPt,unsigned DoubleDestReg,MachineOperand & HiOperand,MachineOperand & LoOperand)7637330f729Sjoerg void HexagonCopyToCombine::emitCombineIR(MachineBasicBlock::iterator &InsertPt,
7647330f729Sjoerg unsigned DoubleDestReg,
7657330f729Sjoerg MachineOperand &HiOperand,
7667330f729Sjoerg MachineOperand &LoOperand) {
7677330f729Sjoerg Register LoReg = LoOperand.getReg();
7687330f729Sjoerg unsigned LoRegKillFlag = getKillRegState(LoOperand.isKill());
7697330f729Sjoerg
7707330f729Sjoerg DebugLoc DL = InsertPt->getDebugLoc();
7717330f729Sjoerg MachineBasicBlock *BB = InsertPt->getParent();
7727330f729Sjoerg
7737330f729Sjoerg // Handle globals.
7747330f729Sjoerg if (HiOperand.isGlobal()) {
7757330f729Sjoerg BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineir), DoubleDestReg)
7767330f729Sjoerg .addGlobalAddress(HiOperand.getGlobal(), HiOperand.getOffset(),
7777330f729Sjoerg HiOperand.getTargetFlags())
7787330f729Sjoerg .addReg(LoReg, LoRegKillFlag);
7797330f729Sjoerg return;
7807330f729Sjoerg }
7817330f729Sjoerg // Handle block addresses.
7827330f729Sjoerg if (HiOperand.isBlockAddress()) {
7837330f729Sjoerg BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineir), DoubleDestReg)
7847330f729Sjoerg .addBlockAddress(HiOperand.getBlockAddress(), HiOperand.getOffset(),
7857330f729Sjoerg HiOperand.getTargetFlags())
7867330f729Sjoerg .addReg(LoReg, LoRegKillFlag);
7877330f729Sjoerg return;
7887330f729Sjoerg }
7897330f729Sjoerg // Handle jump tables.
7907330f729Sjoerg if (HiOperand.isJTI()) {
7917330f729Sjoerg BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineir), DoubleDestReg)
7927330f729Sjoerg .addJumpTableIndex(HiOperand.getIndex(), HiOperand.getTargetFlags())
7937330f729Sjoerg .addReg(LoReg, LoRegKillFlag);
7947330f729Sjoerg return;
7957330f729Sjoerg }
7967330f729Sjoerg // Handle constant pools.
7977330f729Sjoerg if (HiOperand.isCPI()) {
7987330f729Sjoerg BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineir), DoubleDestReg)
7997330f729Sjoerg .addConstantPoolIndex(HiOperand.getIndex(), HiOperand.getOffset(),
8007330f729Sjoerg HiOperand.getTargetFlags())
8017330f729Sjoerg .addReg(LoReg, LoRegKillFlag);
8027330f729Sjoerg return;
8037330f729Sjoerg }
8047330f729Sjoerg // Insert new combine instruction.
8057330f729Sjoerg // DoubleRegDest = combine #HiImm, LoReg
8067330f729Sjoerg BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineir), DoubleDestReg)
8077330f729Sjoerg .addImm(HiOperand.getImm())
8087330f729Sjoerg .addReg(LoReg, LoRegKillFlag);
8097330f729Sjoerg }
8107330f729Sjoerg
emitCombineRI(MachineBasicBlock::iterator & InsertPt,unsigned DoubleDestReg,MachineOperand & HiOperand,MachineOperand & LoOperand)8117330f729Sjoerg void HexagonCopyToCombine::emitCombineRI(MachineBasicBlock::iterator &InsertPt,
8127330f729Sjoerg unsigned DoubleDestReg,
8137330f729Sjoerg MachineOperand &HiOperand,
8147330f729Sjoerg MachineOperand &LoOperand) {
8157330f729Sjoerg unsigned HiRegKillFlag = getKillRegState(HiOperand.isKill());
8167330f729Sjoerg Register HiReg = HiOperand.getReg();
8177330f729Sjoerg
8187330f729Sjoerg DebugLoc DL = InsertPt->getDebugLoc();
8197330f729Sjoerg MachineBasicBlock *BB = InsertPt->getParent();
8207330f729Sjoerg
8217330f729Sjoerg // Handle global.
8227330f729Sjoerg if (LoOperand.isGlobal()) {
8237330f729Sjoerg BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineri), DoubleDestReg)
8247330f729Sjoerg .addReg(HiReg, HiRegKillFlag)
8257330f729Sjoerg .addGlobalAddress(LoOperand.getGlobal(), LoOperand.getOffset(),
8267330f729Sjoerg LoOperand.getTargetFlags());
8277330f729Sjoerg return;
8287330f729Sjoerg }
8297330f729Sjoerg // Handle block addresses.
8307330f729Sjoerg if (LoOperand.isBlockAddress()) {
8317330f729Sjoerg BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineri), DoubleDestReg)
8327330f729Sjoerg .addReg(HiReg, HiRegKillFlag)
8337330f729Sjoerg .addBlockAddress(LoOperand.getBlockAddress(), LoOperand.getOffset(),
8347330f729Sjoerg LoOperand.getTargetFlags());
8357330f729Sjoerg return;
8367330f729Sjoerg }
8377330f729Sjoerg // Handle jump tables.
8387330f729Sjoerg if (LoOperand.isJTI()) {
8397330f729Sjoerg BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineri), DoubleDestReg)
8407330f729Sjoerg .addReg(HiOperand.getReg(), HiRegKillFlag)
8417330f729Sjoerg .addJumpTableIndex(LoOperand.getIndex(), LoOperand.getTargetFlags());
8427330f729Sjoerg return;
8437330f729Sjoerg }
8447330f729Sjoerg // Handle constant pools.
8457330f729Sjoerg if (LoOperand.isCPI()) {
8467330f729Sjoerg BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineri), DoubleDestReg)
8477330f729Sjoerg .addReg(HiOperand.getReg(), HiRegKillFlag)
8487330f729Sjoerg .addConstantPoolIndex(LoOperand.getIndex(), LoOperand.getOffset(),
8497330f729Sjoerg LoOperand.getTargetFlags());
8507330f729Sjoerg return;
8517330f729Sjoerg }
8527330f729Sjoerg
8537330f729Sjoerg // Insert new combine instruction.
8547330f729Sjoerg // DoubleRegDest = combine HiReg, #LoImm
8557330f729Sjoerg BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineri), DoubleDestReg)
8567330f729Sjoerg .addReg(HiReg, HiRegKillFlag)
8577330f729Sjoerg .addImm(LoOperand.getImm());
8587330f729Sjoerg }
8597330f729Sjoerg
emitCombineRR(MachineBasicBlock::iterator & InsertPt,unsigned DoubleDestReg,MachineOperand & HiOperand,MachineOperand & LoOperand)8607330f729Sjoerg void HexagonCopyToCombine::emitCombineRR(MachineBasicBlock::iterator &InsertPt,
8617330f729Sjoerg unsigned DoubleDestReg,
8627330f729Sjoerg MachineOperand &HiOperand,
8637330f729Sjoerg MachineOperand &LoOperand) {
8647330f729Sjoerg unsigned LoRegKillFlag = getKillRegState(LoOperand.isKill());
8657330f729Sjoerg unsigned HiRegKillFlag = getKillRegState(HiOperand.isKill());
8667330f729Sjoerg Register LoReg = LoOperand.getReg();
8677330f729Sjoerg Register HiReg = HiOperand.getReg();
8687330f729Sjoerg
8697330f729Sjoerg DebugLoc DL = InsertPt->getDebugLoc();
8707330f729Sjoerg MachineBasicBlock *BB = InsertPt->getParent();
8717330f729Sjoerg
8727330f729Sjoerg // Insert new combine instruction.
8737330f729Sjoerg // DoubleRegDest = combine HiReg, LoReg
8747330f729Sjoerg unsigned NewOpc;
8757330f729Sjoerg if (Hexagon::DoubleRegsRegClass.contains(DoubleDestReg)) {
8767330f729Sjoerg NewOpc = Hexagon::A2_combinew;
8777330f729Sjoerg } else if (Hexagon::HvxWRRegClass.contains(DoubleDestReg)) {
8787330f729Sjoerg assert(ST->useHVXOps());
8797330f729Sjoerg NewOpc = Hexagon::V6_vcombine;
8807330f729Sjoerg } else
8817330f729Sjoerg llvm_unreachable("Unexpected register");
8827330f729Sjoerg
8837330f729Sjoerg BuildMI(*BB, InsertPt, DL, TII->get(NewOpc), DoubleDestReg)
8847330f729Sjoerg .addReg(HiReg, HiRegKillFlag)
8857330f729Sjoerg .addReg(LoReg, LoRegKillFlag);
8867330f729Sjoerg }
8877330f729Sjoerg
createHexagonCopyToCombine()8887330f729Sjoerg FunctionPass *llvm::createHexagonCopyToCombine() {
8897330f729Sjoerg return new HexagonCopyToCombine();
8907330f729Sjoerg }
891