109467b48Spatrick //===- NVPTXRegisterInfo.cpp - NVPTX Register Information -----------------===//
209467b48Spatrick //
309467b48Spatrick // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
409467b48Spatrick // See https://llvm.org/LICENSE.txt for license information.
509467b48Spatrick // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
609467b48Spatrick //
709467b48Spatrick //===----------------------------------------------------------------------===//
809467b48Spatrick //
909467b48Spatrick // This file contains the NVPTX implementation of the TargetRegisterInfo class.
1009467b48Spatrick //
1109467b48Spatrick //===----------------------------------------------------------------------===//
1209467b48Spatrick
1309467b48Spatrick #include "NVPTXRegisterInfo.h"
1409467b48Spatrick #include "NVPTX.h"
1509467b48Spatrick #include "NVPTXSubtarget.h"
16*d415bd75Srobert #include "NVPTXTargetMachine.h"
1709467b48Spatrick #include "llvm/ADT/BitVector.h"
1809467b48Spatrick #include "llvm/CodeGen/MachineFrameInfo.h"
1909467b48Spatrick #include "llvm/CodeGen/MachineFunction.h"
2009467b48Spatrick #include "llvm/CodeGen/MachineInstrBuilder.h"
2109467b48Spatrick #include "llvm/CodeGen/TargetInstrInfo.h"
2209467b48Spatrick #include "llvm/MC/MachineLocation.h"
2309467b48Spatrick
2409467b48Spatrick using namespace llvm;
2509467b48Spatrick
2609467b48Spatrick #define DEBUG_TYPE "nvptx-reg-info"
2709467b48Spatrick
2809467b48Spatrick namespace llvm {
getNVPTXRegClassName(TargetRegisterClass const * RC)2909467b48Spatrick std::string getNVPTXRegClassName(TargetRegisterClass const *RC) {
3009467b48Spatrick if (RC == &NVPTX::Float32RegsRegClass)
3109467b48Spatrick return ".f32";
3209467b48Spatrick if (RC == &NVPTX::Float16RegsRegClass)
3309467b48Spatrick // Ideally fp16 registers should be .f16, but this syntax is only
3409467b48Spatrick // supported on sm_53+. On the other hand, .b16 registers are
3509467b48Spatrick // accepted for all supported fp16 instructions on all GPU
3609467b48Spatrick // variants, so we can use them instead.
3709467b48Spatrick return ".b16";
3809467b48Spatrick if (RC == &NVPTX::Float16x2RegsRegClass)
3909467b48Spatrick return ".b32";
4009467b48Spatrick if (RC == &NVPTX::Float64RegsRegClass)
4109467b48Spatrick return ".f64";
4209467b48Spatrick if (RC == &NVPTX::Int64RegsRegClass)
4309467b48Spatrick // We use untyped (.b) integer registers here as NVCC does.
4409467b48Spatrick // Correctness of generated code does not depend on register type,
4509467b48Spatrick // but using .s/.u registers runs into ptxas bug that prevents
4609467b48Spatrick // assembly of otherwise valid PTX into SASS. Despite PTX ISA
4709467b48Spatrick // specifying only argument size for fp16 instructions, ptxas does
4809467b48Spatrick // not allow using .s16 or .u16 arguments for .fp16
4909467b48Spatrick // instructions. At the same time it allows using .s32/.u32
5009467b48Spatrick // arguments for .fp16v2 instructions:
5109467b48Spatrick //
5209467b48Spatrick // .reg .b16 rb16
5309467b48Spatrick // .reg .s16 rs16
5409467b48Spatrick // add.f16 rb16,rb16,rb16; // OK
5509467b48Spatrick // add.f16 rs16,rs16,rs16; // Arguments mismatch for instruction 'add'
5609467b48Spatrick // but:
5709467b48Spatrick // .reg .b32 rb32
5809467b48Spatrick // .reg .s32 rs32
5909467b48Spatrick // add.f16v2 rb32,rb32,rb32; // OK
6009467b48Spatrick // add.f16v2 rs32,rs32,rs32; // OK
6109467b48Spatrick return ".b64";
6209467b48Spatrick if (RC == &NVPTX::Int32RegsRegClass)
6309467b48Spatrick return ".b32";
6409467b48Spatrick if (RC == &NVPTX::Int16RegsRegClass)
6509467b48Spatrick return ".b16";
6609467b48Spatrick if (RC == &NVPTX::Int1RegsRegClass)
6709467b48Spatrick return ".pred";
6809467b48Spatrick if (RC == &NVPTX::SpecialRegsRegClass)
6909467b48Spatrick return "!Special!";
7009467b48Spatrick return "INTERNAL";
7109467b48Spatrick }
7209467b48Spatrick
getNVPTXRegClassStr(TargetRegisterClass const * RC)7309467b48Spatrick std::string getNVPTXRegClassStr(TargetRegisterClass const *RC) {
7409467b48Spatrick if (RC == &NVPTX::Float32RegsRegClass)
7509467b48Spatrick return "%f";
7609467b48Spatrick if (RC == &NVPTX::Float16RegsRegClass)
7709467b48Spatrick return "%h";
7809467b48Spatrick if (RC == &NVPTX::Float16x2RegsRegClass)
7909467b48Spatrick return "%hh";
8009467b48Spatrick if (RC == &NVPTX::Float64RegsRegClass)
8109467b48Spatrick return "%fd";
8209467b48Spatrick if (RC == &NVPTX::Int64RegsRegClass)
8309467b48Spatrick return "%rd";
8409467b48Spatrick if (RC == &NVPTX::Int32RegsRegClass)
8509467b48Spatrick return "%r";
8609467b48Spatrick if (RC == &NVPTX::Int16RegsRegClass)
8709467b48Spatrick return "%rs";
8809467b48Spatrick if (RC == &NVPTX::Int1RegsRegClass)
8909467b48Spatrick return "%p";
9009467b48Spatrick if (RC == &NVPTX::SpecialRegsRegClass)
9109467b48Spatrick return "!Special!";
9209467b48Spatrick return "INTERNAL";
9309467b48Spatrick }
9409467b48Spatrick }
9509467b48Spatrick
NVPTXRegisterInfo()96*d415bd75Srobert NVPTXRegisterInfo::NVPTXRegisterInfo()
97*d415bd75Srobert : NVPTXGenRegisterInfo(0), StrPool(StrAlloc) {}
9809467b48Spatrick
9909467b48Spatrick #define GET_REGINFO_TARGET_DESC
10009467b48Spatrick #include "NVPTXGenRegisterInfo.inc"
10109467b48Spatrick
10209467b48Spatrick /// NVPTX Callee Saved Registers
10309467b48Spatrick const MCPhysReg *
getCalleeSavedRegs(const MachineFunction *) const10409467b48Spatrick NVPTXRegisterInfo::getCalleeSavedRegs(const MachineFunction *) const {
10509467b48Spatrick static const MCPhysReg CalleeSavedRegs[] = { 0 };
10609467b48Spatrick return CalleeSavedRegs;
10709467b48Spatrick }
10809467b48Spatrick
getReservedRegs(const MachineFunction & MF) const10909467b48Spatrick BitVector NVPTXRegisterInfo::getReservedRegs(const MachineFunction &MF) const {
11009467b48Spatrick BitVector Reserved(getNumRegs());
111*d415bd75Srobert for (unsigned Reg = NVPTX::ENVREG0; Reg <= NVPTX::ENVREG31; ++Reg) {
112*d415bd75Srobert markSuperRegs(Reserved, Reg);
113*d415bd75Srobert }
114*d415bd75Srobert markSuperRegs(Reserved, NVPTX::VRFrame32);
115*d415bd75Srobert markSuperRegs(Reserved, NVPTX::VRFrameLocal32);
116*d415bd75Srobert markSuperRegs(Reserved, NVPTX::VRFrame64);
117*d415bd75Srobert markSuperRegs(Reserved, NVPTX::VRFrameLocal64);
118*d415bd75Srobert markSuperRegs(Reserved, NVPTX::VRDepot);
11909467b48Spatrick return Reserved;
12009467b48Spatrick }
12109467b48Spatrick
eliminateFrameIndex(MachineBasicBlock::iterator II,int SPAdj,unsigned FIOperandNum,RegScavenger * RS) const122*d415bd75Srobert bool NVPTXRegisterInfo::eliminateFrameIndex(MachineBasicBlock::iterator II,
12309467b48Spatrick int SPAdj, unsigned FIOperandNum,
12409467b48Spatrick RegScavenger *RS) const {
12509467b48Spatrick assert(SPAdj == 0 && "Unexpected");
12609467b48Spatrick
12709467b48Spatrick MachineInstr &MI = *II;
12809467b48Spatrick int FrameIndex = MI.getOperand(FIOperandNum).getIndex();
12909467b48Spatrick
13009467b48Spatrick MachineFunction &MF = *MI.getParent()->getParent();
13109467b48Spatrick int Offset = MF.getFrameInfo().getObjectOffset(FrameIndex) +
13209467b48Spatrick MI.getOperand(FIOperandNum + 1).getImm();
13309467b48Spatrick
13409467b48Spatrick // Using I0 as the frame pointer
135*d415bd75Srobert MI.getOperand(FIOperandNum).ChangeToRegister(getFrameRegister(MF), false);
13609467b48Spatrick MI.getOperand(FIOperandNum + 1).ChangeToImmediate(Offset);
137*d415bd75Srobert return false;
13809467b48Spatrick }
13909467b48Spatrick
getFrameRegister(const MachineFunction & MF) const14009467b48Spatrick Register NVPTXRegisterInfo::getFrameRegister(const MachineFunction &MF) const {
141*d415bd75Srobert const NVPTXTargetMachine &TM =
142*d415bd75Srobert static_cast<const NVPTXTargetMachine &>(MF.getTarget());
143*d415bd75Srobert return TM.is64Bit() ? NVPTX::VRFrame64 : NVPTX::VRFrame32;
144*d415bd75Srobert }
145*d415bd75Srobert
146*d415bd75Srobert Register
getFrameLocalRegister(const MachineFunction & MF) const147*d415bd75Srobert NVPTXRegisterInfo::getFrameLocalRegister(const MachineFunction &MF) const {
148*d415bd75Srobert const NVPTXTargetMachine &TM =
149*d415bd75Srobert static_cast<const NVPTXTargetMachine &>(MF.getTarget());
150*d415bd75Srobert return TM.is64Bit() ? NVPTX::VRFrameLocal64 : NVPTX::VRFrameLocal32;
15109467b48Spatrick }
152