//===- NVPTXRegisterInfo.cpp - NVPTX Register Information -----------------===// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception // //===----------------------------------------------------------------------===// // // This file contains the NVPTX implementation of the TargetRegisterInfo class. // //===----------------------------------------------------------------------===// #include "NVPTXRegisterInfo.h" #include "MCTargetDesc/NVPTXInstPrinter.h" #include "NVPTX.h" #include "NVPTXTargetMachine.h" #include "llvm/ADT/BitVector.h" #include "llvm/CodeGen/MachineFrameInfo.h" #include "llvm/CodeGen/MachineFunction.h" #include "llvm/CodeGen/TargetInstrInfo.h" using namespace llvm; #define DEBUG_TYPE "nvptx-reg-info" namespace llvm { StringRef getNVPTXRegClassName(TargetRegisterClass const *RC) { if (RC == &NVPTX::B128RegClass) return ".b128"; if (RC == &NVPTX::B64RegClass) // We use untyped (.b) integer registers here as NVCC does. // Correctness of generated code does not depend on register type, // but using .s/.u registers runs into ptxas bug that prevents // assembly of otherwise valid PTX into SASS. Despite PTX ISA // specifying only argument size for fp16 instructions, ptxas does // not allow using .s16 or .u16 arguments for .fp16 // instructions. At the same time it allows using .s32/.u32 // arguments for .fp16v2 instructions: // // .reg .b16 rb16 // .reg .s16 rs16 // add.f16 rb16,rb16,rb16; // OK // add.f16 rs16,rs16,rs16; // Arguments mismatch for instruction 'add' // but: // .reg .b32 rb32 // .reg .s32 rs32 // add.f16v2 rb32,rb32,rb32; // OK // add.f16v2 rs32,rs32,rs32; // OK return ".b64"; if (RC == &NVPTX::B32RegClass) return ".b32"; if (RC == &NVPTX::B16RegClass) return ".b16"; if (RC == &NVPTX::B1RegClass) return ".pred"; if (RC == &NVPTX::SpecialRegsRegClass) return "!Special!"; return "INTERNAL"; } StringRef getNVPTXRegClassStr(TargetRegisterClass const *RC) { if (RC == &NVPTX::B128RegClass) return "%rq"; if (RC == &NVPTX::B64RegClass) return "%rd"; if (RC == &NVPTX::B32RegClass) return "%r"; if (RC == &NVPTX::B16RegClass) return "%rs"; if (RC == &NVPTX::B1RegClass) return "%p"; if (RC == &NVPTX::SpecialRegsRegClass) return "!Special!"; return "INTERNAL"; } } // namespace llvm NVPTXRegisterInfo::NVPTXRegisterInfo() : NVPTXGenRegisterInfo(0), StrPool(StrAlloc) {} #define GET_REGINFO_TARGET_DESC #include "NVPTXGenRegisterInfo.inc" /// NVPTX Callee Saved Registers const MCPhysReg * NVPTXRegisterInfo::getCalleeSavedRegs(const MachineFunction *) const { static const MCPhysReg CalleeSavedRegs[] = { 0 }; return CalleeSavedRegs; } BitVector NVPTXRegisterInfo::getReservedRegs(const MachineFunction &MF) const { BitVector Reserved(getNumRegs()); for (unsigned Reg = NVPTX::ENVREG0; Reg <= NVPTX::ENVREG31; ++Reg) { markSuperRegs(Reserved, Reg); } markSuperRegs(Reserved, NVPTX::VRFrame32); markSuperRegs(Reserved, NVPTX::VRFrameLocal32); markSuperRegs(Reserved, NVPTX::VRFrame64); markSuperRegs(Reserved, NVPTX::VRFrameLocal64); markSuperRegs(Reserved, NVPTX::VRDepot); return Reserved; } bool NVPTXRegisterInfo::eliminateFrameIndex(MachineBasicBlock::iterator II, int SPAdj, unsigned FIOperandNum, RegScavenger *) const { assert(SPAdj == 0 && "Unexpected"); MachineInstr &MI = *II; if (MI.isLifetimeMarker()) { MI.eraseFromParent(); return true; } const int FrameIndex = MI.getOperand(FIOperandNum).getIndex(); const MachineFunction &MF = *MI.getParent()->getParent(); const int Offset = MF.getFrameInfo().getObjectOffset(FrameIndex) + MI.getOperand(FIOperandNum + 1).getImm(); // Using I0 as the frame pointer MI.getOperand(FIOperandNum).ChangeToRegister(getFrameRegister(MF), false); MI.getOperand(FIOperandNum + 1).ChangeToImmediate(Offset); return false; } Register NVPTXRegisterInfo::getFrameRegister(const MachineFunction &MF) const { const NVPTXTargetMachine &TM = static_cast(MF.getTarget()); return TM.is64Bit() ? NVPTX::VRFrame64 : NVPTX::VRFrame32; } Register NVPTXRegisterInfo::getFrameLocalRegister(const MachineFunction &MF) const { const NVPTXTargetMachine &TM = static_cast(MF.getTarget()); return TM.is64Bit() ? NVPTX::VRFrameLocal64 : NVPTX::VRFrameLocal32; } void NVPTXRegisterInfo::clearDebugRegisterMap() const { debugRegisterMap.clear(); } static uint64_t encodeRegisterForDwarf(StringRef RegisterName) { if (RegisterName.size() > 8) // The name is more than 8 characters long, and so won't fit into 64 bits. return 0; // Encode the name string into a DWARF register number using cuda-gdb's // encoding. See cuda_check_dwarf2_reg_ptx_virtual_register in cuda-tdep.c, // https://github.com/NVIDIA/cuda-gdb/blob/e5cf3bddae520ffb326f95b4d98ce5c7474b828b/gdb/cuda/cuda-tdep.c#L353 // IE the bytes of the string are concatenated in reverse into a single // number, which is stored in ULEB128, but in practice must be no more than 8 // bytes (excluding null terminator, which is not included). uint64_t result = 0; for (unsigned char c : RegisterName) result = (result << 8) | c; return result; } void NVPTXRegisterInfo::addToDebugRegisterMap( uint64_t preEncodedVirtualRegister, StringRef RegisterName) const { uint64_t mapped = encodeRegisterForDwarf(RegisterName); if (mapped == 0) return; debugRegisterMap.insert({preEncodedVirtualRegister, mapped}); } int64_t NVPTXRegisterInfo::getDwarfRegNum(MCRegister RegNum, bool isEH) const { StringRef Name = NVPTXInstPrinter::getRegisterName(RegNum.id()); // In NVPTXFrameLowering.cpp, we do arrange for %Depot to be accessible from // %SP. Using the %Depot register doesn't provide any debug info in // cuda-gdb, but switching it to %SP does. if (RegNum.id() == NVPTX::VRDepot) Name = "%SP"; return encodeRegisterForDwarf(Name); } int64_t NVPTXRegisterInfo::getDwarfRegNumForVirtReg(Register RegNum, bool isEH) const { assert(RegNum.isVirtual()); uint64_t lookup = debugRegisterMap.lookup(RegNum.id()); if (lookup) return lookup; return -1; }