123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216 |
- //===-- RegUsageInfoCollector.cpp - Register Usage Information Collector --===//
- //
- // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
- // See https://llvm.org/LICENSE.txt for license information.
- // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
- //
- //===----------------------------------------------------------------------===//
- ///
- /// This pass is required to take advantage of the interprocedural register
- /// allocation infrastructure.
- ///
- /// This pass is a simple MachineFunction pass which collects register usage
- /// details by iterating through each physical register and checking
- /// MRI::isPhysRegUsed(), then creates a RegMask based on these details.
- /// The pass then stores this RegMask in PhysicalRegisterUsageInfo.
- ///
- //===----------------------------------------------------------------------===//
- #include "llvm/ADT/Statistic.h"
- #include "llvm/CodeGen/MachineBasicBlock.h"
- #include "llvm/CodeGen/MachineFunctionPass.h"
- #include "llvm/CodeGen/MachineInstr.h"
- #include "llvm/CodeGen/MachineOperand.h"
- #include "llvm/CodeGen/MachineRegisterInfo.h"
- #include "llvm/CodeGen/Passes.h"
- #include "llvm/CodeGen/RegisterUsageInfo.h"
- #include "llvm/Support/Debug.h"
- #include "llvm/Support/raw_ostream.h"
- #include "llvm/CodeGen/TargetFrameLowering.h"
- using namespace llvm;
- #define DEBUG_TYPE "ip-regalloc"
- STATISTIC(NumCSROpt,
- "Number of functions optimized for callee saved registers");
- namespace {
- class RegUsageInfoCollector : public MachineFunctionPass {
- public:
- RegUsageInfoCollector() : MachineFunctionPass(ID) {
- PassRegistry &Registry = *PassRegistry::getPassRegistry();
- initializeRegUsageInfoCollectorPass(Registry);
- }
- StringRef getPassName() const override {
- return "Register Usage Information Collector Pass";
- }
- void getAnalysisUsage(AnalysisUsage &AU) const override {
- AU.addRequired<PhysicalRegisterUsageInfo>();
- AU.setPreservesAll();
- MachineFunctionPass::getAnalysisUsage(AU);
- }
- bool runOnMachineFunction(MachineFunction &MF) override;
- // Call getCalleeSaves and then also set the bits for subregs and
- // fully saved superregs.
- static void computeCalleeSavedRegs(BitVector &SavedRegs, MachineFunction &MF);
- static char ID;
- };
- } // end of anonymous namespace
- char RegUsageInfoCollector::ID = 0;
- INITIALIZE_PASS_BEGIN(RegUsageInfoCollector, "RegUsageInfoCollector",
- "Register Usage Information Collector", false, false)
- INITIALIZE_PASS_DEPENDENCY(PhysicalRegisterUsageInfo)
- INITIALIZE_PASS_END(RegUsageInfoCollector, "RegUsageInfoCollector",
- "Register Usage Information Collector", false, false)
- FunctionPass *llvm::createRegUsageInfoCollector() {
- return new RegUsageInfoCollector();
- }
- // TODO: Move to hook somwehere?
- // Return true if it is useful to track the used registers for IPRA / no CSR
- // optimizations. This is not useful for entry points, and computing the
- // register usage information is expensive.
- static bool isCallableFunction(const MachineFunction &MF) {
- switch (MF.getFunction().getCallingConv()) {
- case CallingConv::AMDGPU_VS:
- case CallingConv::AMDGPU_GS:
- case CallingConv::AMDGPU_PS:
- case CallingConv::AMDGPU_CS:
- case CallingConv::AMDGPU_HS:
- case CallingConv::AMDGPU_ES:
- case CallingConv::AMDGPU_LS:
- case CallingConv::AMDGPU_KERNEL:
- return false;
- default:
- return true;
- }
- }
- bool RegUsageInfoCollector::runOnMachineFunction(MachineFunction &MF) {
- MachineRegisterInfo *MRI = &MF.getRegInfo();
- const TargetRegisterInfo *TRI = MF.getSubtarget().getRegisterInfo();
- const LLVMTargetMachine &TM = MF.getTarget();
- LLVM_DEBUG(dbgs() << " -------------------- " << getPassName()
- << " -------------------- \nFunction Name : "
- << MF.getName() << '\n');
- // Analyzing the register usage may be expensive on some targets.
- if (!isCallableFunction(MF)) {
- LLVM_DEBUG(dbgs() << "Not analyzing non-callable function\n");
- return false;
- }
- // If there are no callers, there's no point in computing more precise
- // register usage here.
- if (MF.getFunction().use_empty()) {
- LLVM_DEBUG(dbgs() << "Not analyzing function with no callers\n");
- return false;
- }
- std::vector<uint32_t> RegMask;
- // Compute the size of the bit vector to represent all the registers.
- // The bit vector is broken into 32-bit chunks, thus takes the ceil of
- // the number of registers divided by 32 for the size.
- unsigned RegMaskSize = MachineOperand::getRegMaskSize(TRI->getNumRegs());
- RegMask.resize(RegMaskSize, ~((uint32_t)0));
- const Function &F = MF.getFunction();
- PhysicalRegisterUsageInfo &PRUI = getAnalysis<PhysicalRegisterUsageInfo>();
- PRUI.setTargetMachine(TM);
- LLVM_DEBUG(dbgs() << "Clobbered Registers: ");
- BitVector SavedRegs;
- computeCalleeSavedRegs(SavedRegs, MF);
- const BitVector &UsedPhysRegsMask = MRI->getUsedPhysRegsMask();
- auto SetRegAsDefined = [&RegMask] (unsigned Reg) {
- RegMask[Reg / 32] &= ~(1u << Reg % 32);
- };
- // Some targets can clobber registers "inside" a call, typically in
- // linker-generated code.
- for (const MCPhysReg Reg : TRI->getIntraCallClobberedRegs(&MF))
- for (MCRegAliasIterator AI(Reg, TRI, true); AI.isValid(); ++AI)
- SetRegAsDefined(*AI);
- // Scan all the physical registers. When a register is defined in the current
- // function set it and all the aliasing registers as defined in the regmask.
- // FIXME: Rewrite to use regunits.
- for (unsigned PReg = 1, PRegE = TRI->getNumRegs(); PReg < PRegE; ++PReg) {
- // Don't count registers that are saved and restored.
- if (SavedRegs.test(PReg))
- continue;
- // If a register is defined by an instruction mark it as defined together
- // with all it's unsaved aliases.
- if (!MRI->def_empty(PReg)) {
- for (MCRegAliasIterator AI(PReg, TRI, true); AI.isValid(); ++AI)
- if (!SavedRegs.test(*AI))
- SetRegAsDefined(*AI);
- continue;
- }
- // If a register is in the UsedPhysRegsMask set then mark it as defined.
- // All clobbered aliases will also be in the set, so we can skip setting
- // as defined all the aliases here.
- if (UsedPhysRegsMask.test(PReg))
- SetRegAsDefined(PReg);
- }
- if (TargetFrameLowering::isSafeForNoCSROpt(F) &&
- MF.getSubtarget().getFrameLowering()->isProfitableForNoCSROpt(F)) {
- ++NumCSROpt;
- LLVM_DEBUG(dbgs() << MF.getName()
- << " function optimized for not having CSR.\n");
- }
- LLVM_DEBUG(
- for (unsigned PReg = 1, PRegE = TRI->getNumRegs(); PReg < PRegE; ++PReg) {
- if (MachineOperand::clobbersPhysReg(&(RegMask[0]), PReg))
- dbgs() << printReg(PReg, TRI) << " ";
- }
- dbgs() << " \n----------------------------------------\n";
- );
- PRUI.storeUpdateRegUsageInfo(F, RegMask);
- return false;
- }
- void RegUsageInfoCollector::
- computeCalleeSavedRegs(BitVector &SavedRegs, MachineFunction &MF) {
- const TargetFrameLowering &TFI = *MF.getSubtarget().getFrameLowering();
- const TargetRegisterInfo &TRI = *MF.getSubtarget().getRegisterInfo();
- // Target will return the set of registers that it saves/restores as needed.
- SavedRegs.clear();
- TFI.getCalleeSaves(MF, SavedRegs);
- if (SavedRegs.none())
- return;
- // Insert subregs.
- const MCPhysReg *CSRegs = TRI.getCalleeSavedRegs(&MF);
- for (unsigned i = 0; CSRegs[i]; ++i) {
- MCPhysReg Reg = CSRegs[i];
- if (SavedRegs.test(Reg)) {
- // Save subregisters
- for (MCSubRegIterator SR(Reg, &TRI); SR.isValid(); ++SR)
- SavedRegs.set(*SR);
- }
- }
- }
|