123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208 |
- //===- Localizer.cpp ---------------------- Localize some instrs -*- C++ -*-==//
- //
- // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
- // See https://llvm.org/LICENSE.txt for license information.
- // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
- //
- //===----------------------------------------------------------------------===//
- /// \file
- /// This file implements the Localizer class.
- //===----------------------------------------------------------------------===//
- #include "llvm/CodeGen/GlobalISel/Localizer.h"
- #include "llvm/ADT/DenseMap.h"
- #include "llvm/ADT/STLExtras.h"
- #include "llvm/Analysis/TargetTransformInfo.h"
- #include "llvm/CodeGen/MachineRegisterInfo.h"
- #include "llvm/CodeGen/TargetLowering.h"
- #include "llvm/InitializePasses.h"
- #include "llvm/Support/Debug.h"
- #define DEBUG_TYPE "localizer" // Also the second argument of the INITIALIZE_PASS_* macros below.
- using namespace llvm;
- char Localizer::ID = 0; // Pass identifier; the constructor forwards it to MachineFunctionPass(ID).
- INITIALIZE_PASS_BEGIN(Localizer, DEBUG_TYPE, // Opens the registration block for the Localizer pass.
- "Move/duplicate certain instructions close to their use",
- false, false)
- INITIALIZE_PASS_DEPENDENCY(TargetTransformInfoWrapperPass) // Same analysis that getAnalysisUsage() marks as required.
- INITIALIZE_PASS_END(Localizer, DEBUG_TYPE, // Closes the registration block; arguments repeat the BEGIN line.
- "Move/duplicate certain instructions close to their use",
- false, false)
- /// Build the pass with a per-function opt-out predicate.
- ///
- /// \param F Callback stored in DoNotRunPass. runOnMachineFunction() returns
- ///          false without touching the function whenever it yields true.
- ///
- /// F is received by value, so it is moved into the member instead of being
- /// copied a second time (a std::function copy duplicates its captured state).
- Localizer::Localizer(std::function<bool(const MachineFunction &)> F)
-     : MachineFunctionPass(ID), DoNotRunPass(std::move(F)) {}
- /// Default construction: delegate to the predicate-taking constructor with a
- /// callback that always answers false, i.e. never asks for the pass to be
- /// skipped.
- Localizer::Localizer()
-     : Localizer([](const MachineFunction &) -> bool { return false; }) {}
- /// Cache the per-function state used by the rest of the pass: the target
- /// transform info for MF's IR function and MF's register info.
- void Localizer::init(MachineFunction &MF) {
-   auto &TTIWrapper = getAnalysis<TargetTransformInfoWrapperPass>();
-   TTI = &TTIWrapper.getTTI(MF.getFunction());
-   MRI = &MF.getRegInfo();
- }
- void Localizer::getAnalysisUsage(AnalysisUsage &AU) const { // Records this pass's analysis requirements in AU.
- AU.addRequired<TargetTransformInfoWrapperPass>(); // init() fetches this wrapper through getAnalysis<>.
- getSelectionDAGFallbackAnalysisUsage(AU); // NOTE(review): presumably adds what a SelectionDAG fallback needs -- confirm against its definition.
- MachineFunctionPass::getAnalysisUsage(AU); // Let the base class append its own entries.
- }
- /// Decide whether the use \p MOUse lives in the same block as \p Def.
- ///
- /// \param MOUse     The use operand being examined.
- /// \param Def       The defining instruction.
- /// \param InsertMBB [out] The block the use is attributed to: the block of
- ///                  the using instruction, or, for a PHI, the block named by
- ///                  the operand immediately following \p MOUse.
- /// \returns true when \p InsertMBB is the block containing \p Def.
- bool Localizer::isLocalUse(MachineOperand &MOUse, const MachineInstr &Def,
-                            MachineBasicBlock *&InsertMBB) {
-   MachineInstr *User = MOUse.getParent();
-   if (User->isPHI()) {
-     // The block operand sits right after the value operand in the PHI.
-     const unsigned BlockOpIdx = User->getOperandNo(&MOUse) + 1;
-     InsertMBB = User->getOperand(BlockOpIdx).getMBB();
-   } else {
-     InsertMBB = User->getParent();
-   }
-   return Def.getParent() == InsertMBB;
- }
- /// Report whether \p Op belongs to a PHI that reads the same register through
- /// another of its odd-indexed operands as well.
- ///
- /// \returns false if the owner of \p Op is not a PHI, or if no other
- ///          odd-indexed register operand of that PHI uses Op's register.
- bool Localizer::isNonUniquePhiValue(MachineOperand &Op) const {
-   const MachineInstr &Phi = *Op.getParent();
-   if (!Phi.isPHI())
-     return false;
-   const Register Wanted = Op.getReg();
-   // Walk operands 1, 3, 5, ... and look for a different operand that reads
-   // the same register.
-   for (unsigned I = 1, E = Phi.getNumOperands(); I < E; I += 2) {
-     const MachineOperand &Other = Phi.getOperand(I);
-     if (&Other == &Op)
-       continue;
-     if (Other.isReg() && Other.getReg() == Wanted)
-       return true;
-   }
-   return false;
- }
- /// Give every non-local user of a localizable entry-block instruction its own
- /// copy of that instruction in the user's block.
- ///
- /// \param MF              Function being processed; only its first block is
- ///                        scanned for candidates.
- /// \param LocalizedInstrs Receives each original instruction that has a use
- ///                        in its own block, and each copy created here, for
- ///                        the later intra-block step.
- /// \returns true if at least one use was redirected to a copy. Recording an
- ///          instruction whose use is already local does not count as a change.
- bool Localizer::localizeInterBlock(MachineFunction &MF,
-                                    LocalizedSetVecT &LocalizedInstrs) {
-   // (user block, original vreg) -> vreg defined by the copy already placed in
-   // that block, so each block receives at most one copy per value.
-   DenseMap<std::pair<MachineBasicBlock *, unsigned>, unsigned> MBBWithLocalDef;
-   bool Changed = false;
-   // The IRTranslator only emits constants into the entry block, and the rest
-   // of the GISel pipeline generally emits constants next to their users, so
-   // only the entry block is considered here. This might change if CSE across
-   // blocks is introduced.
-   MachineBasicBlock &EntryMBB = MF.front();
-   const auto &TLI = *MF.getSubtarget().getTargetLowering();
-   for (MachineInstr &MI : llvm::reverse(EntryMBB)) {
-     if (!TLI.shouldLocalize(MI, TTI))
-       continue;
-     LLVM_DEBUG(dbgs() << "Should localize: " << MI);
-     assert(MI.getDesc().getNumDefs() == 1 &&
-            "More than one definition not supported yet");
-     const Register OrigReg = MI.getOperand(0).getReg();
-     // Rewriting a use below invalidates the list of use operands, so an
-     // early-increment range is needed instead of a plain range iterator.
-     for (MachineOperand &Use :
-          llvm::make_early_inc_range(MRI->use_operands(OrigReg))) {
-       MachineBasicBlock *UseMBB;
-       LLVM_DEBUG(MachineInstr &MIUse = *Use.getParent();
-                  dbgs() << "Checking use: " << MIUse
-                         << " #Opd: " << MIUse.getOperandNo(&Use) << '\n');
-       if (isLocalUse(Use, MI, UseMBB)) {
-         // A same-block use can still mean a long live range when the block is
-         // very large; remember MI so intra-block localization can handle it.
-         LocalizedInstrs.insert(&MI);
-         continue;
-       }
-       // A PHI that takes this value from several predecessors is left alone:
-       // duplicating into each predecessor would only bloat the code when the
-       // existing definition suffices and is easier to optimize later.
-       if (isNonUniquePhiValue(Use))
-         continue;
-       LLVM_DEBUG(dbgs() << "Fixing non-local use\n");
-       Changed = true;
-       auto Key = std::make_pair(UseMBB, OrigReg);
-       auto LocalDefIt = MBBWithLocalDef.find(Key);
-       if (LocalDefIt == MBBWithLocalDef.end()) {
-         // First non-local use seen in this block: materialize a copy.
-         MachineInstr *Copy = MF.CloneMachineInstr(&MI);
-         LocalizedInstrs.insert(Copy);
-         MachineInstr &User = *Use.getParent();
-         // With a single non-PHI use the copy goes right before that user;
-         // otherwise it goes after the block's PHIs and labels.
-         const bool PlaceBeforeUser = MRI->hasOneUse(OrigReg) && !User.isPHI();
-         MachineBasicBlock::iterator InsertPt =
-             PlaceBeforeUser ? MachineBasicBlock::iterator(User)
-                             : UseMBB->SkipPHIsAndLabels(UseMBB->begin());
-         UseMBB->insert(InsertPt, Copy);
-         // The copy must define a fresh register.
-         const Register CopyReg = MRI->cloneVirtualRegister(OrigReg);
-         Copy->getOperand(0).setReg(CopyReg);
-         LocalDefIt =
-             MBBWithLocalDef.insert(std::make_pair(Key, CopyReg)).first;
-         LLVM_DEBUG(dbgs() << "Inserted: " << *Copy);
-       }
-       LLVM_DEBUG(dbgs() << "Update use with: " << printReg(LocalDefIt->second)
-                         << '\n');
-       // Point the user at the block-local definition.
-       Use.setReg(LocalDefIt->second);
-     }
-   }
-   return Changed;
- }
- /// Sink each instruction in \p LocalizedInstrs to just before the first
- /// non-PHI, non-debug user that follows it in its own block.
- ///
- /// \param LocalizedInstrs Instructions collected by localizeInterBlock().
- /// \returns true if any instruction was re-inserted (this is reported even
- ///          when the first user already directly followed the instruction).
- ///
- /// FIXME: Consider doing inst duplication if live ranges are very long due to
- /// many users, but this case may be better served by regalloc improvements.
- bool Localizer::localizeIntraBlock(LocalizedSetVecT &LocalizedInstrs) {
-   bool Changed = false;
-   for (MachineInstr *Inst : LocalizedInstrs) {
-     MachineBasicBlock &Block = *Inst->getParent();
-     const Register DefReg = Inst->getOperand(0).getReg();
-     // Gather every non-PHI instruction that reads the defined register.
-     SmallPtrSet<MachineInstr *, 32> NonPhiUsers;
-     for (MachineInstr &User : MRI->use_nodbg_instructions(DefReg))
-       if (!User.isPHI())
-         NonPhiUsers.insert(&User);
-     // Only PHI users: they are not going to be in this block, so there is
-     // nothing to move the instruction towards.
-     if (NonPhiUsers.empty())
-       continue;
-     // Scan downwards from the instruction until the first recorded user.
-     MachineBasicBlock::iterator Pos(Inst);
-     for (++Pos; Pos != Block.end(); ++Pos)
-       if (NonPhiUsers.count(&*Pos))
-         break;
-     assert(Pos != Block.end() && "Didn't find the user in the MBB");
-     LLVM_DEBUG(dbgs() << "Intra-block: moving " << *Inst << " before " << *Pos
-                       << '\n');
-     Inst->removeFromParent();
-     Block.insert(Pos, Inst);
-     Changed = true;
-   }
-   return Changed;
- }
- /// Pass entry point: run inter-block localization, then intra-block
- /// localization on the instructions the first step collected.
- ///
- /// \returns false without doing anything when \p MF carries the FailedISel
- ///          property or when DoNotRunPass(MF) is true; otherwise true if
- ///          either localization step reported a change.
- bool Localizer::runOnMachineFunction(MachineFunction &MF) {
-   // Nothing to do if instruction selection already failed, or if the target
-   // asked for the pass to be skipped on this function.
-   const bool ISelFailed = MF.getProperties().hasProperty(
-       MachineFunctionProperties::Property::FailedISel);
-   if (ISelFailed || DoNotRunPass(MF))
-     return false;
-   LLVM_DEBUG(dbgs() << "Localize instructions for: " << MF.getName() << '\n');
-   init(MF);
-   // Instructions touched by the inter-block step are remembered so that the
-   // intra-block step can shorten their live ranges further.
-   LocalizedSetVecT LocalizedInstrs;
-   const bool InterChanged = localizeInterBlock(MF, LocalizedInstrs);
-   const bool IntraChanged = localizeIntraBlock(LocalizedInstrs);
-   return InterChanged || IntraChanged;
- }
|