123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310 |
- //===-- Thumb2ITBlockPass.cpp - Insert Thumb-2 IT blocks ------------------===//
- //
- // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
- // See https://llvm.org/LICENSE.txt for license information.
- // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
- //
- //===----------------------------------------------------------------------===//
- #include "ARM.h"
- #include "ARMMachineFunctionInfo.h"
- #include "ARMSubtarget.h"
- #include "MCTargetDesc/ARMBaseInfo.h"
- #include "Thumb2InstrInfo.h"
- #include "llvm/ADT/SmallSet.h"
- #include "llvm/ADT/SmallVector.h"
- #include "llvm/ADT/Statistic.h"
- #include "llvm/ADT/StringRef.h"
- #include "llvm/CodeGen/MachineBasicBlock.h"
- #include "llvm/CodeGen/MachineFunction.h"
- #include "llvm/CodeGen/MachineFunctionPass.h"
- #include "llvm/CodeGen/MachineInstr.h"
- #include "llvm/CodeGen/MachineInstrBuilder.h"
- #include "llvm/CodeGen/MachineInstrBundle.h"
- #include "llvm/CodeGen/MachineOperand.h"
- #include "llvm/IR/DebugLoc.h"
- #include "llvm/MC/MCInstrDesc.h"
- #include "llvm/MC/MCRegisterInfo.h"
- #include <cassert>
- #include <new>
- using namespace llvm;
- #define DEBUG_TYPE "thumb2-it"
- #define PASS_NAME "Thumb IT blocks insertion pass"
- STATISTIC(NumITs, "Number of IT blocks inserted");
- STATISTIC(NumMovedInsts, "Number of predicated instructions moved");
- using RegisterSet = SmallSet<unsigned, 4>;
- namespace {
- class Thumb2ITBlock : public MachineFunctionPass {
- public:
- static char ID;
- bool restrictIT;
- const Thumb2InstrInfo *TII;
- const TargetRegisterInfo *TRI;
- ARMFunctionInfo *AFI;
- Thumb2ITBlock() : MachineFunctionPass(ID) {}
- bool runOnMachineFunction(MachineFunction &Fn) override;
- MachineFunctionProperties getRequiredProperties() const override {
- return MachineFunctionProperties().set(
- MachineFunctionProperties::Property::NoVRegs);
- }
- StringRef getPassName() const override {
- return PASS_NAME;
- }
- private:
- bool MoveCopyOutOfITBlock(MachineInstr *MI,
- ARMCC::CondCodes CC, ARMCC::CondCodes OCC,
- RegisterSet &Defs, RegisterSet &Uses);
- bool InsertITInstructions(MachineBasicBlock &Block);
- };
- char Thumb2ITBlock::ID = 0;
- } // end anonymous namespace
- INITIALIZE_PASS(Thumb2ITBlock, DEBUG_TYPE, PASS_NAME, false, false)
- /// TrackDefUses - Tracking what registers are being defined and used by
- /// instructions in the IT block. This also tracks "dependencies", i.e. uses
- /// in the IT block that are defined before the IT instruction.
- static void TrackDefUses(MachineInstr *MI, RegisterSet &Defs, RegisterSet &Uses,
- const TargetRegisterInfo *TRI) {
- using RegList = SmallVector<unsigned, 4>;
- RegList LocalDefs;
- RegList LocalUses;
- for (auto &MO : MI->operands()) {
- if (!MO.isReg())
- continue;
- Register Reg = MO.getReg();
- if (!Reg || Reg == ARM::ITSTATE || Reg == ARM::SP)
- continue;
- if (MO.isUse())
- LocalUses.push_back(Reg);
- else
- LocalDefs.push_back(Reg);
- }
- auto InsertUsesDefs = [&](RegList &Regs, RegisterSet &UsesDefs) {
- for (unsigned Reg : Regs)
- for (MCSubRegIterator Subreg(Reg, TRI, /*IncludeSelf=*/true);
- Subreg.isValid(); ++Subreg)
- UsesDefs.insert(*Subreg);
- };
- InsertUsesDefs(LocalDefs, Defs);
- InsertUsesDefs(LocalUses, Uses);
- }
- /// Clear kill flags for any uses in the given set. This will likely
- /// conservatively remove more kill flags than are necessary, but removing them
- /// is safer than incorrect kill flags remaining on instructions.
- static void ClearKillFlags(MachineInstr *MI, RegisterSet &Uses) {
- for (MachineOperand &MO : MI->operands()) {
- if (!MO.isReg() || MO.isDef() || !MO.isKill())
- continue;
- if (!Uses.count(MO.getReg()))
- continue;
- MO.setIsKill(false);
- }
- }
- static bool isCopy(MachineInstr *MI) {
- switch (MI->getOpcode()) {
- default:
- return false;
- case ARM::MOVr:
- case ARM::MOVr_TC:
- case ARM::tMOVr:
- case ARM::t2MOVr:
- return true;
- }
- }
- bool
- Thumb2ITBlock::MoveCopyOutOfITBlock(MachineInstr *MI,
- ARMCC::CondCodes CC, ARMCC::CondCodes OCC,
- RegisterSet &Defs, RegisterSet &Uses) {
- if (!isCopy(MI))
- return false;
- // llvm models select's as two-address instructions. That means a copy
- // is inserted before a t2MOVccr, etc. If the copy is scheduled in
- // between selects we would end up creating multiple IT blocks.
- assert(MI->getOperand(0).getSubReg() == 0 &&
- MI->getOperand(1).getSubReg() == 0 &&
- "Sub-register indices still around?");
- Register DstReg = MI->getOperand(0).getReg();
- Register SrcReg = MI->getOperand(1).getReg();
- // First check if it's safe to move it.
- if (Uses.count(DstReg) || Defs.count(SrcReg))
- return false;
- // If the CPSR is defined by this copy, then we don't want to move it. E.g.,
- // if we have:
- //
- // movs r1, r1
- // rsb r1, 0
- // movs r2, r2
- // rsb r2, 0
- //
- // we don't want this to be converted to:
- //
- // movs r1, r1
- // movs r2, r2
- // itt mi
- // rsb r1, 0
- // rsb r2, 0
- //
- const MCInstrDesc &MCID = MI->getDesc();
- if (MI->hasOptionalDef() &&
- MI->getOperand(MCID.getNumOperands() - 1).getReg() == ARM::CPSR)
- return false;
- // Then peek at the next instruction to see if it's predicated on CC or OCC.
- // If not, then there is nothing to be gained by moving the copy.
- MachineBasicBlock::iterator I = MI;
- ++I;
- MachineBasicBlock::iterator E = MI->getParent()->end();
- while (I != E && I->isDebugInstr())
- ++I;
- if (I != E) {
- Register NPredReg;
- ARMCC::CondCodes NCC = getITInstrPredicate(*I, NPredReg);
- if (NCC == CC || NCC == OCC)
- return true;
- }
- return false;
- }
- bool Thumb2ITBlock::InsertITInstructions(MachineBasicBlock &MBB) {
- bool Modified = false;
- RegisterSet Defs, Uses;
- MachineBasicBlock::iterator MBBI = MBB.begin(), E = MBB.end();
- while (MBBI != E) {
- MachineInstr *MI = &*MBBI;
- DebugLoc dl = MI->getDebugLoc();
- Register PredReg;
- ARMCC::CondCodes CC = getITInstrPredicate(*MI, PredReg);
- if (CC == ARMCC::AL) {
- ++MBBI;
- continue;
- }
- Defs.clear();
- Uses.clear();
- TrackDefUses(MI, Defs, Uses, TRI);
- // Insert an IT instruction.
- MachineInstrBuilder MIB = BuildMI(MBB, MBBI, dl, TII->get(ARM::t2IT))
- .addImm(CC);
- // Add implicit use of ITSTATE to IT block instructions.
- MI->addOperand(MachineOperand::CreateReg(ARM::ITSTATE, false/*ifDef*/,
- true/*isImp*/, false/*isKill*/));
- MachineInstr *LastITMI = MI;
- MachineBasicBlock::iterator InsertPos = MIB.getInstr();
- ++MBBI;
- // Form IT block.
- ARMCC::CondCodes OCC = ARMCC::getOppositeCondition(CC);
- unsigned Mask = 0, Pos = 3;
- // v8 IT blocks are limited to one conditional op unless -arm-no-restrict-it
- // is set: skip the loop
- if (!restrictIT) {
- // Branches, including tricky ones like LDM_RET, need to end an IT
- // block so check the instruction we just put in the block.
- for (; MBBI != E && Pos &&
- (!MI->isBranch() && !MI->isReturn()) ; ++MBBI) {
- if (MBBI->isDebugInstr())
- continue;
- MachineInstr *NMI = &*MBBI;
- MI = NMI;
- Register NPredReg;
- ARMCC::CondCodes NCC = getITInstrPredicate(*NMI, NPredReg);
- if (NCC == CC || NCC == OCC) {
- Mask |= ((NCC ^ CC) & 1) << Pos;
- // Add implicit use of ITSTATE.
- NMI->addOperand(MachineOperand::CreateReg(ARM::ITSTATE, false/*ifDef*/,
- true/*isImp*/, false/*isKill*/));
- LastITMI = NMI;
- } else {
- if (NCC == ARMCC::AL &&
- MoveCopyOutOfITBlock(NMI, CC, OCC, Defs, Uses)) {
- --MBBI;
- MBB.remove(NMI);
- MBB.insert(InsertPos, NMI);
- ClearKillFlags(MI, Uses);
- ++NumMovedInsts;
- continue;
- }
- break;
- }
- TrackDefUses(NMI, Defs, Uses, TRI);
- --Pos;
- }
- }
- // Finalize IT mask.
- Mask |= (1 << Pos);
- MIB.addImm(Mask);
- // Last instruction in IT block kills ITSTATE.
- LastITMI->findRegisterUseOperand(ARM::ITSTATE)->setIsKill();
- // Finalize the bundle.
- finalizeBundle(MBB, InsertPos.getInstrIterator(),
- ++LastITMI->getIterator());
- Modified = true;
- ++NumITs;
- }
- return Modified;
- }
- bool Thumb2ITBlock::runOnMachineFunction(MachineFunction &Fn) {
- const ARMSubtarget &STI =
- static_cast<const ARMSubtarget &>(Fn.getSubtarget());
- if (!STI.isThumb2())
- return false;
- AFI = Fn.getInfo<ARMFunctionInfo>();
- TII = static_cast<const Thumb2InstrInfo *>(STI.getInstrInfo());
- TRI = STI.getRegisterInfo();
- restrictIT = STI.restrictIT();
- if (!AFI->isThumbFunction())
- return false;
- bool Modified = false;
- for (auto &MBB : Fn )
- Modified |= InsertITInstructions(MBB);
- if (Modified)
- AFI->setHasITBlocks(true);
- return Modified;
- }
- /// createThumb2ITBlockPass - Returns an instance of the Thumb2 IT blocks
- /// insertion pass.
- FunctionPass *llvm::createThumb2ITBlockPass() { return new Thumb2ITBlock(); }
|