123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293 |
- //===- PPCMacroFusion.cpp - PowerPC Macro Fusion --------------------------===//
- //
- // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
- // See https://llvm.org/LICENSE.txt for license information.
- // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
- //
- //===----------------------------------------------------------------------===//
- //
- /// \file This file contains the PowerPC implementation of the DAG scheduling
- /// mutation to pair instructions back to back.
- //
- //===----------------------------------------------------------------------===//
- #include "PPC.h"
- #include "PPCSubtarget.h"
- #include "llvm/ADT/DenseSet.h"
- #include "llvm/CodeGen/MacroFusion.h"
- using namespace llvm;
- namespace {
- class FusionFeature {
- public:
- typedef SmallDenseSet<unsigned> FusionOpSet;
- enum FusionKind {
- #define FUSION_KIND(KIND) FK_##KIND
- #define FUSION_FEATURE(KIND, HAS_FEATURE, DEP_OP_IDX, OPSET1, OPSET2) \
- FUSION_KIND(KIND),
- #include "PPCMacroFusion.def"
- FUSION_KIND(END)
- };
- private:
- // Each fusion feature is assigned with one fusion kind. All the
- // instructions with the same fusion kind have the same fusion characteristic.
- FusionKind Kd;
- // True if this feature is enabled.
- bool Supported;
- // li rx, si
- // load rt, ra, rx
- // The dependent operand index in the second op(load). And the negative means
- // it could be any one.
- int DepOpIdx;
- // The first fusion op set.
- FusionOpSet OpSet1;
- // The second fusion op set.
- FusionOpSet OpSet2;
- public:
- FusionFeature(FusionKind Kind, bool HasFeature, int Index,
- const FusionOpSet &First, const FusionOpSet &Second) :
- Kd(Kind), Supported(HasFeature), DepOpIdx(Index), OpSet1(First),
- OpSet2(Second) {}
- bool hasOp1(unsigned Opc) const { return OpSet1.contains(Opc); }
- bool hasOp2(unsigned Opc) const { return OpSet2.contains(Opc); }
- bool isSupported() const { return Supported; }
- Optional<unsigned> depOpIdx() const {
- if (DepOpIdx < 0)
- return None;
- return DepOpIdx;
- }
- FusionKind getKind() const { return Kd; }
- };
- static bool matchingRegOps(const MachineInstr &FirstMI,
- int FirstMIOpIndex,
- const MachineInstr &SecondMI,
- int SecondMIOpIndex) {
- const MachineOperand &Op1 = FirstMI.getOperand(FirstMIOpIndex);
- const MachineOperand &Op2 = SecondMI.getOperand(SecondMIOpIndex);
- if (!Op1.isReg() || !Op2.isReg())
- return false;
- return Op1.getReg() == Op2.getReg();
- }
- static bool matchingImmOps(const MachineInstr &MI,
- int MIOpIndex,
- int64_t Expect,
- unsigned ExtendFrom = 64) {
- const MachineOperand &Op = MI.getOperand(MIOpIndex);
- if (!Op.isImm())
- return false;
- int64_t Imm = Op.getImm();
- if (ExtendFrom < 64)
- Imm = SignExtend64(Imm, ExtendFrom);
- return Imm == Expect;
- }
- // Return true if the FirstMI meets the constraints of SecondMI according to
- // fusion specification.
- static bool checkOpConstraints(FusionFeature::FusionKind Kd,
- const MachineInstr &FirstMI,
- const MachineInstr &SecondMI) {
- switch (Kd) {
- // The hardware didn't require any specific check for the fused instructions'
- // operands. Therefore, return true to indicate that, it is fusable.
- default: return true;
- // [addi rt,ra,si - lxvd2x xt,ra,rb] etc.
- case FusionFeature::FK_AddiLoad: {
- // lxvd2x(ra) cannot be zero
- const MachineOperand &RA = SecondMI.getOperand(1);
- if (!RA.isReg())
- return true;
- return Register::isVirtualRegister(RA.getReg()) ||
- (RA.getReg() != PPC::ZERO && RA.getReg() != PPC::ZERO8);
- }
- // [addis rt,ra,si - ld rt,ds(ra)] etc.
- case FusionFeature::FK_AddisLoad: {
- const MachineOperand &RT = SecondMI.getOperand(0);
- if (!RT.isReg())
- return true;
- // Only check it for non-virtual register.
- if (!Register::isVirtualRegister(RT.getReg()))
- // addis(rt) = ld(ra) = ld(rt)
- // ld(rt) cannot be zero
- if (!matchingRegOps(SecondMI, 0, SecondMI, 2) ||
- (RT.getReg() == PPC::ZERO || RT.getReg() == PPC::ZERO8))
- return false;
- // addis(si) first 12 bits must be all 1s or all 0s
- const MachineOperand &SI = FirstMI.getOperand(2);
- if (!SI.isImm())
- return true;
- int64_t Imm = SI.getImm();
- if (((Imm & 0xFFF0) != 0) && ((Imm & 0xFFF0) != 0xFFF0))
- return false;
- // If si = 1111111111110000 and the msb of the d/ds field of the load equals
- // 1, then fusion does not occur.
- if ((Imm & 0xFFF0) == 0xFFF0) {
- const MachineOperand &D = SecondMI.getOperand(1);
- if (!D.isImm())
- return true;
- // 14 bit for DS field, while 16 bit for D field.
- int MSB = 15;
- if (SecondMI.getOpcode() == PPC::LD)
- MSB = 13;
- return (D.getImm() & (1ULL << MSB)) == 0;
- }
- return true;
- }
- case FusionFeature::FK_SldiAdd:
- return (matchingImmOps(FirstMI, 2, 3) && matchingImmOps(FirstMI, 3, 60)) ||
- (matchingImmOps(FirstMI, 2, 6) && matchingImmOps(FirstMI, 3, 57));
- // rldicl rx, ra, 1, 0 - xor
- case FusionFeature::FK_RotateLeftXor:
- return matchingImmOps(FirstMI, 2, 1) && matchingImmOps(FirstMI, 3, 0);
- // rldicr rx, ra, 1, 63 - xor
- case FusionFeature::FK_RotateRightXor:
- return matchingImmOps(FirstMI, 2, 1) && matchingImmOps(FirstMI, 3, 63);
- // We actually use CMPW* and CMPD*, 'l' doesn't exist as an operand in instr.
- // { lbz,lbzx,lhz,lhzx,lwz,lwzx } - cmpi 0,1,rx,{ 0,1,-1 }
- // { lbz,lbzx,lhz,lhzx,lwz,lwzx } - cmpli 0,L,rx,{ 0,1 }
- case FusionFeature::FK_LoadCmp1:
- // { ld,ldx } - cmpi 0,1,rx,{ 0,1,-1 }
- // { ld,ldx } - cmpli 0,1,rx,{ 0,1 }
- case FusionFeature::FK_LoadCmp2: {
- const MachineOperand &BT = SecondMI.getOperand(0);
- if (!BT.isReg() ||
- (!Register::isVirtualRegister(BT.getReg()) && BT.getReg() != PPC::CR0))
- return false;
- if (SecondMI.getOpcode() == PPC::CMPDI &&
- matchingImmOps(SecondMI, 2, -1, 16))
- return true;
- return matchingImmOps(SecondMI, 2, 0) || matchingImmOps(SecondMI, 2, 1);
- }
- // { lha,lhax,lwa,lwax } - cmpi 0,L,rx,{ 0,1,-1 }
- case FusionFeature::FK_LoadCmp3: {
- const MachineOperand &BT = SecondMI.getOperand(0);
- if (!BT.isReg() ||
- (!Register::isVirtualRegister(BT.getReg()) && BT.getReg() != PPC::CR0))
- return false;
- return matchingImmOps(SecondMI, 2, 0) || matchingImmOps(SecondMI, 2, 1) ||
- matchingImmOps(SecondMI, 2, -1, 16);
- }
- // mtctr - { bcctr,bcctrl }
- case FusionFeature::FK_ZeroMoveCTR:
- // ( mtctr rx ) is alias of ( mtspr 9, rx )
- return (FirstMI.getOpcode() != PPC::MTSPR &&
- FirstMI.getOpcode() != PPC::MTSPR8) ||
- matchingImmOps(FirstMI, 0, 9);
- // mtlr - { bclr,bclrl }
- case FusionFeature::FK_ZeroMoveLR:
- // ( mtlr rx ) is alias of ( mtspr 8, rx )
- return (FirstMI.getOpcode() != PPC::MTSPR &&
- FirstMI.getOpcode() != PPC::MTSPR8) ||
- matchingImmOps(FirstMI, 0, 8);
- // addis rx,ra,si - addi rt,rx,SI, SI >= 0
- case FusionFeature::FK_AddisAddi: {
- const MachineOperand &RA = FirstMI.getOperand(1);
- const MachineOperand &SI = SecondMI.getOperand(2);
- if (!SI.isImm() || !RA.isReg())
- return false;
- if (RA.getReg() == PPC::ZERO || RA.getReg() == PPC::ZERO8)
- return false;
- return SignExtend64(SI.getImm(), 16) >= 0;
- }
- // addi rx,ra,si - addis rt,rx,SI, ra > 0, SI >= 2
- case FusionFeature::FK_AddiAddis: {
- const MachineOperand &RA = FirstMI.getOperand(1);
- const MachineOperand &SI = FirstMI.getOperand(2);
- if (!SI.isImm() || !RA.isReg())
- return false;
- if (RA.getReg() == PPC::ZERO || RA.getReg() == PPC::ZERO8)
- return false;
- int64_t ExtendedSI = SignExtend64(SI.getImm(), 16);
- return ExtendedSI >= 2;
- }
- }
- llvm_unreachable("All the cases should have been handled");
- return true;
- }
- /// Check if the instr pair, FirstMI and SecondMI, should be fused together.
- /// Given SecondMI, when FirstMI is unspecified, then check if SecondMI may be
- /// part of a fused pair at all.
- static bool shouldScheduleAdjacent(const TargetInstrInfo &TII,
- const TargetSubtargetInfo &TSI,
- const MachineInstr *FirstMI,
- const MachineInstr &SecondMI) {
- // We use the PPC namespace to avoid the need to prefix opcodes with PPC:: in
- // the def file.
- using namespace PPC;
- const PPCSubtarget &ST = static_cast<const PPCSubtarget&>(TSI);
- static const FusionFeature FusionFeatures[] = {
- #define FUSION_FEATURE(KIND, HAS_FEATURE, DEP_OP_IDX, OPSET1, OPSET2) { \
- FusionFeature::FUSION_KIND(KIND), ST.HAS_FEATURE(), DEP_OP_IDX, { OPSET1 },\
- { OPSET2 } },
- #include "PPCMacroFusion.def"
- };
- #undef FUSION_KIND
- for (auto &Feature : FusionFeatures) {
- // Skip if the feature is not supported.
- if (!Feature.isSupported())
- continue;
- // Only when the SecondMI is fusable, we are starting to look for the
- // fusable FirstMI.
- if (Feature.hasOp2(SecondMI.getOpcode())) {
- // If FirstMI == nullptr, that means, we're only checking whether SecondMI
- // can be fused at all.
- if (!FirstMI)
- return true;
- // Checking if the FirstMI is fusable with the SecondMI.
- if (!Feature.hasOp1(FirstMI->getOpcode()))
- continue;
- auto DepOpIdx = Feature.depOpIdx();
- if (DepOpIdx.hasValue()) {
- // Checking if the result of the FirstMI is the desired operand of the
- // SecondMI if the DepOpIdx is set. Otherwise, ignore it.
- if (!matchingRegOps(*FirstMI, 0, SecondMI, *DepOpIdx))
- return false;
- }
-
- // Checking more on the instruction operands.
- if (checkOpConstraints(Feature.getKind(), *FirstMI, SecondMI))
- return true;
- }
- }
- return false;
- }
- } // end anonymous namespace
- namespace llvm {
- std::unique_ptr<ScheduleDAGMutation> createPowerPCMacroFusionDAGMutation () {
- return createMacroFusionDAGMutation(shouldScheduleAdjacent);
- }
- } // end namespace llvm
|