123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135 |
- //===----- X86AvoidTrailingCall.cpp - Insert int3 after trailing calls ----===//
- //
- // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
- // See https://llvm.org/LICENSE.txt for license information.
- // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
- //
- //===----------------------------------------------------------------------===//
- //
- // The Windows x64 unwinder decodes the instruction stream during unwinding.
- // The unwinder decodes forward from the current PC to detect epilogue code
- // patterns.
- //
- // First, this means that there must be an instruction after every
- // call instruction for the unwinder to decode. LLVM must maintain the invariant
- // that the last instruction of a function or funclet is not a call, or the
- // unwinder may decode into the next function. Similarly, a call may not
- // immediately precede an epilogue code pattern. As of this writing, the
- // SEH_Epilogue pseudo instruction takes care of that.
- //
- // Second, all non-tail call jump targets must be within the *half-open*
- // interval of the bounds of the function. The unwinder distinguishes between
- // internal jump instructions and tail calls in an epilogue sequence by checking
- // the jump target against the function bounds from the .pdata section. This
- // means that the last regular MBB of an LLVM function must not be empty if
- // there are regular jumps targeting it.
- //
- // This pass upholds these invariants by ensuring that blocks at the end of a
- // function or funclet are a) not empty and b) do not end in a CALL instruction.
- //
- // Unwinder implementation for reference:
- // https://github.com/dotnet/coreclr/blob/a9f3fc16483eecfc47fb79c362811d870be02249/src/unwinder/amd64/unwinder_amd64.cpp#L1015
- //
- //===----------------------------------------------------------------------===//
- #include "X86.h"
- #include "X86InstrInfo.h"
- #include "X86Subtarget.h"
- #include "llvm/CodeGen/MachineInstrBuilder.h"
- #define AVOIDCALL_DESC "X86 avoid trailing call pass"
- #define AVOIDCALL_NAME "x86-avoid-trailing-call"
- #define DEBUG_TYPE AVOIDCALL_NAME
- using namespace llvm;
- namespace {
- class X86AvoidTrailingCallPass : public MachineFunctionPass {
- public:
- X86AvoidTrailingCallPass() : MachineFunctionPass(ID) {}
- bool runOnMachineFunction(MachineFunction &MF) override;
- static char ID;
- private:
- StringRef getPassName() const override { return AVOIDCALL_DESC; }
- };
- } // end anonymous namespace
- char X86AvoidTrailingCallPass::ID = 0;
- FunctionPass *llvm::createX86AvoidTrailingCallPass() {
- return new X86AvoidTrailingCallPass();
- }
- INITIALIZE_PASS(X86AvoidTrailingCallPass, AVOIDCALL_NAME, AVOIDCALL_DESC, false, false)
- // A real instruction is a non-meta, non-pseudo instruction. Some pseudos
- // expand to nothing, and some expand to code. This logic conservatively assumes
- // they might expand to nothing.
- static bool isRealInstruction(MachineInstr &MI) {
- return !MI.isPseudo() && !MI.isMetaInstruction();
- }
- // Return true if this is a call instruction, but not a tail call.
- static bool isCallInstruction(const MachineInstr &MI) {
- return MI.isCall() && !MI.isReturn();
- }
- bool X86AvoidTrailingCallPass::runOnMachineFunction(MachineFunction &MF) {
- const X86Subtarget &STI = MF.getSubtarget<X86Subtarget>();
- const X86InstrInfo &TII = *STI.getInstrInfo();
- assert(STI.isTargetWin64() && "pass only runs on Win64");
- // We don't need to worry about any of the invariants described above if there
- // is no unwind info (CFI).
- if (!MF.hasWinCFI())
- return false;
- // FIXME: Perhaps this pass should also replace SEH_Epilogue by inserting nops
- // before epilogues.
- bool Changed = false;
- for (MachineBasicBlock &MBB : MF) {
- // Look for basic blocks that precede funclet entries or are at the end of
- // the function.
- MachineBasicBlock *NextMBB = MBB.getNextNode();
- if (NextMBB && !NextMBB->isEHFuncletEntry())
- continue;
- // Find the last real instruction in this block.
- auto LastRealInstr = llvm::find_if(reverse(MBB), isRealInstruction);
- // If the block is empty or the last real instruction is a call instruction,
- // insert an int3. If there is a call instruction, insert the int3 between
- // the call and any labels or other meta instructions. If the block is
- // empty, insert at block end.
- bool IsEmpty = LastRealInstr == MBB.rend();
- bool IsCall = !IsEmpty && isCallInstruction(*LastRealInstr);
- if (IsEmpty || IsCall) {
- LLVM_DEBUG({
- if (IsCall) {
- dbgs() << "inserting int3 after trailing call instruction:\n";
- LastRealInstr->dump();
- dbgs() << '\n';
- } else {
- dbgs() << "inserting int3 in trailing empty MBB:\n";
- MBB.dump();
- }
- });
- MachineBasicBlock::iterator MBBI = MBB.end();
- DebugLoc DL;
- if (IsCall) {
- MBBI = std::next(LastRealInstr.getReverse());
- DL = LastRealInstr->getDebugLoc();
- }
- BuildMI(MBB, MBBI, DL, TII.get(X86::INT3));
- Changed = true;
- }
- }
- return Changed;
- }
|