136 lines
4.9 KiB
C++
136 lines
4.9 KiB
C++
|
//===----- X86AvoidTrailingCall.cpp - Insert int3 after trailing calls ----===//
|
||
|
//
|
||
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
||
|
// See https://llvm.org/LICENSE.txt for license information.
|
||
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
||
|
//
|
||
|
//===----------------------------------------------------------------------===//
|
||
|
//
|
||
|
// The Windows x64 unwinder decodes the instruction stream during unwinding.
|
||
|
// The unwinder decodes forward from the current PC to detect epilogue code
|
||
|
// patterns.
|
||
|
//
|
||
|
// First, this means that there must be an instruction after every
|
||
|
// call instruction for the unwinder to decode. LLVM must maintain the invariant
|
||
|
// that the last instruction of a function or funclet is not a call, or the
|
||
|
// unwinder may decode into the next function. Similarly, a call may not
|
||
|
// immediately precede an epilogue code pattern. As of this writing, the
|
||
|
// SEH_Epilogue pseudo instruction takes care of that.
|
||
|
//
|
||
|
// Second, all non-tail call jump targets must be within the *half-open*
|
||
|
// interval of the bounds of the function. The unwinder distinguishes between
|
||
|
// internal jump instructions and tail calls in an epilogue sequence by checking
|
||
|
// the jump target against the function bounds from the .pdata section. This
|
||
|
// means that the last regular MBB of an LLVM function must not be empty if
|
||
|
// there are regular jumps targeting it.
|
||
|
//
|
||
|
// This pass upholds these invariants by ensuring that blocks at the end of a
|
||
|
// function or funclet are a) not empty and b) do not end in a CALL instruction.
|
||
|
//
|
||
|
// Unwinder implementation for reference:
|
||
|
// https://github.com/dotnet/coreclr/blob/a9f3fc16483eecfc47fb79c362811d870be02249/src/unwinder/amd64/unwinder_amd64.cpp#L1015
|
||
|
//
|
||
|
//===----------------------------------------------------------------------===//
|
||
|
|
||
|
#include "X86.h"
|
||
|
#include "X86InstrInfo.h"
|
||
|
#include "X86Subtarget.h"
|
||
|
#include "llvm/CodeGen/MachineInstrBuilder.h"
|
||
|
|
||
|
#define AVOIDCALL_DESC "X86 avoid trailing call pass"
|
||
|
#define AVOIDCALL_NAME "x86-avoid-trailing-call"
|
||
|
|
||
|
#define DEBUG_TYPE AVOIDCALL_NAME
|
||
|
|
||
|
using namespace llvm;
|
||
|
|
||
|
namespace {
|
||
|
class X86AvoidTrailingCallPass : public MachineFunctionPass {
|
||
|
public:
|
||
|
X86AvoidTrailingCallPass() : MachineFunctionPass(ID) {}
|
||
|
|
||
|
bool runOnMachineFunction(MachineFunction &MF) override;
|
||
|
|
||
|
static char ID;
|
||
|
|
||
|
private:
|
||
|
StringRef getPassName() const override { return AVOIDCALL_DESC; }
|
||
|
};
|
||
|
} // end anonymous namespace
|
||
|
|
||
|
char X86AvoidTrailingCallPass::ID = 0;
|
||
|
|
||
|
FunctionPass *llvm::createX86AvoidTrailingCallPass() {
|
||
|
return new X86AvoidTrailingCallPass();
|
||
|
}
|
||
|
|
||
|
INITIALIZE_PASS(X86AvoidTrailingCallPass, AVOIDCALL_NAME, AVOIDCALL_DESC, false, false)
|
||
|
|
||
|
// A real instruction is a non-meta, non-pseudo instruction. Some pseudos
|
||
|
// expand to nothing, and some expand to code. This logic conservatively assumes
|
||
|
// they might expand to nothing.
|
||
|
static bool isRealInstruction(MachineInstr &MI) {
|
||
|
return !MI.isPseudo() && !MI.isMetaInstruction();
|
||
|
}
|
||
|
|
||
|
// Return true if this is a call instruction, but not a tail call.
|
||
|
static bool isCallInstruction(const MachineInstr &MI) {
|
||
|
return MI.isCall() && !MI.isReturn();
|
||
|
}
|
||
|
|
||
|
bool X86AvoidTrailingCallPass::runOnMachineFunction(MachineFunction &MF) {
|
||
|
const X86Subtarget &STI = MF.getSubtarget<X86Subtarget>();
|
||
|
const X86InstrInfo &TII = *STI.getInstrInfo();
|
||
|
assert(STI.isTargetWin64() && "pass only runs on Win64");
|
||
|
|
||
|
// We don't need to worry about any of the invariants described above if there
|
||
|
// is no unwind info (CFI).
|
||
|
if (!MF.hasWinCFI())
|
||
|
return false;
|
||
|
|
||
|
// FIXME: Perhaps this pass should also replace SEH_Epilogue by inserting nops
|
||
|
// before epilogues.
|
||
|
|
||
|
bool Changed = false;
|
||
|
for (MachineBasicBlock &MBB : MF) {
|
||
|
// Look for basic blocks that precede funclet entries or are at the end of
|
||
|
// the function.
|
||
|
MachineBasicBlock *NextMBB = MBB.getNextNode();
|
||
|
if (NextMBB && !NextMBB->isEHFuncletEntry())
|
||
|
continue;
|
||
|
|
||
|
// Find the last real instruction in this block.
|
||
|
auto LastRealInstr = llvm::find_if(reverse(MBB), isRealInstruction);
|
||
|
|
||
|
// If the block is empty or the last real instruction is a call instruction,
|
||
|
// insert an int3. If there is a call instruction, insert the int3 between
|
||
|
// the call and any labels or other meta instructions. If the block is
|
||
|
// empty, insert at block end.
|
||
|
bool IsEmpty = LastRealInstr == MBB.rend();
|
||
|
bool IsCall = !IsEmpty && isCallInstruction(*LastRealInstr);
|
||
|
if (IsEmpty || IsCall) {
|
||
|
LLVM_DEBUG({
|
||
|
if (IsCall) {
|
||
|
dbgs() << "inserting int3 after trailing call instruction:\n";
|
||
|
LastRealInstr->dump();
|
||
|
dbgs() << '\n';
|
||
|
} else {
|
||
|
dbgs() << "inserting int3 in trailing empty MBB:\n";
|
||
|
MBB.dump();
|
||
|
}
|
||
|
});
|
||
|
|
||
|
MachineBasicBlock::iterator MBBI = MBB.end();
|
||
|
DebugLoc DL;
|
||
|
if (IsCall) {
|
||
|
MBBI = std::next(LastRealInstr.getReverse());
|
||
|
DL = LastRealInstr->getDebugLoc();
|
||
|
}
|
||
|
BuildMI(MBB, MBBI, DL, TII.get(X86::INT3));
|
||
|
Changed = true;
|
||
|
}
|
||
|
}
|
||
|
|
||
|
return Changed;
|
||
|
}
|