212 lines
7.4 KiB
C++
212 lines
7.4 KiB
C++
//== WebAssemblyMemIntrinsicResults.cpp - Optimize memory intrinsic results ==//
|
|
//
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
///
|
|
/// \file
|
|
/// This file implements an optimization pass using memory intrinsic results.
|
|
///
|
|
/// Calls to memory intrinsics (memcpy, memmove, memset) return the destination
|
|
/// address. They are in the form of
|
|
/// %dst_new = call @memcpy %dst, %src, %len
|
|
/// where %dst and %dst_new registers contain the same value.
|
|
///
|
|
/// This is to enable an optimization wherein uses of the %dst register used in
|
|
/// the parameter can be replaced by uses of the %dst_new register used in the
|
|
/// result, making the %dst register more likely to be single-use, thus more
|
|
/// likely to be useful to register stackifying, and potentially also exposing
|
|
/// the call instruction itself to register stackifying. These both can reduce
|
|
/// local.get/local.set traffic.
|
|
///
|
|
/// The LLVM intrinsics for these return void so they can't use the returned
|
|
/// attribute and consequently aren't handled by the OptimizeReturned pass.
|
|
///
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include "MCTargetDesc/WebAssemblyMCTargetDesc.h"
|
|
#include "WebAssembly.h"
|
|
#include "WebAssemblyMachineFunctionInfo.h"
|
|
#include "WebAssemblySubtarget.h"
|
|
#include "llvm/Analysis/TargetLibraryInfo.h"
|
|
#include "llvm/CodeGen/LiveIntervals.h"
|
|
#include "llvm/CodeGen/MachineBlockFrequencyInfo.h"
|
|
#include "llvm/CodeGen/MachineDominators.h"
|
|
#include "llvm/CodeGen/MachineRegisterInfo.h"
|
|
#include "llvm/CodeGen/Passes.h"
|
|
#include "llvm/Support/Debug.h"
|
|
#include "llvm/Support/raw_ostream.h"
|
|
using namespace llvm;
|
|
|
|
#define DEBUG_TYPE "wasm-mem-intrinsic-results"
|
|
|
|
namespace {
|
|
class WebAssemblyMemIntrinsicResults final : public MachineFunctionPass {
|
|
public:
|
|
static char ID; // Pass identification, replacement for typeid
|
|
WebAssemblyMemIntrinsicResults() : MachineFunctionPass(ID) {}
|
|
|
|
StringRef getPassName() const override {
|
|
return "WebAssembly Memory Intrinsic Results";
|
|
}
|
|
|
|
void getAnalysisUsage(AnalysisUsage &AU) const override {
|
|
AU.setPreservesCFG();
|
|
AU.addRequired<MachineBlockFrequencyInfo>();
|
|
AU.addPreserved<MachineBlockFrequencyInfo>();
|
|
AU.addRequired<MachineDominatorTree>();
|
|
AU.addPreserved<MachineDominatorTree>();
|
|
AU.addRequired<LiveIntervals>();
|
|
AU.addPreserved<SlotIndexes>();
|
|
AU.addPreserved<LiveIntervals>();
|
|
AU.addRequired<TargetLibraryInfoWrapperPass>();
|
|
MachineFunctionPass::getAnalysisUsage(AU);
|
|
}
|
|
|
|
bool runOnMachineFunction(MachineFunction &MF) override;
|
|
|
|
private:
|
|
};
|
|
} // end anonymous namespace
|
|
|
|
char WebAssemblyMemIntrinsicResults::ID = 0;
|
|
INITIALIZE_PASS(WebAssemblyMemIntrinsicResults, DEBUG_TYPE,
|
|
"Optimize memory intrinsic result values for WebAssembly",
|
|
false, false)
|
|
|
|
FunctionPass *llvm::createWebAssemblyMemIntrinsicResults() {
|
|
return new WebAssemblyMemIntrinsicResults();
|
|
}
|
|
|
|
// Replace uses of FromReg with ToReg if they are dominated by MI.
|
|
static bool replaceDominatedUses(MachineBasicBlock &MBB, MachineInstr &MI,
|
|
unsigned FromReg, unsigned ToReg,
|
|
const MachineRegisterInfo &MRI,
|
|
MachineDominatorTree &MDT,
|
|
LiveIntervals &LIS) {
|
|
bool Changed = false;
|
|
|
|
LiveInterval *FromLI = &LIS.getInterval(FromReg);
|
|
LiveInterval *ToLI = &LIS.getInterval(ToReg);
|
|
|
|
SlotIndex FromIdx = LIS.getInstructionIndex(MI).getRegSlot();
|
|
VNInfo *FromVNI = FromLI->getVNInfoAt(FromIdx);
|
|
|
|
SmallVector<SlotIndex, 4> Indices;
|
|
|
|
for (auto I = MRI.use_nodbg_begin(FromReg), E = MRI.use_nodbg_end();
|
|
I != E;) {
|
|
MachineOperand &O = *I++;
|
|
MachineInstr *Where = O.getParent();
|
|
|
|
// Check that MI dominates the instruction in the normal way.
|
|
if (&MI == Where || !MDT.dominates(&MI, Where))
|
|
continue;
|
|
|
|
// If this use gets a different value, skip it.
|
|
SlotIndex WhereIdx = LIS.getInstructionIndex(*Where);
|
|
VNInfo *WhereVNI = FromLI->getVNInfoAt(WhereIdx);
|
|
if (WhereVNI && WhereVNI != FromVNI)
|
|
continue;
|
|
|
|
// Make sure ToReg isn't clobbered before it gets there.
|
|
VNInfo *ToVNI = ToLI->getVNInfoAt(WhereIdx);
|
|
if (ToVNI && ToVNI != FromVNI)
|
|
continue;
|
|
|
|
Changed = true;
|
|
LLVM_DEBUG(dbgs() << "Setting operand " << O << " in " << *Where << " from "
|
|
<< MI << "\n");
|
|
O.setReg(ToReg);
|
|
|
|
// If the store's def was previously dead, it is no longer.
|
|
if (!O.isUndef()) {
|
|
MI.getOperand(0).setIsDead(false);
|
|
|
|
Indices.push_back(WhereIdx.getRegSlot());
|
|
}
|
|
}
|
|
|
|
if (Changed) {
|
|
// Extend ToReg's liveness.
|
|
LIS.extendToIndices(*ToLI, Indices);
|
|
|
|
// Shrink FromReg's liveness.
|
|
LIS.shrinkToUses(FromLI);
|
|
|
|
// If we replaced all dominated uses, FromReg is now killed at MI.
|
|
if (!FromLI->liveAt(FromIdx.getDeadSlot()))
|
|
MI.addRegisterKilled(FromReg, MBB.getParent()
|
|
->getSubtarget<WebAssemblySubtarget>()
|
|
.getRegisterInfo());
|
|
}
|
|
|
|
return Changed;
|
|
}
|
|
|
|
static bool optimizeCall(MachineBasicBlock &MBB, MachineInstr &MI,
|
|
const MachineRegisterInfo &MRI,
|
|
MachineDominatorTree &MDT, LiveIntervals &LIS,
|
|
const WebAssemblyTargetLowering &TLI,
|
|
const TargetLibraryInfo &LibInfo) {
|
|
MachineOperand &Op1 = MI.getOperand(1);
|
|
if (!Op1.isSymbol())
|
|
return false;
|
|
|
|
StringRef Name(Op1.getSymbolName());
|
|
bool CallReturnsInput = Name == TLI.getLibcallName(RTLIB::MEMCPY) ||
|
|
Name == TLI.getLibcallName(RTLIB::MEMMOVE) ||
|
|
Name == TLI.getLibcallName(RTLIB::MEMSET);
|
|
if (!CallReturnsInput)
|
|
return false;
|
|
|
|
LibFunc Func;
|
|
if (!LibInfo.getLibFunc(Name, Func))
|
|
return false;
|
|
|
|
Register FromReg = MI.getOperand(2).getReg();
|
|
Register ToReg = MI.getOperand(0).getReg();
|
|
if (MRI.getRegClass(FromReg) != MRI.getRegClass(ToReg))
|
|
report_fatal_error("Memory Intrinsic results: call to builtin function "
|
|
"with wrong signature, from/to mismatch");
|
|
return replaceDominatedUses(MBB, MI, FromReg, ToReg, MRI, MDT, LIS);
|
|
}
|
|
|
|
bool WebAssemblyMemIntrinsicResults::runOnMachineFunction(MachineFunction &MF) {
|
|
LLVM_DEBUG({
|
|
dbgs() << "********** Memory Intrinsic Results **********\n"
|
|
<< "********** Function: " << MF.getName() << '\n';
|
|
});
|
|
|
|
MachineRegisterInfo &MRI = MF.getRegInfo();
|
|
auto &MDT = getAnalysis<MachineDominatorTree>();
|
|
const WebAssemblyTargetLowering &TLI =
|
|
*MF.getSubtarget<WebAssemblySubtarget>().getTargetLowering();
|
|
const auto &LibInfo =
|
|
getAnalysis<TargetLibraryInfoWrapperPass>().getTLI(MF.getFunction());
|
|
auto &LIS = getAnalysis<LiveIntervals>();
|
|
bool Changed = false;
|
|
|
|
// We don't preserve SSA form.
|
|
MRI.leaveSSA();
|
|
|
|
assert(MRI.tracksLiveness() &&
|
|
"MemIntrinsicResults expects liveness tracking");
|
|
|
|
for (auto &MBB : MF) {
|
|
LLVM_DEBUG(dbgs() << "Basic Block: " << MBB.getName() << '\n');
|
|
for (auto &MI : MBB)
|
|
switch (MI.getOpcode()) {
|
|
default:
|
|
break;
|
|
case WebAssembly::CALL:
|
|
Changed |= optimizeCall(MBB, MI, MRI, MDT, LIS, TLI, LibInfo);
|
|
break;
|
|
}
|
|
}
|
|
|
|
return Changed;
|
|
}
|