forked from OSchip/llvm-project
[llvm][Inline] Add a module level inliner
Add module level inliner, which is a minimum viable product at this point. Also add some tests for it. RFC: https://lists.llvm.org/pipermail/llvm-dev/2021-August/152297.html Reviewed By: kazu Differential Revision: https://reviews.llvm.org/D106448
This commit is contained in:
parent
b3267bb3af
commit
6cad45d5c6
|
@ -23,6 +23,7 @@
|
|||
#include "llvm/Support/PGOOptions.h"
|
||||
#include "llvm/Support/raw_ostream.h"
|
||||
#include "llvm/Transforms/IPO/Inliner.h"
|
||||
#include "llvm/Transforms/IPO/ModuleInliner.h"
|
||||
#include "llvm/Transforms/Instrumentation.h"
|
||||
#include "llvm/Transforms/Scalar/LoopPassManager.h"
|
||||
#include <vector>
|
||||
|
@ -196,6 +197,11 @@ public:
|
|||
ModuleInlinerWrapperPass buildInlinerPipeline(OptimizationLevel Level,
|
||||
ThinOrFullLTOPhase Phase);
|
||||
|
||||
/// Construct the module pipeline that performs inlining with
|
||||
/// module inliner pass.
|
||||
ModuleInlinerPass buildModuleInlinerPipeline(OptimizationLevel Level,
|
||||
ThinOrFullLTOPhase Phase);
|
||||
|
||||
/// Construct the core LLVM module optimization pipeline.
|
||||
///
|
||||
/// This pipeline focuses on optimizing the execution speed of the IR. It
|
||||
|
|
|
@ -0,0 +1,51 @@
|
|||
//===- ModuleInliner.h - Module level Inliner pass --------------*- C++ -*-===//
|
||||
//
|
||||
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
||||
// See https://llvm.org/LICENSE.txt for license information.
|
||||
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
||||
//
|
||||
//===----------------------------------------------------------------------===//
|
||||
|
||||
#ifndef LLVM_TRANSFORMS_IPO_MODULEINLINER_H
|
||||
#define LLVM_TRANSFORMS_IPO_MODULEINLINER_H
|
||||
|
||||
#include "llvm/Analysis/InlineAdvisor.h"
|
||||
#include "llvm/Analysis/InlineCost.h"
|
||||
#include "llvm/Analysis/ReplayInlineAdvisor.h"
|
||||
#include "llvm/Analysis/Utils/ImportedFunctionsInliningStatistics.h"
|
||||
#include "llvm/IR/PassManager.h"
|
||||
#include <utility>
|
||||
|
||||
namespace llvm {
|
||||
|
||||
class AssumptionCacheTracker;
|
||||
class ProfileSummaryInfo;
|
||||
|
||||
/// The module inliner pass for the new pass manager.
|
||||
///
|
||||
/// This pass wires together the inlining utilities and the inline cost
|
||||
/// analysis into a module pass. Different from SCC inliner, it considers every
|
||||
/// call in every function in the whole module and tries to inline if
|
||||
/// profitable. With this module level inliner, it is possible to evaluate more
|
||||
/// heuristics in the module level such like PriorityInlineOrder. It can be
|
||||
/// tuned with a number of parameters to control what cost model is used and
|
||||
/// what tradeoffs are made when making the decision.
|
||||
class ModuleInlinerPass : public PassInfoMixin<ModuleInlinerPass> {
|
||||
public:
|
||||
ModuleInlinerPass(InlineParams Params = getInlineParams(),
|
||||
InliningAdvisorMode Mode = InliningAdvisorMode::Default)
|
||||
: Params(Params), Mode(Mode){};
|
||||
ModuleInlinerPass(ModuleInlinerPass &&Arg) = default;
|
||||
|
||||
PreservedAnalyses run(Module &, ModuleAnalysisManager &);
|
||||
|
||||
private:
|
||||
InlineAdvisor &getAdvisor(const ModuleAnalysisManager &MAM,
|
||||
FunctionAnalysisManager &FAM, Module &M);
|
||||
std::unique_ptr<InlineAdvisor> OwnedAdvisor;
|
||||
const InlineParams Params;
|
||||
const InliningAdvisorMode Mode;
|
||||
};
|
||||
} // end namespace llvm
|
||||
|
||||
#endif // LLVM_TRANSFORMS_IPO_MODULEINLINER_H
|
|
@ -110,6 +110,7 @@
|
|||
#include "llvm/Transforms/IPO/LoopExtractor.h"
|
||||
#include "llvm/Transforms/IPO/LowerTypeTests.h"
|
||||
#include "llvm/Transforms/IPO/MergeFunctions.h"
|
||||
#include "llvm/Transforms/IPO/ModuleInliner.h"
|
||||
#include "llvm/Transforms/IPO/OpenMPOpt.h"
|
||||
#include "llvm/Transforms/IPO/PartialInlining.h"
|
||||
#include "llvm/Transforms/IPO/SCCP.h"
|
||||
|
|
|
@ -55,6 +55,7 @@
|
|||
#include "llvm/Transforms/IPO/Inliner.h"
|
||||
#include "llvm/Transforms/IPO/LowerTypeTests.h"
|
||||
#include "llvm/Transforms/IPO/MergeFunctions.h"
|
||||
#include "llvm/Transforms/IPO/ModuleInliner.h"
|
||||
#include "llvm/Transforms/IPO/OpenMPOpt.h"
|
||||
#include "llvm/Transforms/IPO/PartialInlining.h"
|
||||
#include "llvm/Transforms/IPO/SCCP.h"
|
||||
|
@ -153,6 +154,10 @@ static cl::opt<bool> EnableMemProfiler("enable-mem-prof", cl::init(false),
|
|||
cl::Hidden, cl::ZeroOrMore,
|
||||
cl::desc("Enable memory profiler"));
|
||||
|
||||
static cl::opt<bool> EnableModuleInliner("enable-module-inliner",
|
||||
cl::init(false), cl::Hidden,
|
||||
cl::desc("Enable module inliner"));
|
||||
|
||||
static cl::opt<bool> PerformMandatoryInliningsFirst(
|
||||
"mandatory-inlining-first", cl::init(true), cl::Hidden, cl::ZeroOrMore,
|
||||
cl::desc("Perform mandatory inlinings module-wide, before performing "
|
||||
|
@ -738,6 +743,28 @@ PassBuilder::buildInlinerPipeline(OptimizationLevel Level,
|
|||
return MIWP;
|
||||
}
|
||||
|
||||
ModuleInlinerPass
|
||||
PassBuilder::buildModuleInlinerPipeline(OptimizationLevel Level,
|
||||
ThinOrFullLTOPhase Phase) {
|
||||
InlineParams IP = getInlineParamsFromOptLevel(Level);
|
||||
if (Phase == ThinOrFullLTOPhase::ThinLTOPreLink && PGOOpt &&
|
||||
PGOOpt->Action == PGOOptions::SampleUse)
|
||||
IP.HotCallSiteThreshold = 0;
|
||||
|
||||
if (PGOOpt)
|
||||
IP.EnableDeferral = EnablePGOInlineDeferral;
|
||||
|
||||
// The inline deferral logic is used to avoid losing some
|
||||
// inlining chance in future. It is helpful in SCC inliner, in which
|
||||
// inlining is processed in bottom-up order.
|
||||
// While in module inliner, the inlining order is a priority-based order
|
||||
// by default. The inline deferral is unnecessary there. So we disable the
|
||||
// inline deferral logic in module inliner.
|
||||
IP.EnableDeferral = false;
|
||||
|
||||
return ModuleInlinerPass(IP, UseInlineAdvisor);
|
||||
}
|
||||
|
||||
ModulePassManager
|
||||
PassBuilder::buildModuleSimplificationPipeline(OptimizationLevel Level,
|
||||
ThinOrFullLTOPhase Phase) {
|
||||
|
@ -896,7 +923,10 @@ PassBuilder::buildModuleSimplificationPipeline(OptimizationLevel Level,
|
|||
if (EnableSyntheticCounts && !PGOOpt)
|
||||
MPM.addPass(SyntheticCountsPropagation());
|
||||
|
||||
MPM.addPass(buildInlinerPipeline(Level, Phase));
|
||||
if (EnableModuleInliner)
|
||||
MPM.addPass(buildModuleInlinerPipeline(Level, Phase));
|
||||
else
|
||||
MPM.addPass(buildInlinerPipeline(Level, Phase));
|
||||
|
||||
if (EnableMemProfiler && Phase != ThinOrFullLTOPhase::ThinLTOPreLink) {
|
||||
MPM.addPass(createModuleToFunctionPassAdaptor(MemProfilerPass()));
|
||||
|
|
|
@ -110,6 +110,7 @@ MODULE_PASS("verify", VerifierPass())
|
|||
MODULE_PASS("wholeprogramdevirt", WholeProgramDevirtPass())
|
||||
MODULE_PASS("dfsan", DataFlowSanitizerPass())
|
||||
MODULE_PASS("msan-module", ModuleMemorySanitizerPass({}))
|
||||
MODULE_PASS("module-inline", ModuleInlinerPass())
|
||||
MODULE_PASS("tsan-module", ModuleThreadSanitizerPass())
|
||||
MODULE_PASS("sancov-module", ModuleSanitizerCoveragePass())
|
||||
MODULE_PASS("memprof-module", ModuleMemProfilerPass())
|
||||
|
|
|
@ -29,6 +29,7 @@ add_llvm_component_library(LLVMipo
|
|||
LoopExtractor.cpp
|
||||
LowerTypeTests.cpp
|
||||
MergeFunctions.cpp
|
||||
ModuleInliner.cpp
|
||||
OpenMPOpt.cpp
|
||||
PartialInlining.cpp
|
||||
PassManagerBuilder.cpp
|
||||
|
|
|
@ -0,0 +1,354 @@
|
|||
//===- ModuleInliner.cpp - Code related to module inliner -----------------===//
|
||||
//
|
||||
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
||||
// See https://llvm.org/LICENSE.txt for license information.
|
||||
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
||||
//
|
||||
//===----------------------------------------------------------------------===//
|
||||
//
|
||||
// This file implements the mechanics required to implement inlining without
|
||||
// missing any calls in the module level. It doesn't need any infromation about
|
||||
// SCC or call graph, which is different from the SCC inliner. The decisions of
|
||||
// which calls are profitable to inline are implemented elsewhere.
|
||||
//
|
||||
//===----------------------------------------------------------------------===//
|
||||
|
||||
#include "llvm/Transforms/IPO/ModuleInliner.h"
|
||||
#include "llvm/ADT/DenseMap.h"
|
||||
#include "llvm/ADT/ScopeExit.h"
|
||||
#include "llvm/ADT/SetVector.h"
|
||||
#include "llvm/ADT/SmallPtrSet.h"
|
||||
#include "llvm/ADT/SmallVector.h"
|
||||
#include "llvm/ADT/Statistic.h"
|
||||
#include "llvm/Analysis/AssumptionCache.h"
|
||||
#include "llvm/Analysis/BlockFrequencyInfo.h"
|
||||
#include "llvm/Analysis/GlobalsModRef.h"
|
||||
#include "llvm/Analysis/InlineAdvisor.h"
|
||||
#include "llvm/Analysis/InlineCost.h"
|
||||
#include "llvm/Analysis/InlineOrder.h"
|
||||
#include "llvm/Analysis/OptimizationRemarkEmitter.h"
|
||||
#include "llvm/Analysis/ProfileSummaryInfo.h"
|
||||
#include "llvm/Analysis/TargetLibraryInfo.h"
|
||||
#include "llvm/Analysis/TargetTransformInfo.h"
|
||||
#include "llvm/IR/DebugLoc.h"
|
||||
#include "llvm/IR/DiagnosticInfo.h"
|
||||
#include "llvm/IR/Function.h"
|
||||
#include "llvm/IR/InstIterator.h"
|
||||
#include "llvm/IR/Instruction.h"
|
||||
#include "llvm/IR/Instructions.h"
|
||||
#include "llvm/IR/IntrinsicInst.h"
|
||||
#include "llvm/IR/Metadata.h"
|
||||
#include "llvm/IR/Module.h"
|
||||
#include "llvm/IR/PassManager.h"
|
||||
#include "llvm/IR/User.h"
|
||||
#include "llvm/IR/Value.h"
|
||||
#include "llvm/Support/CommandLine.h"
|
||||
#include "llvm/Support/Debug.h"
|
||||
#include "llvm/Support/raw_ostream.h"
|
||||
#include "llvm/Transforms/Utils/CallPromotionUtils.h"
|
||||
#include "llvm/Transforms/Utils/Cloning.h"
|
||||
#include "llvm/Transforms/Utils/Local.h"
|
||||
#include "llvm/Transforms/Utils/ModuleUtils.h"
|
||||
#include <cassert>
|
||||
#include <functional>
|
||||
|
||||
using namespace llvm;
|
||||
|
||||
#define DEBUG_TYPE "module-inline"
|
||||
|
||||
STATISTIC(NumInlined, "Number of functions inlined");
|
||||
STATISTIC(NumDeleted, "Number of functions deleted because all callers found");
|
||||
|
||||
static cl::opt<bool> InlineEnablePriorityOrder(
|
||||
"module-inline-enable-priority-order", cl::Hidden, cl::init(true),
|
||||
cl::desc("Enable the priority inline order for the module inliner"));
|
||||
|
||||
/// Return true if the specified inline history ID
|
||||
/// indicates an inline history that includes the specified function.
|
||||
static bool inlineHistoryIncludes(
|
||||
Function *F, int InlineHistoryID,
|
||||
const SmallVectorImpl<std::pair<Function *, int>> &InlineHistory) {
|
||||
while (InlineHistoryID != -1) {
|
||||
assert(unsigned(InlineHistoryID) < InlineHistory.size() &&
|
||||
"Invalid inline history ID");
|
||||
if (InlineHistory[InlineHistoryID].first == F)
|
||||
return true;
|
||||
InlineHistoryID = InlineHistory[InlineHistoryID].second;
|
||||
}
|
||||
return false;
|
||||
}
|
||||
|
||||
InlineAdvisor &ModuleInlinerPass::getAdvisor(const ModuleAnalysisManager &MAM,
|
||||
FunctionAnalysisManager &FAM,
|
||||
Module &M) {
|
||||
if (OwnedAdvisor)
|
||||
return *OwnedAdvisor;
|
||||
|
||||
auto *IAA = MAM.getCachedResult<InlineAdvisorAnalysis>(M);
|
||||
if (!IAA) {
|
||||
// It should still be possible to run the inliner as a stand-alone module
|
||||
// pass, for test scenarios. In that case, we default to the
|
||||
// DefaultInlineAdvisor, which doesn't need to keep state between module
|
||||
// pass runs. It also uses just the default InlineParams. In this case, we
|
||||
// need to use the provided FAM, which is valid for the duration of the
|
||||
// inliner pass, and thus the lifetime of the owned advisor. The one we
|
||||
// would get from the MAM can be invalidated as a result of the inliner's
|
||||
// activity.
|
||||
OwnedAdvisor = std::make_unique<DefaultInlineAdvisor>(M, FAM, Params);
|
||||
|
||||
return *OwnedAdvisor;
|
||||
}
|
||||
assert(IAA->getAdvisor() &&
|
||||
"Expected a present InlineAdvisorAnalysis also have an "
|
||||
"InlineAdvisor initialized");
|
||||
return *IAA->getAdvisor();
|
||||
}
|
||||
|
||||
static bool isKnownLibFunction(Function &F, TargetLibraryInfo &TLI) {
|
||||
LibFunc LF;
|
||||
|
||||
// Either this is a normal library function or a "vectorizable"
|
||||
// function. Not using the VFDatabase here because this query
|
||||
// is related only to libraries handled via the TLI.
|
||||
return TLI.getLibFunc(F, LF) ||
|
||||
TLI.isKnownVectorFunctionInLibrary(F.getName());
|
||||
}
|
||||
|
||||
PreservedAnalyses ModuleInlinerPass::run(Module &M,
|
||||
ModuleAnalysisManager &MAM) {
|
||||
LLVM_DEBUG(dbgs() << "---- Module Inliner is Running ---- \n");
|
||||
|
||||
auto &IAA = MAM.getResult<InlineAdvisorAnalysis>(M);
|
||||
if (!IAA.tryCreate(Params, Mode, {})) {
|
||||
M.getContext().emitError(
|
||||
"Could not setup Inlining Advisor for the requested "
|
||||
"mode and/or options");
|
||||
return PreservedAnalyses::all();
|
||||
}
|
||||
|
||||
bool Changed = false;
|
||||
|
||||
ProfileSummaryInfo *PSI = MAM.getCachedResult<ProfileSummaryAnalysis>(M);
|
||||
|
||||
FunctionAnalysisManager &FAM =
|
||||
MAM.getResult<FunctionAnalysisManagerModuleProxy>(M).getManager();
|
||||
|
||||
auto GetTLI = [&FAM](Function &F) -> TargetLibraryInfo & {
|
||||
return FAM.getResult<TargetLibraryAnalysis>(F);
|
||||
};
|
||||
|
||||
InlineAdvisor &Advisor = getAdvisor(MAM, FAM, M);
|
||||
Advisor.onPassEntry();
|
||||
|
||||
auto AdvisorOnExit = make_scope_exit([&] { Advisor.onPassExit(); });
|
||||
|
||||
// In the module inliner, a priority-based worklist is used for calls across
|
||||
// the entire Module. With this module inliner, the inline order is not
|
||||
// limited to bottom-up order. More globally scope inline order is enabled.
|
||||
// Also, the inline deferral logic become unnecessary in this module inliner.
|
||||
// It is possible to use other priority heuristics, e.g. profile-based
|
||||
// heuristic.
|
||||
//
|
||||
// TODO: Here is a huge amount duplicate code between the module inliner and
|
||||
// the SCC inliner, which need some refactoring.
|
||||
std::unique_ptr<InlineOrder<std::pair<CallBase *, int>>> Calls;
|
||||
if (InlineEnablePriorityOrder)
|
||||
Calls = std::make_unique<PriorityInlineOrder<InlineSizePriority>>();
|
||||
else
|
||||
Calls = std::make_unique<DefaultInlineOrder<std::pair<CallBase *, int>>>();
|
||||
assert(Calls != nullptr && "Expected an initialized InlineOrder");
|
||||
|
||||
// Populate the initial list of calls in this module.
|
||||
for (Function &F : M) {
|
||||
auto &ORE = FAM.getResult<OptimizationRemarkEmitterAnalysis>(F);
|
||||
// We want to generally process call sites top-down in order for
|
||||
// simplifications stemming from replacing the call with the returned value
|
||||
// after inlining to be visible to subsequent inlining decisions.
|
||||
// FIXME: Using instructions sequence is a really bad way to do this.
|
||||
// Instead we should do an actual RPO walk of the function body.
|
||||
for (Instruction &I : instructions(F))
|
||||
if (auto *CB = dyn_cast<CallBase>(&I))
|
||||
if (Function *Callee = CB->getCalledFunction()) {
|
||||
if (!Callee->isDeclaration())
|
||||
Calls->push({CB, -1});
|
||||
else if (!isa<IntrinsicInst>(I)) {
|
||||
using namespace ore;
|
||||
setInlineRemark(*CB, "unavailable definition");
|
||||
ORE.emit([&]() {
|
||||
return OptimizationRemarkMissed(DEBUG_TYPE, "NoDefinition", &I)
|
||||
<< NV("Callee", Callee) << " will not be inlined into "
|
||||
<< NV("Caller", CB->getCaller())
|
||||
<< " because its definition is unavailable"
|
||||
<< setIsVerbose();
|
||||
});
|
||||
}
|
||||
}
|
||||
}
|
||||
if (Calls->empty())
|
||||
return PreservedAnalyses::all();
|
||||
|
||||
// When inlining a callee produces new call sites, we want to keep track of
|
||||
// the fact that they were inlined from the callee. This allows us to avoid
|
||||
// infinite inlining in some obscure cases. To represent this, we use an
|
||||
// index into the InlineHistory vector.
|
||||
SmallVector<std::pair<Function *, int>, 16> InlineHistory;
|
||||
|
||||
// Track a set vector of inlined callees so that we can augment the caller
|
||||
// with all of their edges in the call graph before pruning out the ones that
|
||||
// got simplified away.
|
||||
SmallSetVector<Function *, 4> InlinedCallees;
|
||||
|
||||
// Track the dead functions to delete once finished with inlining calls. We
|
||||
// defer deleting these to make it easier to handle the call graph updates.
|
||||
SmallVector<Function *, 4> DeadFunctions;
|
||||
|
||||
// Loop forward over all of the calls.
|
||||
while (!Calls->empty()) {
|
||||
// We expect the calls to typically be batched with sequences of calls that
|
||||
// have the same caller, so we first set up some shared infrastructure for
|
||||
// this caller. We also do any pruning we can at this layer on the caller
|
||||
// alone.
|
||||
Function &F = *Calls->front().first->getCaller();
|
||||
|
||||
LLVM_DEBUG(dbgs() << "Inlining calls in: " << F.getName() << "\n"
|
||||
<< " Function size: " << F.getInstructionCount()
|
||||
<< "\n");
|
||||
|
||||
auto GetAssumptionCache = [&](Function &F) -> AssumptionCache & {
|
||||
return FAM.getResult<AssumptionAnalysis>(F);
|
||||
};
|
||||
|
||||
// Now process as many calls as we have within this caller in the sequence.
|
||||
// We bail out as soon as the caller has to change so we can
|
||||
// prepare the context of that new caller.
|
||||
bool DidInline = false;
|
||||
while (!Calls->empty() && Calls->front().first->getCaller() == &F) {
|
||||
auto P = Calls->pop();
|
||||
CallBase *CB = P.first;
|
||||
const int InlineHistoryID = P.second;
|
||||
Function &Callee = *CB->getCalledFunction();
|
||||
|
||||
if (InlineHistoryID != -1 &&
|
||||
inlineHistoryIncludes(&Callee, InlineHistoryID, InlineHistory)) {
|
||||
setInlineRemark(*CB, "recursive");
|
||||
continue;
|
||||
}
|
||||
|
||||
auto Advice = Advisor.getAdvice(*CB, /*OnlyMandatory*/ false);
|
||||
// Check whether we want to inline this callsite.
|
||||
if (!Advice->isInliningRecommended()) {
|
||||
Advice->recordUnattemptedInlining();
|
||||
continue;
|
||||
}
|
||||
|
||||
// Setup the data structure used to plumb customization into the
|
||||
// `InlineFunction` routine.
|
||||
InlineFunctionInfo IFI(
|
||||
/*cg=*/nullptr, GetAssumptionCache, PSI,
|
||||
&FAM.getResult<BlockFrequencyAnalysis>(*(CB->getCaller())),
|
||||
&FAM.getResult<BlockFrequencyAnalysis>(Callee));
|
||||
|
||||
InlineResult IR =
|
||||
InlineFunction(*CB, IFI, &FAM.getResult<AAManager>(*CB->getCaller()));
|
||||
if (!IR.isSuccess()) {
|
||||
Advice->recordUnsuccessfulInlining(IR);
|
||||
continue;
|
||||
}
|
||||
|
||||
DidInline = true;
|
||||
InlinedCallees.insert(&Callee);
|
||||
++NumInlined;
|
||||
|
||||
LLVM_DEBUG(dbgs() << " Size after inlining: "
|
||||
<< F.getInstructionCount() << "\n");
|
||||
|
||||
// Add any new callsites to defined functions to the worklist.
|
||||
if (!IFI.InlinedCallSites.empty()) {
|
||||
int NewHistoryID = InlineHistory.size();
|
||||
InlineHistory.push_back({&Callee, InlineHistoryID});
|
||||
|
||||
for (CallBase *ICB : reverse(IFI.InlinedCallSites)) {
|
||||
Function *NewCallee = ICB->getCalledFunction();
|
||||
if (!NewCallee) {
|
||||
// Try to promote an indirect (virtual) call without waiting for
|
||||
// the post-inline cleanup and the next DevirtSCCRepeatedPass
|
||||
// iteration because the next iteration may not happen and we may
|
||||
// miss inlining it.
|
||||
if (tryPromoteCall(*ICB))
|
||||
NewCallee = ICB->getCalledFunction();
|
||||
}
|
||||
if (NewCallee)
|
||||
if (!NewCallee->isDeclaration())
|
||||
Calls->push({ICB, NewHistoryID});
|
||||
}
|
||||
}
|
||||
|
||||
// Merge the attributes based on the inlining.
|
||||
AttributeFuncs::mergeAttributesForInlining(F, Callee);
|
||||
|
||||
// For local functions, check whether this makes the callee trivially
|
||||
// dead. In that case, we can drop the body of the function eagerly
|
||||
// which may reduce the number of callers of other functions to one,
|
||||
// changing inline cost thresholds.
|
||||
bool CalleeWasDeleted = false;
|
||||
if (Callee.hasLocalLinkage()) {
|
||||
// To check this we also need to nuke any dead constant uses (perhaps
|
||||
// made dead by this operation on other functions).
|
||||
Callee.removeDeadConstantUsers();
|
||||
// if (Callee.use_empty() && !CG.isLibFunction(Callee)) {
|
||||
if (Callee.use_empty() && !isKnownLibFunction(Callee, GetTLI(Callee))) {
|
||||
Calls->erase_if([&](const std::pair<CallBase *, int> &Call) {
|
||||
return Call.first->getCaller() == &Callee;
|
||||
});
|
||||
// Clear the body and queue the function itself for deletion when we
|
||||
// finish inlining.
|
||||
// Note that after this point, it is an error to do anything other
|
||||
// than use the callee's address or delete it.
|
||||
Callee.dropAllReferences();
|
||||
assert(!is_contained(DeadFunctions, &Callee) &&
|
||||
"Cannot put cause a function to become dead twice!");
|
||||
DeadFunctions.push_back(&Callee);
|
||||
CalleeWasDeleted = true;
|
||||
}
|
||||
}
|
||||
if (CalleeWasDeleted)
|
||||
Advice->recordInliningWithCalleeDeleted();
|
||||
else
|
||||
Advice->recordInlining();
|
||||
}
|
||||
|
||||
if (!DidInline)
|
||||
continue;
|
||||
Changed = true;
|
||||
|
||||
InlinedCallees.clear();
|
||||
}
|
||||
|
||||
// Now that we've finished inlining all of the calls across this module,
|
||||
// delete all of the trivially dead functions.
|
||||
//
|
||||
// Note that this walks a pointer set which has non-deterministic order but
|
||||
// that is OK as all we do is delete things and add pointers to unordered
|
||||
// sets.
|
||||
for (Function *DeadF : DeadFunctions) {
|
||||
// Clear out any cached analyses.
|
||||
FAM.clear(*DeadF, DeadF->getName());
|
||||
|
||||
// And delete the actual function from the module.
|
||||
// The Advisor may use Function pointers to efficiently index various
|
||||
// internal maps, e.g. for memoization. Function cleanup passes like
|
||||
// argument promotion create new functions. It is possible for a new
|
||||
// function to be allocated at the address of a deleted function. We could
|
||||
// index using names, but that's inefficient. Alternatively, we let the
|
||||
// Advisor free the functions when it sees fit.
|
||||
DeadF->getBasicBlockList().clear();
|
||||
M.getFunctionList().remove(DeadF);
|
||||
|
||||
++NumDeleted;
|
||||
}
|
||||
|
||||
if (!Changed)
|
||||
return PreservedAnalyses::all();
|
||||
|
||||
return PreservedAnalyses::none();
|
||||
}
|
|
@ -1,5 +1,6 @@
|
|||
; RUN: opt -inline -S < %s | FileCheck %s
|
||||
; RUN: opt -passes='cgscc(inline)' -S < %s | FileCheck %s
|
||||
; RUN: opt -passes='module-inline' -S < %s | FileCheck %s
|
||||
|
||||
define dso_local i32 @main() #0 {
|
||||
%1 = alloca i32, align 4
|
||||
|
|
|
@ -1,5 +1,6 @@
|
|||
; RUN: opt < %s -inline -S | FileCheck %s
|
||||
; RUN: opt < %s -passes='cgscc(inline)' -S | FileCheck %s
|
||||
; RUN: opt < %s -passes='module-inline' -S | FileCheck %s
|
||||
|
||||
define i32 @testByte(i8 %X) {
|
||||
entry:
|
||||
|
|
|
@ -1,5 +1,6 @@
|
|||
; RUN: opt -inline -S < %s | FileCheck %s
|
||||
; RUN: opt -passes='cgscc(inline)' -S < %s | FileCheck %s
|
||||
; RUN: opt -passes='module-inline' -S < %s | FileCheck %s
|
||||
|
||||
define i32 @caller() {
|
||||
; CHECK-LABEL: @caller(
|
||||
|
|
|
@ -1,5 +1,6 @@
|
|||
; RUN: opt < %s -inline -S | FileCheck %s
|
||||
; RUN: opt < %s -passes='cgscc(inline)' -S | FileCheck %s
|
||||
; RUN: opt < %s -passes='module-inline' -S | FileCheck %s
|
||||
|
||||
; InlineFunction would assert inside the loop that leaves lifetime markers if
|
||||
; there was an zero-sized AllocaInst. Check that it doesn't assert and doesn't
|
||||
|
|
|
@ -1,5 +1,6 @@
|
|||
; RUN: opt -inline -S < %s | FileCheck %s
|
||||
; RUN: opt -passes='cgscc(inline)' -S < %s | FileCheck %s
|
||||
; RUN: opt -passes='module-inline' -S < %s | FileCheck %s
|
||||
|
||||
; PR23216: We can't inline functions using llvm.localescape.
|
||||
|
||||
|
|
|
@ -1,5 +1,6 @@
|
|||
; RUN: opt -inline -S -o - < %s | FileCheck %s
|
||||
; RUN: opt -passes='cgscc(inline)' -S < %s | FileCheck %s
|
||||
; RUN: opt -passes='module-inline' -S < %s | FileCheck %s
|
||||
|
||||
%0 = type opaque
|
||||
%struct.Foo = type { i32, %0* }
|
||||
|
|
|
@ -1,5 +1,6 @@
|
|||
; RUN: opt -S -inline < %s | FileCheck %s
|
||||
; RUN: opt -S -passes='cgscc(inline)' < %s | FileCheck %s
|
||||
; RUN: opt -S -passes='module-inline' < %s | FileCheck %s
|
||||
|
||||
target datalayout = "e-p3:32:32-p4:64:64-n32"
|
||||
|
||||
|
|
|
@ -1,5 +1,6 @@
|
|||
; RUN: opt < %s -S -inline -inline-threshold=20 | FileCheck %s
|
||||
; RUN: opt < %s -S -passes='cgscc(inline)' -inline-threshold=20 | FileCheck %s
|
||||
; RUN: opt < %s -S -passes='module-inline' -inline-threshold=20 | FileCheck %s
|
||||
; Check that we don't drop FastMathFlag when estimating inlining profitability.
|
||||
;
|
||||
; In this test we should inline 'foo' to 'boo', because it'll fold to a
|
||||
|
|
|
@ -1,5 +1,6 @@
|
|||
; RUN: opt -S -inline %s -o - | FileCheck %s
|
||||
; RUN: opt -S -passes='cgscc(inline)' %s -o - | FileCheck %s
|
||||
; RUN: opt -S -passes='module-inline' %s -o - | FileCheck %s
|
||||
|
||||
; Check that memcpy2 is completely inlined away.
|
||||
; CHECK-NOT: memcpy2
|
||||
|
|
|
@ -1,5 +1,6 @@
|
|||
; RUN: opt %s -inline -S | FileCheck %s
|
||||
; RUN: opt %s -passes='cgscc(inline)' -S | FileCheck %s
|
||||
; RUN: opt %s -passes='module-inline' -S | FileCheck %s
|
||||
|
||||
declare void @external_func()
|
||||
|
||||
|
|
|
@ -1,4 +1,5 @@
|
|||
; RUN: opt %s -passes='cgscc(inline)' -S | FileCheck %s
|
||||
; RUN: opt %s -passes='module-inline' -S | FileCheck %s
|
||||
|
||||
declare void @external_func()
|
||||
declare void @abort()
|
||||
|
|
|
@ -3,6 +3,7 @@
|
|||
|
||||
; RUN: opt < %s -inline -S | FileCheck %s
|
||||
; RUN: opt < %s -passes='cgscc(inline)' -S | FileCheck %s
|
||||
; RUN: opt < %s -passes='module-inline' -S | FileCheck %s
|
||||
|
||||
declare void @might_throw()
|
||||
|
||||
|
|
|
@ -3,6 +3,7 @@
|
|||
|
||||
; RUN: opt < %s -inline -S | FileCheck %s
|
||||
; RUN: opt < %s -passes='cgscc(inline)' -S | FileCheck %s
|
||||
; RUN: opt < %s -passes='module-inline' -S | FileCheck %s
|
||||
|
||||
declare void @might_throw()
|
||||
|
||||
|
|
|
@ -1,5 +1,6 @@
|
|||
; RUN: opt < %s -inline -S | FileCheck %s
|
||||
; RUN: opt < %s -passes='cgscc(inline)' -S | FileCheck %s
|
||||
; RUN: opt < %s -passes='module-inline' -S | FileCheck %s
|
||||
; Test that bar and bar2 are both inlined throughout and removed.
|
||||
@A = weak global i32 0 ; <i32*> [#uses=1]
|
||||
@B = weak global i32 0 ; <i32*> [#uses=1]
|
||||
|
|
|
@ -1,5 +1,6 @@
|
|||
; RUN: opt -S -inline %s | FileCheck %s
|
||||
; RUN: opt -S -passes='cgscc(inline)' %s | FileCheck %s
|
||||
; RUN: opt -S -passes='module-inline' %s | FileCheck %s
|
||||
|
||||
declare void @foo()
|
||||
declare void @bar()
|
||||
|
|
|
@ -1,5 +1,6 @@
|
|||
; RUN: opt < %s -inline -S | FileCheck %s
|
||||
; RUN: opt < %s -passes='cgscc(inline)' -S | FileCheck %s
|
||||
; RUN: opt < %s -passes='module-inline' -S | FileCheck %s
|
||||
|
||||
$c = comdat any
|
||||
; CHECK: $c = comdat any
|
||||
|
|
Loading…
Reference in New Issue