lib/Analysis/MLInlineAdvisor.cpp

097a140dSpatrick//===- MLInlineAdvisor.cpp - machine learned InlineAdvisor ----------------===//
097a140dSpatrick//
097a140dSpatrick// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
097a140dSpatrick// See https://llvm.org/LICENSE.txt for license information.
097a140dSpatrick// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
097a140dSpatrick//
097a140dSpatrick//===----------------------------------------------------------------------===//
097a140dSpatrick//
097a140dSpatrick// This file implements the interface between the inliner and a learned model.
097a140dSpatrick// It delegates model evaluation to either the AOT compiled model (the
097a140dSpatrick// 'release' mode) or a runtime-loaded model (the 'development' case).
097a140dSpatrick//
097a140dSpatrick//===----------------------------------------------------------------------===//
*d415bd75Srobert#include "llvm/Analysis/MLInlineAdvisor.h"
097a140dSpatrick#include "llvm/ADT/SCCIterator.h"
*d415bd75Srobert#include "llvm/Analysis/AssumptionCache.h"
097a140dSpatrick#include "llvm/Analysis/CallGraph.h"
73471bf0Spatrick#include "llvm/Analysis/FunctionPropertiesAnalysis.h"
097a140dSpatrick#include "llvm/Analysis/InlineCost.h"
*d415bd75Srobert#include "llvm/Analysis/InlineModelFeatureMaps.h"
*d415bd75Srobert#include "llvm/Analysis/LazyCallGraph.h"
*d415bd75Srobert#include "llvm/Analysis/LoopInfo.h"
097a140dSpatrick#include "llvm/Analysis/MLModelRunner.h"
097a140dSpatrick#include "llvm/Analysis/OptimizationRemarkEmitter.h"
097a140dSpatrick#include "llvm/Analysis/TargetTransformInfo.h"
*d415bd75Srobert#include "llvm/IR/Dominators.h"
097a140dSpatrick#include "llvm/IR/InstIterator.h"
097a140dSpatrick#include "llvm/IR/PassManager.h"
097a140dSpatrick#include "llvm/Support/CommandLine.h"
097a140dSpatrick
097a140dSpatrickusing namespace llvm;
097a140dSpatrick
*d415bd75Srobert#if defined(LLVM_HAVE_TF_AOT_INLINERSIZEMODEL)
*d415bd75Srobert#include "llvm/Analysis/ReleaseModeModelRunner.h"
*d415bd75Srobert// codegen-ed file
*d415bd75Srobert#include "InlinerSizeModel.h" // NOLINT
*d415bd75Srobert
*d415bd75Srobertstd::unique_ptr<InlineAdvisor>
*d415bd75Srobertllvm::getReleaseModeAdvisor(Module &M, ModuleAnalysisManager &MAM) {
*d415bd75Srobert  auto AOTRunner =
*d415bd75Srobert      std::make_unique<ReleaseModeModelRunner<llvm::InlinerSizeModel>>(
*d415bd75Srobert          M.getContext(), FeatureMap, DecisionName);
*d415bd75Srobert  return std::make_unique<MLInlineAdvisor>(M, MAM, std::move(AOTRunner));
*d415bd75Srobert}
*d415bd75Srobert#endif
*d415bd75Srobert
097a140dSpatrick#define DEBUG_TYPE "inline-ml"
097a140dSpatrick
// Hidden command-line knob (default 2.0). MLInlineAdvisor::onSuccessfulInlining
// multiplies it by the module's initial IR size; once the tracked current IR
// size exceeds that product, the advisor sets ForceStop.
097a140dSpatrickstatic cl::opt<float> SizeIncreaseThreshold(
097a140dSpatrick    "ml-advisor-size-increase-threshold", cl::Hidden,
097a140dSpatrick    cl::desc("Maximum factor by which expected native size may increase before "
097a140dSpatrick             "blocking any further inlining."),
097a140dSpatrick    cl::init(2.0));
097a140dSpatrick
// Hidden testing knob (default false). When set, MLInlineAdvisor::onPassExit
// does not clear the FunctionPropertiesInfo cache. onPassEntry still clears it
// whenever it does not return early.
*d415bd75Srobertstatic cl::opt<bool> KeepFPICache(
*d415bd75Srobert    "ml-advisor-keep-fpi-cache", cl::Hidden,
*d415bd75Srobert    cl::desc(
*d415bd75Srobert        "For test - keep the ML Inline advisor's FunctionPropertiesInfo cache"),
*d415bd75Srobert    cl::init(false));
*d415bd75Srobert
// Table of tensor specs for the model's input features. Every entry is created
// as an int64_t spec with shape {1}. The entries produced by
// INLINE_COST_FEATURE_ITERATOR are listed before those produced by
// INLINE_FEATURE_ITERATOR; positions in this array are what
// MLInlineAdvice::reportContextForRemark uses to pair names with tensors.
73471bf0Spatrick// clang-format off
*d415bd75Srobertconst std::array<TensorSpec, NumberOfFeatures> llvm::FeatureMap{
*d415bd75Srobert#define POPULATE_NAMES(_, NAME) TensorSpec::createSpec<int64_t>(NAME, {1} ),
73471bf0Spatrick// InlineCost features - these must come first
73471bf0Spatrick  INLINE_COST_FEATURE_ITERATOR(POPULATE_NAMES)
73471bf0Spatrick#undef POPULATE_NAMES
73471bf0Spatrick
73471bf0Spatrick// Non-cost features
*d415bd75Srobert#define POPULATE_NAMES(_, NAME, __) TensorSpec::createSpec<int64_t>(NAME, {1} ),
097a140dSpatrick  INLINE_FEATURE_ITERATOR(POPULATE_NAMES)
097a140dSpatrick#undef POPULATE_NAMES
097a140dSpatrick};
73471bf0Spatrick// clang-format on
097a140dSpatrick
// String identifiers exported in namespace llvm. DecisionName is passed to the
// release-mode model runner in getReleaseModeAdvisor. The other two are not
// used in this file.
// NOTE(review): DefaultDecisionName and RewardName are presumably consumed by
// the development-mode/training code - confirm against their users.
097a140dSpatrickconst char *const llvm::DecisionName = "inlining_decision";
097a140dSpatrickconst char *const llvm::DefaultDecisionName = "inlining_default";
097a140dSpatrickconst char *const llvm::RewardName = "delta_size";
097a140dSpatrick
097a140dSpatrickCallBase *getInlinableCS(Instruction &I) {
097a140dSpatrick  if (auto *CS = dyn_cast<CallBase>(&I))
097a140dSpatrick    if (Function *Callee = CS->getCalledFunction()) {
097a140dSpatrick      if (!Callee->isDeclaration()) {
097a140dSpatrick        return CS;
097a140dSpatrick      }
097a140dSpatrick    }
097a140dSpatrick  return nullptr;
097a140dSpatrick}
097a140dSpatrick
097a140dSpatrickMLInlineAdvisor::MLInlineAdvisor(Module &M, ModuleAnalysisManager &MAM,
097a140dSpatrick                                 std::unique_ptr<MLModelRunner> Runner)
097a140dSpatrick    : InlineAdvisor(
73471bf0Spatrick          M, MAM.getResult<FunctionAnalysisManagerModuleProxy>(M).getManager()),
*d415bd75Srobert      ModelRunner(std::move(Runner)),
*d415bd75Srobert      CG(MAM.getResult<LazyCallGraphAnalysis>(M)),
097a140dSpatrick      InitialIRSize(getModuleIRSize()), CurrentIRSize(InitialIRSize) {
097a140dSpatrick  assert(ModelRunner);
097a140dSpatrick
097a140dSpatrick  // Extract the 'call site height' feature - the position of a call site
097a140dSpatrick  // relative to the farthest statically reachable SCC node. We don't mutate
097a140dSpatrick  // this value while inlining happens. Empirically, this feature proved
097a140dSpatrick  // critical in behavioral cloning - i.e. training a model to mimic the manual
097a140dSpatrick  // heuristic's decisions - and, thus, equally important for training for
097a140dSpatrick  // improvement.
*d415bd75Srobert  CallGraph CGraph(M);
*d415bd75Srobert  for (auto I = scc_begin(&CGraph); !I.isAtEnd(); ++I) {
097a140dSpatrick    const std::vector<CallGraphNode *> &CGNodes = *I;
097a140dSpatrick    unsigned Level = 0;
097a140dSpatrick    for (auto *CGNode : CGNodes) {
097a140dSpatrick      Function *F = CGNode->getFunction();
097a140dSpatrick      if (!F || F->isDeclaration())
097a140dSpatrick        continue;
097a140dSpatrick      for (auto &I : instructions(F)) {
097a140dSpatrick        if (auto *CS = getInlinableCS(I)) {
097a140dSpatrick          auto *Called = CS->getCalledFunction();
*d415bd75Srobert          auto Pos = FunctionLevels.find(&CG.get(*Called));
097a140dSpatrick          // In bottom up traversal, an inlinable callee is either in the
097a140dSpatrick          // same SCC, or to a function in a visited SCC. So not finding its
097a140dSpatrick          // level means we haven't visited it yet, meaning it's in this SCC.
097a140dSpatrick          if (Pos == FunctionLevels.end())
097a140dSpatrick            continue;
097a140dSpatrick          Level = std::max(Level, Pos->second + 1);
097a140dSpatrick        }
097a140dSpatrick      }
097a140dSpatrick    }
097a140dSpatrick    for (auto *CGNode : CGNodes) {
097a140dSpatrick      Function *F = CGNode->getFunction();
097a140dSpatrick      if (F && !F->isDeclaration())
*d415bd75Srobert        FunctionLevels[&CG.get(*F)] = Level;
097a140dSpatrick    }
097a140dSpatrick  }
*d415bd75Srobert  for (auto KVP : FunctionLevels) {
*d415bd75Srobert    AllNodes.insert(KVP.first);
*d415bd75Srobert    EdgeCount += getLocalCalls(KVP.first->getFunction());
*d415bd75Srobert  }
*d415bd75Srobert  NodeCount = AllNodes.size();
*d415bd75Srobert}
*d415bd75Srobert
*d415bd75Srobertunsigned MLInlineAdvisor::getInitialFunctionLevel(const Function &F) const {
*d415bd75Srobert  return CG.lookup(F) ? FunctionLevels.at(CG.lookup(F)) : 0;
*d415bd75Srobert}
*d415bd75Srobert
*d415bd75Srobertvoid MLInlineAdvisor::onPassEntry(LazyCallGraph::SCC *LastSCC) {
*d415bd75Srobert  if (!LastSCC || ForceStop)
*d415bd75Srobert    return;
*d415bd75Srobert  FPICache.clear();
*d415bd75Srobert  // Function passes executed between InlinerPass runs may have changed the
*d415bd75Srobert  // module-wide features.
*d415bd75Srobert  // The cgscc pass manager rules are such that:
*d415bd75Srobert  // - if a pass leads to merging SCCs, then the pipeline is restarted on the
*d415bd75Srobert  // merged SCC
*d415bd75Srobert  // - if a pass leads to splitting the SCC, then we continue with one of the
*d415bd75Srobert  // splits
*d415bd75Srobert  // This means that the NodesInLastSCC is a superset (not strict) of the nodes
*d415bd75Srobert  // that subsequent passes would have processed
*d415bd75Srobert  // - in addition, if new Nodes were created by a pass (e.g. CoroSplit),
*d415bd75Srobert  // they'd be adjacent to Nodes in the last SCC. So we just need to check the
*d415bd75Srobert  // boundary of Nodes in NodesInLastSCC for Nodes we haven't seen. We don't
*d415bd75Srobert  // care about the nature of the Edge (call or ref).
*d415bd75Srobert  NodeCount -= static_cast<int64_t>(NodesInLastSCC.size());
*d415bd75Srobert  while (!NodesInLastSCC.empty()) {
*d415bd75Srobert    const auto *N = *NodesInLastSCC.begin();
*d415bd75Srobert    NodesInLastSCC.erase(N);
*d415bd75Srobert    // The Function wrapped by N could have been deleted since we last saw it.
*d415bd75Srobert    if (N->isDead()) {
*d415bd75Srobert      assert(!N->getFunction().isDeclaration());
*d415bd75Srobert      continue;
*d415bd75Srobert    }
*d415bd75Srobert    ++NodeCount;
*d415bd75Srobert    EdgeCount += getLocalCalls(N->getFunction());
*d415bd75Srobert    for (const auto &E : *(*N)) {
*d415bd75Srobert      const auto *AdjNode = &E.getNode();
*d415bd75Srobert      assert(!AdjNode->isDead() && !AdjNode->getFunction().isDeclaration());
*d415bd75Srobert      auto I = AllNodes.insert(AdjNode);
*d415bd75Srobert      if (I.second)
*d415bd75Srobert        NodesInLastSCC.insert(AdjNode);
*d415bd75Srobert    }
097a140dSpatrick  }
097a140dSpatrick
*d415bd75Srobert  EdgeCount -= EdgesOfLastSeenNodes;
*d415bd75Srobert  EdgesOfLastSeenNodes = 0;
*d415bd75Srobert
*d415bd75Srobert  // (Re)use NodesInLastSCC to remember the nodes in the SCC right now,
*d415bd75Srobert  // in case the SCC is split before onPassExit and some nodes are split out
*d415bd75Srobert  assert(NodesInLastSCC.empty());
*d415bd75Srobert  for (const auto &N : *LastSCC)
*d415bd75Srobert    NodesInLastSCC.insert(&N);
097a140dSpatrick}
*d415bd75Srobert
*d415bd75Srobertvoid MLInlineAdvisor::onPassExit(LazyCallGraph::SCC *LastSCC) {
*d415bd75Srobert  // No need to keep this around - function passes will invalidate it.
*d415bd75Srobert  if (!KeepFPICache)
*d415bd75Srobert    FPICache.clear();
*d415bd75Srobert  if (!LastSCC || ForceStop)
*d415bd75Srobert    return;
*d415bd75Srobert  // Keep track of the nodes and edges we last saw. Then, in onPassEntry,
*d415bd75Srobert  // we update the node count and edge count from the subset of these nodes that
*d415bd75Srobert  // survived.
*d415bd75Srobert  EdgesOfLastSeenNodes = 0;
*d415bd75Srobert
*d415bd75Srobert  // Check on nodes that were in SCC onPassEntry
*d415bd75Srobert  for (auto I = NodesInLastSCC.begin(); I != NodesInLastSCC.end();) {
*d415bd75Srobert    if ((*I)->isDead())
*d415bd75Srobert      NodesInLastSCC.erase(*I++);
*d415bd75Srobert    else
*d415bd75Srobert      EdgesOfLastSeenNodes += getLocalCalls((*I++)->getFunction());
*d415bd75Srobert  }
*d415bd75Srobert
*d415bd75Srobert  // Check on nodes that may have got added to SCC
*d415bd75Srobert  for (const auto &N : *LastSCC) {
*d415bd75Srobert    assert(!N.isDead());
*d415bd75Srobert    auto I = NodesInLastSCC.insert(&N);
*d415bd75Srobert    if (I.second)
*d415bd75Srobert      EdgesOfLastSeenNodes += getLocalCalls(N.getFunction());
*d415bd75Srobert  }
*d415bd75Srobert  assert(NodeCount >= NodesInLastSCC.size());
*d415bd75Srobert  assert(EdgeCount >= EdgesOfLastSeenNodes);
097a140dSpatrick}
097a140dSpatrick
097a140dSpatrickint64_t MLInlineAdvisor::getLocalCalls(Function &F) {
*d415bd75Srobert  return getCachedFPI(F).DirectCallsToDefinedFunctions;
097a140dSpatrick}
097a140dSpatrick
097a140dSpatrick// Update the internal state of the advisor, and force invalidate feature
097a140dSpatrick// analysis. Currently, we maintain minimal (and very simple) global state - the
097a140dSpatrick// number of functions and the number of static calls. We also keep track of the
097a140dSpatrick// total IR size in this module, to stop misbehaving policies at a certain bloat
097a140dSpatrick// factor (SizeIncreaseThreshold)
097a140dSpatrickvoid MLInlineAdvisor::onSuccessfulInlining(const MLInlineAdvice &Advice,
097a140dSpatrick                                           bool CalleeWasDeleted) {
097a140dSpatrick  assert(!ForceStop);
097a140dSpatrick  Function *Caller = Advice.getCaller();
097a140dSpatrick  Function *Callee = Advice.getCallee();
097a140dSpatrick  // The caller features aren't valid anymore.
73471bf0Spatrick  {
73471bf0Spatrick    PreservedAnalyses PA = PreservedAnalyses::all();
73471bf0Spatrick    PA.abandon<FunctionPropertiesAnalysis>();
*d415bd75Srobert    PA.abandon<DominatorTreeAnalysis>();
*d415bd75Srobert    PA.abandon<LoopAnalysis>();
73471bf0Spatrick    FAM.invalidate(*Caller, PA);
73471bf0Spatrick  }
*d415bd75Srobert  Advice.updateCachedCallerFPI(FAM);
097a140dSpatrick  int64_t IRSizeAfter =
097a140dSpatrick      getIRSize(*Caller) + (CalleeWasDeleted ? 0 : Advice.CalleeIRSize);
097a140dSpatrick  CurrentIRSize += IRSizeAfter - (Advice.CallerIRSize + Advice.CalleeIRSize);
097a140dSpatrick  if (CurrentIRSize > SizeIncreaseThreshold * InitialIRSize)
097a140dSpatrick    ForceStop = true;
097a140dSpatrick
097a140dSpatrick  // We can delta-update module-wide features. We know the inlining only changed
097a140dSpatrick  // the caller, and maybe the callee (by deleting the latter).
097a140dSpatrick  // Nodes are simple to update.
097a140dSpatrick  // For edges, we 'forget' the edges that the caller and callee used to have
097a140dSpatrick  // before inlining, and add back what they currently have together.
097a140dSpatrick  int64_t NewCallerAndCalleeEdges =
*d415bd75Srobert      getCachedFPI(*Caller).DirectCallsToDefinedFunctions;
097a140dSpatrick
097a140dSpatrick  if (CalleeWasDeleted)
097a140dSpatrick    --NodeCount;
097a140dSpatrick  else
73471bf0Spatrick    NewCallerAndCalleeEdges +=
*d415bd75Srobert        getCachedFPI(*Callee).DirectCallsToDefinedFunctions;
097a140dSpatrick  EdgeCount += (NewCallerAndCalleeEdges - Advice.CallerAndCalleeEdges);
097a140dSpatrick  assert(CurrentIRSize >= 0 && EdgeCount >= 0 && NodeCount >= 0);
097a140dSpatrick}
097a140dSpatrick
097a140dSpatrickint64_t MLInlineAdvisor::getModuleIRSize() const {
097a140dSpatrick  int64_t Ret = 0;
*d415bd75Srobert  for (auto &F : M)
097a140dSpatrick    if (!F.isDeclaration())
097a140dSpatrick      Ret += getIRSize(F);
097a140dSpatrick  return Ret;
097a140dSpatrick}
097a140dSpatrick
*d415bd75SrobertFunctionPropertiesInfo &MLInlineAdvisor::getCachedFPI(Function &F) const {
*d415bd75Srobert  auto InsertPair =
*d415bd75Srobert      FPICache.insert(std::make_pair(&F, FunctionPropertiesInfo()));
*d415bd75Srobert  if (!InsertPair.second)
*d415bd75Srobert    return InsertPair.first->second;
*d415bd75Srobert  InsertPair.first->second = FAM.getResult<FunctionPropertiesAnalysis>(F);
*d415bd75Srobert  return InsertPair.first->second;
*d415bd75Srobert}
*d415bd75Srobert
73471bf0Spatrickstd::unique_ptr<InlineAdvice> MLInlineAdvisor::getAdviceImpl(CallBase &CB) {
*d415bd75Srobert  if (auto Skip = getSkipAdviceIfUnreachableCallsite(CB))
*d415bd75Srobert    return Skip;
*d415bd75Srobert
097a140dSpatrick  auto &Caller = *CB.getCaller();
097a140dSpatrick  auto &Callee = *CB.getCalledFunction();
097a140dSpatrick
097a140dSpatrick  auto GetAssumptionCache = [&](Function &F) -> AssumptionCache & {
097a140dSpatrick    return FAM.getResult<AssumptionAnalysis>(F);
097a140dSpatrick  };
097a140dSpatrick  auto &TIR = FAM.getResult<TargetIRAnalysis>(Callee);
097a140dSpatrick  auto &ORE = FAM.getResult<OptimizationRemarkEmitterAnalysis>(Caller);
097a140dSpatrick
73471bf0Spatrick  auto MandatoryKind = InlineAdvisor::getMandatoryKind(CB, FAM, ORE);
097a140dSpatrick  // If this is a "never inline" case, there won't be any changes to internal
097a140dSpatrick  // state we need to track, so we can just return the base InlineAdvice, which
097a140dSpatrick  // will do nothing interesting.
097a140dSpatrick  // Same thing if this is a recursive case.
73471bf0Spatrick  if (MandatoryKind == InlineAdvisor::MandatoryInliningKind::Never ||
097a140dSpatrick      &Caller == &Callee)
73471bf0Spatrick    return getMandatoryAdvice(CB, false);
097a140dSpatrick
73471bf0Spatrick  bool Mandatory =
73471bf0Spatrick      MandatoryKind == InlineAdvisor::MandatoryInliningKind::Always;
097a140dSpatrick
097a140dSpatrick  // If we need to stop, we won't want to track anymore any state changes, so
097a140dSpatrick  // we just return the base InlineAdvice, which acts as a noop.
097a140dSpatrick  if (ForceStop) {
097a140dSpatrick    ORE.emit([&] {
097a140dSpatrick      return OptimizationRemarkMissed(DEBUG_TYPE, "ForceStop", &CB)
097a140dSpatrick             << "Won't attempt inlining because module size grew too much.";
097a140dSpatrick    });
097a140dSpatrick    return std::make_unique<InlineAdvice>(this, CB, ORE, Mandatory);
097a140dSpatrick  }
097a140dSpatrick
097a140dSpatrick  int CostEstimate = 0;
097a140dSpatrick  if (!Mandatory) {
097a140dSpatrick    auto IsCallSiteInlinable =
097a140dSpatrick        llvm::getInliningCostEstimate(CB, TIR, GetAssumptionCache);
097a140dSpatrick    if (!IsCallSiteInlinable) {
097a140dSpatrick      // We can't inline this for correctness reasons, so return the base
097a140dSpatrick      // InlineAdvice, as we don't care about tracking any state changes (which
097a140dSpatrick      // won't happen).
097a140dSpatrick      return std::make_unique<InlineAdvice>(this, CB, ORE, false);
097a140dSpatrick    }
097a140dSpatrick    CostEstimate = *IsCallSiteInlinable;
097a140dSpatrick  }
097a140dSpatrick
73471bf0Spatrick  const auto CostFeatures =
73471bf0Spatrick      llvm::getInliningCostFeatures(CB, TIR, GetAssumptionCache);
73471bf0Spatrick  if (!CostFeatures) {
73471bf0Spatrick    return std::make_unique<InlineAdvice>(this, CB, ORE, false);
73471bf0Spatrick  }
73471bf0Spatrick
097a140dSpatrick  if (Mandatory)
73471bf0Spatrick    return getMandatoryAdvice(CB, true);
097a140dSpatrick
097a140dSpatrick  auto NrCtantParams = 0;
097a140dSpatrick  for (auto I = CB.arg_begin(), E = CB.arg_end(); I != E; ++I) {
097a140dSpatrick    NrCtantParams += (isa<Constant>(*I));
097a140dSpatrick  }
097a140dSpatrick
*d415bd75Srobert  auto &CallerBefore = getCachedFPI(Caller);
*d415bd75Srobert  auto &CalleeBefore = getCachedFPI(Callee);
097a140dSpatrick
*d415bd75Srobert  *ModelRunner->getTensor<int64_t>(FeatureIndex::CalleeBasicBlockCount) =
*d415bd75Srobert      CalleeBefore.BasicBlockCount;
*d415bd75Srobert  *ModelRunner->getTensor<int64_t>(FeatureIndex::CallSiteHeight) =
*d415bd75Srobert      getInitialFunctionLevel(Caller);
*d415bd75Srobert  *ModelRunner->getTensor<int64_t>(FeatureIndex::NodeCount) = NodeCount;
*d415bd75Srobert  *ModelRunner->getTensor<int64_t>(FeatureIndex::NrCtantParams) = NrCtantParams;
*d415bd75Srobert  *ModelRunner->getTensor<int64_t>(FeatureIndex::EdgeCount) = EdgeCount;
*d415bd75Srobert  *ModelRunner->getTensor<int64_t>(FeatureIndex::CallerUsers) =
*d415bd75Srobert      CallerBefore.Uses;
*d415bd75Srobert  *ModelRunner->getTensor<int64_t>(
*d415bd75Srobert      FeatureIndex::CallerConditionallyExecutedBlocks) =
*d415bd75Srobert      CallerBefore.BlocksReachedFromConditionalInstruction;
*d415bd75Srobert  *ModelRunner->getTensor<int64_t>(FeatureIndex::CallerBasicBlockCount) =
*d415bd75Srobert      CallerBefore.BasicBlockCount;
*d415bd75Srobert  *ModelRunner->getTensor<int64_t>(
*d415bd75Srobert      FeatureIndex::CalleeConditionallyExecutedBlocks) =
*d415bd75Srobert      CalleeBefore.BlocksReachedFromConditionalInstruction;
*d415bd75Srobert  *ModelRunner->getTensor<int64_t>(FeatureIndex::CalleeUsers) =
*d415bd75Srobert      CalleeBefore.Uses;
*d415bd75Srobert  *ModelRunner->getTensor<int64_t>(FeatureIndex::CostEstimate) = CostEstimate;
73471bf0Spatrick
73471bf0Spatrick  // Add the cost features
73471bf0Spatrick  for (size_t I = 0;
73471bf0Spatrick       I < static_cast<size_t>(InlineCostFeatureIndex::NumberOfFeatures); ++I) {
*d415bd75Srobert    *ModelRunner->getTensor<int64_t>(inlineCostFeatureToMlFeature(
*d415bd75Srobert        static_cast<InlineCostFeatureIndex>(I))) = CostFeatures->at(I);
73471bf0Spatrick  }
73471bf0Spatrick
097a140dSpatrick  return getAdviceFromModel(CB, ORE);
097a140dSpatrick}
097a140dSpatrick
097a140dSpatrickstd::unique_ptr<MLInlineAdvice>
097a140dSpatrickMLInlineAdvisor::getAdviceFromModel(CallBase &CB,
097a140dSpatrick                                    OptimizationRemarkEmitter &ORE) {
*d415bd75Srobert  return std::make_unique<MLInlineAdvice>(
*d415bd75Srobert      this, CB, ORE, static_cast<bool>(ModelRunner->evaluate<int64_t>()));
*d415bd75Srobert}
*d415bd75Srobert
*d415bd75Srobertstd::unique_ptr<InlineAdvice>
*d415bd75SrobertMLInlineAdvisor::getSkipAdviceIfUnreachableCallsite(CallBase &CB) {
*d415bd75Srobert  if (!FAM.getResult<DominatorTreeAnalysis>(*CB.getCaller())
*d415bd75Srobert           .isReachableFromEntry(CB.getParent()))
*d415bd75Srobert    return std::make_unique<InlineAdvice>(this, CB, getCallerORE(CB), false);
*d415bd75Srobert  return nullptr;
097a140dSpatrick}
097a140dSpatrick
73471bf0Spatrickstd::unique_ptr<InlineAdvice> MLInlineAdvisor::getMandatoryAdvice(CallBase &CB,
73471bf0Spatrick                                                                  bool Advice) {
73471bf0Spatrick  // Make sure we track inlinings in all cases - mandatory or not.
*d415bd75Srobert  if (auto Skip = getSkipAdviceIfUnreachableCallsite(CB))
*d415bd75Srobert    return Skip;
73471bf0Spatrick  if (Advice && !ForceStop)
73471bf0Spatrick    return getMandatoryAdviceImpl(CB);
73471bf0Spatrick
73471bf0Spatrick  // If this is a "never inline" case, there won't be any changes to internal
73471bf0Spatrick  // state we need to track, so we can just return the base InlineAdvice, which
73471bf0Spatrick  // will do nothing interesting.
73471bf0Spatrick  // Same if we are forced to stop - we don't track anymore.
73471bf0Spatrick  return std::make_unique<InlineAdvice>(this, CB, getCallerORE(CB), Advice);
73471bf0Spatrick}
73471bf0Spatrick
097a140dSpatrickstd::unique_ptr<MLInlineAdvice>
73471bf0SpatrickMLInlineAdvisor::getMandatoryAdviceImpl(CallBase &CB) {
73471bf0Spatrick  return std::make_unique<MLInlineAdvice>(this, CB, getCallerORE(CB), true);
097a140dSpatrick}
097a140dSpatrick
*d415bd75Srobertvoid MLInlineAdvisor::print(raw_ostream &OS) const {
*d415bd75Srobert  OS << "[MLInlineAdvisor] Nodes: " << NodeCount << " Edges: " << EdgeCount
*d415bd75Srobert     << " EdgesOfLastSeenNodes: " << EdgesOfLastSeenNodes << "\n";
*d415bd75Srobert  OS << "[MLInlineAdvisor] FPI:\n";
*d415bd75Srobert  for (auto I : FPICache) {
*d415bd75Srobert    OS << I.first->getName() << ":\n";
*d415bd75Srobert    I.second.print(OS);
*d415bd75Srobert    OS << "\n";
*d415bd75Srobert  }
*d415bd75Srobert  OS << "\n";
*d415bd75Srobert}
*d415bd75Srobert
*d415bd75SrobertMLInlineAdvice::MLInlineAdvice(MLInlineAdvisor *Advisor, CallBase &CB,
*d415bd75Srobert                               OptimizationRemarkEmitter &ORE,
*d415bd75Srobert                               bool Recommendation)
*d415bd75Srobert    : InlineAdvice(Advisor, CB, ORE, Recommendation),
*d415bd75Srobert      CallerIRSize(Advisor->isForcedToStop() ? 0 : Advisor->getIRSize(*Caller)),
*d415bd75Srobert      CalleeIRSize(Advisor->isForcedToStop() ? 0 : Advisor->getIRSize(*Callee)),
*d415bd75Srobert      CallerAndCalleeEdges(Advisor->isForcedToStop()
*d415bd75Srobert                               ? 0
*d415bd75Srobert                               : (Advisor->getLocalCalls(*Caller) +
*d415bd75Srobert                                  Advisor->getLocalCalls(*Callee))),
*d415bd75Srobert      PreInlineCallerFPI(Advisor->getCachedFPI(*Caller)) {
*d415bd75Srobert  if (Recommendation)
*d415bd75Srobert    FPU.emplace(Advisor->getCachedFPI(*getCaller()), CB);
*d415bd75Srobert}
*d415bd75Srobert
097a140dSpatrickvoid MLInlineAdvice::reportContextForRemark(
097a140dSpatrick    DiagnosticInfoOptimizationBase &OR) {
097a140dSpatrick  using namespace ore;
097a140dSpatrick  OR << NV("Callee", Callee->getName());
097a140dSpatrick  for (size_t I = 0; I < NumberOfFeatures; ++I)
*d415bd75Srobert    OR << NV(FeatureMap[I].name(),
*d415bd75Srobert             *getAdvisor()->getModelRunner().getTensor<int64_t>(I));
097a140dSpatrick  OR << NV("ShouldInline", isInliningRecommended());
097a140dSpatrick}
097a140dSpatrick
*d415bd75Srobertvoid MLInlineAdvice::updateCachedCallerFPI(FunctionAnalysisManager &FAM) const {
*d415bd75Srobert  FPU->finish(FAM);
*d415bd75Srobert}
*d415bd75Srobert
097a140dSpatrickvoid MLInlineAdvice::recordInliningImpl() {
097a140dSpatrick  ORE.emit([&]() {
097a140dSpatrick    OptimizationRemark R(DEBUG_TYPE, "InliningSuccess", DLoc, Block);
097a140dSpatrick    reportContextForRemark(R);
097a140dSpatrick    return R;
097a140dSpatrick  });
097a140dSpatrick  getAdvisor()->onSuccessfulInlining(*this, /*CalleeWasDeleted*/ false);
097a140dSpatrick}
097a140dSpatrick
097a140dSpatrickvoid MLInlineAdvice::recordInliningWithCalleeDeletedImpl() {
097a140dSpatrick  ORE.emit([&]() {
097a140dSpatrick    OptimizationRemark R(DEBUG_TYPE, "InliningSuccessWithCalleeDeleted", DLoc,
097a140dSpatrick                         Block);
097a140dSpatrick    reportContextForRemark(R);
097a140dSpatrick    return R;
097a140dSpatrick  });
097a140dSpatrick  getAdvisor()->onSuccessfulInlining(*this, /*CalleeWasDeleted*/ true);
097a140dSpatrick}
097a140dSpatrick
097a140dSpatrickvoid MLInlineAdvice::recordUnsuccessfulInliningImpl(
097a140dSpatrick    const InlineResult &Result) {
*d415bd75Srobert  getAdvisor()->getCachedFPI(*Caller) = PreInlineCallerFPI;
097a140dSpatrick  ORE.emit([&]() {
097a140dSpatrick    OptimizationRemarkMissed R(DEBUG_TYPE, "InliningAttemptedAndUnsuccessful",
097a140dSpatrick                               DLoc, Block);
097a140dSpatrick    reportContextForRemark(R);
097a140dSpatrick    return R;
097a140dSpatrick  });
097a140dSpatrick}
097a140dSpatrickvoid MLInlineAdvice::recordUnattemptedInliningImpl() {
*d415bd75Srobert  assert(!FPU);
097a140dSpatrick  ORE.emit([&]() {
097a140dSpatrick    OptimizationRemarkMissed R(DEBUG_TYPE, "IniningNotAttempted", DLoc, Block);
097a140dSpatrick    reportContextForRemark(R);
097a140dSpatrick    return R;
097a140dSpatrick  });
097a140dSpatrick}