lib/Analysis/DevelopmentModeInlineAdvisor.cpp

*82d56013Sjoerg//===- DevelopmentModeInlineAdvisor.cpp - runtime-loadable model runner  --===//
*82d56013Sjoerg//
*82d56013Sjoerg//                     The LLVM Compiler Infrastructure
*82d56013Sjoerg//
*82d56013Sjoerg// This file is distributed under the University of Illinois Open Source
*82d56013Sjoerg// License. See LICENSE.TXT for details.
*82d56013Sjoerg//
*82d56013Sjoerg//===----------------------------------------------------------------------===//
*82d56013Sjoerg//
*82d56013Sjoerg// This file implements a model runner using Tensorflow C APIs, allowing the
*82d56013Sjoerg// loading of a model from a command line option.
*82d56013Sjoerg//
*82d56013Sjoerg//===----------------------------------------------------------------------===//
*82d56013Sjoerg#include "llvm/Config/config.h"
*82d56013Sjoerg#if defined(LLVM_HAVE_TF_API)
*82d56013Sjoerg
*82d56013Sjoerg#include "llvm/Analysis/CallGraph.h"
*82d56013Sjoerg#include "llvm/Analysis/InlineSizeEstimatorAnalysis.h"
*82d56013Sjoerg#include "llvm/Analysis/MLInlineAdvisor.h"
*82d56013Sjoerg#include "llvm/Analysis/Utils/TFUtils.h"
*82d56013Sjoerg#include "llvm/IR/LLVMContext.h"
*82d56013Sjoerg#include "llvm/Support/CommandLine.h"
*82d56013Sjoerg#include "llvm/Support/ManagedStatic.h"
*82d56013Sjoerg
*82d56013Sjoerg#include <vector>
*82d56013Sjoerg
*82d56013Sjoergusing namespace llvm;
*82d56013Sjoerg
*82d56013Sjoergstatic cl::opt<std::string> TrainingLog(
*82d56013Sjoerg    "training-log", cl::Hidden,
*82d56013Sjoerg    cl::desc("Path where the development - mode inlining log is saved."));
*82d56013Sjoerg
*82d56013Sjoergstatic cl::opt<std::string> TFModelUnderTrainingPath(
*82d56013Sjoerg    "ml-inliner-model-under-training", cl::Hidden,
*82d56013Sjoerg    cl::desc(R"(Path to SavedModel from the previous training iteration.
*82d56013SjoergThe directory is also expected to contain a JSON specification of the
*82d56013Sjoergoutputs expected to be logged, where the first entry must be the
*82d56013Sjoerginlining decision. The file containing the specification should be
*82d56013Sjoergcalled output_spec.json. The expected JSON value is an array of
*82d56013Sjoergdictionaries. Each dictionary should have 2 keys:
*82d56013Sjoerg
*82d56013Sjoerg- "tensor_spec, followed by the TensorSpec description of the
*82d56013Sjoergoutput; and
*82d56013Sjoerg- "logging_name", a string indicating the name to use when
*82d56013Sjoerglogging the output values.
*82d56013Sjoerg
*82d56013SjoergExample:
*82d56013Sjoerg[
*82d56013Sjoerg  {
*82d56013Sjoerg    "logging_name" : "some_name",
*82d56013Sjoerg    "tensor_spec" : {
*82d56013Sjoerg      "name" : "model_name",
*82d56013Sjoerg      "port" : 0,
*82d56013Sjoerg      "shape" : [2, 3],
*82d56013Sjoerg      "type" : "float"
*82d56013Sjoerg      }
*82d56013Sjoerg  }
*82d56013Sjoerg]
*82d56013Sjoerg
*82d56013SjoergThe first value must always correspond to the decision.)"));
*82d56013Sjoerg
*82d56013Sjoergstatic cl::opt<std::string> TFOutputSpecOverride(
*82d56013Sjoerg    "ml-inliner-output-spec-override", cl::Hidden,
*82d56013Sjoerg    cl::desc("Override the path to the output spec json file. See "
*82d56013Sjoerg             "-ml-inliner-model-under-training documentation for the "
*82d56013Sjoerg             "specification of that file."));
*82d56013Sjoerg
*82d56013Sjoergstatic cl::opt<std::string> TFFeedPrefix("ml-inliner-trained-model-feed-prefix",
*82d56013Sjoerg                                         cl::Hidden, cl::init("action_"),
*82d56013Sjoerg                                         cl::desc("Prefix for feature names."));
*82d56013Sjoerg
*82d56013Sjoergnamespace {
/// One inlining decision and its outcome, as consumed by TrainingLogger.
struct InlineEvent {
  /// The decision the default policy would have taken.
  int64_t DefaultDecision{0};

  /// The decision that was actually advised. It equals DefaultDecision when
  /// training off the default policy.
  int64_t AdvisedDecision{0};

  /// The real outcome. It is 'false' when inlining failed with an error even
  /// though AdvisedDecision was true; otherwise it matches AdvisedDecision.
  bool Effect{false};

  /// The size change caused by the decision: size_after - size_before.
  int64_t Reward{0};
};
*82d56013Sjoerg
*82d56013Sjoerg/// Collect data we may use for training a model, and write it as a textual
*82d56013Sjoerg/// Tensorflow SequenceExample
*82d56013Sjoerg/// (https://www.tensorflow.org/api_docs/python/tf/train/SequenceExample)
*82d56013Sjoerg/// protobuf (https://developers.google.com/protocol-buffers).
*82d56013Sjoerg/// Because this is a protobuf, we cannot just stream the events as they come.
*82d56013Sjoerg/// Internally, TrainingLogger stores data in column-major format, because that
*82d56013Sjoerg/// lines up with how TF SequenceExample represents it.
*82d56013Sjoergclass ModelUnderTrainingRunner;
*82d56013Sjoergclass TrainingLogger final {
*82d56013Sjoergpublic:
*82d56013Sjoerg  TrainingLogger(StringRef LogFileName, const ModelUnderTrainingRunner *MUTR);
*82d56013Sjoerg
*82d56013Sjoerg  /// Log one inlining event.
*82d56013Sjoerg  void logInlineEvent(const InlineEvent &Event,
*82d56013Sjoerg                      const MLModelRunner &ModelRunner);
*82d56013Sjoerg
*82d56013Sjoerg  /// Print the stored tensors.
*82d56013Sjoerg  void print();
*82d56013Sjoerg
*82d56013Sjoergprivate:
*82d56013Sjoerg  StringRef LogFileName;
*82d56013Sjoerg  const ModelUnderTrainingRunner *const MUTR;
*82d56013Sjoerg  std::unique_ptr<Logger> L;
*82d56013Sjoerg  std::vector<bool> Effects;
*82d56013Sjoerg  /// There's at least one output. We'll set this to a different value if MUTR
*82d56013Sjoerg  /// is avaliable.
*82d56013Sjoerg  size_t OutputCount = 1;
*82d56013Sjoerg  /// Set these 2 clearly OOB, to make sure we set them later.
*82d56013Sjoerg  size_t DefaultDecisionPos = std::numeric_limits<size_t>::max();
*82d56013Sjoerg  size_t DecisionPos = std::numeric_limits<size_t>::max();
*82d56013Sjoerg};
*82d56013Sjoerg
*82d56013Sjoerg/// An extension of the MLInlineAdvisor for the 'development' mode, targeting
*82d56013Sjoerg/// the offline training scenario. Note that training happens outside of the
*82d56013Sjoerg/// compiler, this facility is concerned with producing training data ("logs").
*82d56013Sjoerg/// This InlineAdvisor can operate in the following modes:
*82d56013Sjoerg///
*82d56013Sjoerg/// 1) collect logs for the default policy. This is useful for bootstrapping
*82d56013Sjoerg/// training, which will be considerably faster by starting from a reasonable
*82d56013Sjoerg/// policy.
*82d56013Sjoerg///
*82d56013Sjoerg/// 2) collect logs for the ML policy, using a model from a previous
*82d56013Sjoerg/// training. Potentially, that model uses internally some small random
*82d56013Sjoerg/// perturbation of its weights, to induce exploration (setting this up is the
*82d56013Sjoerg/// responsibility of the training algorithm). The logs would then be used to
*82d56013Sjoerg/// retrain and improve on this model.
*82d56013Sjoerg///
*82d56013Sjoerg/// 3) use the provided model, with no logging. This is useful for end to end
*82d56013Sjoerg/// validation - the model, in this case, is a release candidate and shouldn't
*82d56013Sjoerg/// have random perturbations. It is a convenience feature: rather than needing
*82d56013Sjoerg/// to take the release candidate model and compile it in 'release' mode,
*82d56013Sjoerg/// validate it, then potentially discard it, it's easier to just pass the model
*82d56013Sjoerg/// to the compiler, albeit compilation would be slower, as a one-off. Once the
*82d56013Sjoerg/// model behaves satisfactorily, it can be compiled AOT, for efficiency, in
*82d56013Sjoerg/// release mode. The expectation is that a well-trained model provides a good
*82d56013Sjoerg/// policy over a sufficiently diverse codebase, over many changes (i.e.
*82d56013Sjoerg/// training happens seldom).
*82d56013Sjoergclass DevelopmentModeMLInlineAdvisor : public MLInlineAdvisor {
*82d56013Sjoergpublic:
*82d56013Sjoerg  DevelopmentModeMLInlineAdvisor(
*82d56013Sjoerg      Module &M, ModuleAnalysisManager &MAM,
*82d56013Sjoerg      std::unique_ptr<MLModelRunner> ModelRunner,
*82d56013Sjoerg      std::function<bool(CallBase &)> GetDefaultAdvice, bool IsDoingInference,
*82d56013Sjoerg      std::unique_ptr<TrainingLogger> Logger);
*82d56013Sjoerg
*82d56013Sjoerg  size_t getTotalSizeEstimate();
*82d56013Sjoerg
*82d56013Sjoerg  virtual ~DevelopmentModeMLInlineAdvisor();
*82d56013Sjoerg  void updateNativeSizeEstimate(int64_t Change) {
*82d56013Sjoerg    *CurrentNativeSize += Change;
*82d56013Sjoerg  }
*82d56013Sjoerg  void resetNativeSize(Function *F) {
*82d56013Sjoerg    PreservedAnalyses PA = PreservedAnalyses::all();
*82d56013Sjoerg    PA.abandon<InlineSizeEstimatorAnalysis>();
*82d56013Sjoerg    FAM.invalidate(*F, PA);
*82d56013Sjoerg  }
*82d56013Sjoerg
*82d56013Sjoerg  std::unique_ptr<MLInlineAdvice>
*82d56013Sjoerg  getAdviceFromModel(CallBase &CB, OptimizationRemarkEmitter &ORE) override;
*82d56013Sjoerg
*82d56013Sjoerg  Optional<size_t> getNativeSizeEstimate(const Function &F) const;
*82d56013Sjoerg
*82d56013Sjoergprivate:
*82d56013Sjoerg  bool isLogging() const { return !!Logger; }
*82d56013Sjoerg  std::unique_ptr<MLInlineAdvice> getMandatoryAdviceImpl(CallBase &CB) override;
*82d56013Sjoerg
*82d56013Sjoerg  std::function<bool(CallBase &)> GetDefaultAdvice;
*82d56013Sjoerg  const bool IsDoingInference;
*82d56013Sjoerg  std::unique_ptr<TrainingLogger> Logger;
*82d56013Sjoerg
*82d56013Sjoerg  const Optional<int32_t> InitialNativeSize;
*82d56013Sjoerg  Optional<int32_t> CurrentNativeSize;
*82d56013Sjoerg};
*82d56013Sjoerg
*82d56013Sjoerg/// A variant of MLInlineAdvice that tracks all non-trivial inlining
*82d56013Sjoerg/// decisions, for training/logging.
*82d56013Sjoergclass LoggingMLInlineAdvice : public MLInlineAdvice {
*82d56013Sjoergpublic:
*82d56013Sjoerg  LoggingMLInlineAdvice(DevelopmentModeMLInlineAdvisor *Advisor, CallBase &CB,
*82d56013Sjoerg                        OptimizationRemarkEmitter &ORE, bool Recommendation,
*82d56013Sjoerg                        TrainingLogger &Logger,
*82d56013Sjoerg                        Optional<size_t> CallerSizeEstimateBefore,
*82d56013Sjoerg                        Optional<size_t> CalleeSizeEstimateBefore,
*82d56013Sjoerg                        bool DefaultDecision, bool Mandatory = false)
*82d56013Sjoerg      : MLInlineAdvice(Advisor, CB, ORE, Recommendation), Logger(Logger),
*82d56013Sjoerg        CallerSizeEstimateBefore(CallerSizeEstimateBefore),
*82d56013Sjoerg        CalleeSizeEstimateBefore(CalleeSizeEstimateBefore),
*82d56013Sjoerg        DefaultDecision(DefaultDecision), Mandatory(Mandatory) {}
*82d56013Sjoerg
*82d56013Sjoerg  virtual ~LoggingMLInlineAdvice() = default;
*82d56013Sjoerg
*82d56013Sjoergprivate:
*82d56013Sjoerg  DevelopmentModeMLInlineAdvisor *getAdvisor() const {
*82d56013Sjoerg    return static_cast<DevelopmentModeMLInlineAdvisor *>(Advisor);
*82d56013Sjoerg  }
*82d56013Sjoerg  void recordInliningImpl() override {
*82d56013Sjoerg    MLInlineAdvice::recordInliningImpl();
*82d56013Sjoerg    getAdvisor()->resetNativeSize(Caller);
*82d56013Sjoerg    int Reward = std::numeric_limits<int>::max();
*82d56013Sjoerg    if (InlineSizeEstimatorAnalysis::isEvaluatorRequested() &&
*82d56013Sjoerg        !getAdvisor()->isForcedToStop()) {
*82d56013Sjoerg      int NativeSizeAfter = *getAdvisor()->getNativeSizeEstimate(*Caller) +
*82d56013Sjoerg                            *CalleeSizeEstimateBefore;
*82d56013Sjoerg      Reward = NativeSizeAfter -
*82d56013Sjoerg               (*CallerSizeEstimateBefore + *CalleeSizeEstimateBefore);
*82d56013Sjoerg      getAdvisor()->updateNativeSizeEstimate(Reward);
*82d56013Sjoerg    }
*82d56013Sjoerg    log(Reward, /*Success=*/true);
*82d56013Sjoerg  }
*82d56013Sjoerg
*82d56013Sjoerg  void recordInliningWithCalleeDeletedImpl() override {
*82d56013Sjoerg    MLInlineAdvice::recordInliningWithCalleeDeletedImpl();
*82d56013Sjoerg    getAdvisor()->resetNativeSize(Caller);
*82d56013Sjoerg    if (InlineSizeEstimatorAnalysis::isEvaluatorRequested() &&
*82d56013Sjoerg        !getAdvisor()->isForcedToStop()) {
*82d56013Sjoerg      int NativeSizeAfter = *getAdvisor()->getNativeSizeEstimate(*Caller);
*82d56013Sjoerg      int Reward = NativeSizeAfter -
*82d56013Sjoerg                   (*CallerSizeEstimateBefore + *CalleeSizeEstimateBefore);
*82d56013Sjoerg      getAdvisor()->updateNativeSizeEstimate(Reward);
*82d56013Sjoerg      log(Reward, /*Success=*/true);
*82d56013Sjoerg    }
*82d56013Sjoerg  }
*82d56013Sjoerg
*82d56013Sjoerg  void recordUnsuccessfulInliningImpl(const InlineResult &Result) override {
*82d56013Sjoerg    MLInlineAdvice::recordUnsuccessfulInliningImpl(Result);
*82d56013Sjoerg    log(NoReward, /*Success=*/false);
*82d56013Sjoerg  }
*82d56013Sjoerg
*82d56013Sjoerg  void recordUnattemptedInliningImpl() override {
*82d56013Sjoerg    MLInlineAdvice::recordUnattemptedInliningImpl();
*82d56013Sjoerg    log(NoReward, /*Success=*/false);
*82d56013Sjoerg  }
*82d56013Sjoerg
*82d56013Sjoerg  void log(int64_t Reward, bool Success) {
*82d56013Sjoerg    if (Mandatory)
*82d56013Sjoerg      return;
*82d56013Sjoerg    InlineEvent Event;
*82d56013Sjoerg    Event.AdvisedDecision = isInliningRecommended();
*82d56013Sjoerg    Event.DefaultDecision = DefaultDecision;
*82d56013Sjoerg    Event.Effect = Success;
*82d56013Sjoerg    Event.Reward = Reward;
*82d56013Sjoerg    Logger.logInlineEvent(Event, getAdvisor()->getModelRunner());
*82d56013Sjoerg  }
*82d56013Sjoerg
*82d56013Sjoerg  static const int64_t NoReward = 0;
*82d56013Sjoerg  TrainingLogger &Logger;
*82d56013Sjoerg  const Optional<size_t> CallerSizeEstimateBefore;
*82d56013Sjoerg  const Optional<size_t> CalleeSizeEstimateBefore;
*82d56013Sjoerg  const int64_t DefaultDecision;
*82d56013Sjoerg  const int64_t Mandatory;
*82d56013Sjoerg};
*82d56013Sjoerg
*82d56013Sjoerg/// A pseudo model runner. We use it to store feature values when collecting
*82d56013Sjoerg/// logs for the default policy, but never ask it to 'run'.
*82d56013Sjoergclass NoInferenceModelRunner : public MLModelRunner {
*82d56013Sjoergpublic:
*82d56013Sjoerg  NoInferenceModelRunner(LLVMContext &Ctx)
*82d56013Sjoerg      : MLModelRunner(Ctx), Features(NumberOfFeatures) {}
*82d56013Sjoerg  void setFeature(FeatureIndex Index, int64_t Value) override {
*82d56013Sjoerg    Features[static_cast<int>(Index)] = Value;
*82d56013Sjoerg  }
*82d56013Sjoerg
*82d56013Sjoerg  int64_t getFeature(int Index) const override { return Features[Index]; }
*82d56013Sjoerg  bool run() override {
*82d56013Sjoerg    llvm_unreachable("We shouldn't call run on this model runner.");
*82d56013Sjoerg  }
*82d56013Sjoerg
*82d56013Sjoergprivate:
*82d56013Sjoerg  InlineFeatures Features;
*82d56013Sjoerg};
*82d56013Sjoerg
*82d56013Sjoerg/// ModelUnderTrainingRunner - training mode implementation. It uses TF C APIs
*82d56013Sjoerg/// to dynamically load and evaluate a TF SavedModel
*82d56013Sjoerg/// (https://www.tensorflow.org/guide/saved_model). Runtime performance is
*82d56013Sjoerg/// sacrificed for ease of use while training.
*82d56013Sjoergclass ModelUnderTrainingRunner final : public MLModelRunner {
*82d56013Sjoergpublic:
*82d56013Sjoerg  ModelUnderTrainingRunner(LLVMContext &Ctx, const std::string &ModelPath);
*82d56013Sjoerg
*82d56013Sjoerg  bool run() override;
*82d56013Sjoerg
*82d56013Sjoerg  // Disallows copy and assign.
*82d56013Sjoerg  ModelUnderTrainingRunner(const ModelUnderTrainingRunner &) = delete;
*82d56013Sjoerg  ModelUnderTrainingRunner &
*82d56013Sjoerg  operator=(const ModelUnderTrainingRunner &) = delete;
*82d56013Sjoerg
*82d56013Sjoerg  void setFeature(FeatureIndex Index, int64_t Value) override;
*82d56013Sjoerg  int64_t getFeature(int Index) const override;
*82d56013Sjoerg  bool isValid() const { return !!Evaluator; }
*82d56013Sjoerg
*82d56013Sjoerg  const std::vector<LoggedFeatureSpec> &outputLoggedFeatureSpecs() const {
*82d56013Sjoerg    return OutputSpecs;
*82d56013Sjoerg  }
*82d56013Sjoerg
*82d56013Sjoerg  const Optional<TFModelEvaluator::EvaluationResult> &
*82d56013Sjoerg  lastEvaluationResult() const {
*82d56013Sjoerg    return LastEvaluationResult;
*82d56013Sjoerg  }
*82d56013Sjoerg
*82d56013Sjoergprivate:
*82d56013Sjoerg  std::unique_ptr<TFModelEvaluator> Evaluator;
*82d56013Sjoerg  std::vector<LoggedFeatureSpec> OutputSpecs;
*82d56013Sjoerg  Optional<TFModelEvaluator::EvaluationResult> LastEvaluationResult;
*82d56013Sjoerg
*82d56013Sjoerg  // The training framework needs some additional features.
*82d56013Sjoerg  const std::vector<TensorSpec> TrainingOnlyFeatures{
*82d56013Sjoerg      TensorSpec::createSpec<int64_t>(TFFeedPrefix + "inlining_default", {1}),
*82d56013Sjoerg      TensorSpec::createSpec<float>(TFFeedPrefix + "discount", {1}),
*82d56013Sjoerg      TensorSpec::createSpec<float>(TFFeedPrefix + "reward", {1}),
*82d56013Sjoerg      TensorSpec::createSpec<int32_t>(TFFeedPrefix + "step_type", {1})};
*82d56013Sjoerg};
*82d56013Sjoerg} // namespace
*82d56013Sjoerg
*82d56013SjoergTrainingLogger::TrainingLogger(StringRef LogFileName,
*82d56013Sjoerg                               const ModelUnderTrainingRunner *MUTR)
*82d56013Sjoerg    : LogFileName(LogFileName), MUTR(MUTR) {
*82d56013Sjoerg  // The first output is the inlining decision.
*82d56013Sjoerg  if (MUTR)
*82d56013Sjoerg    OutputCount = MUTR->outputLoggedFeatureSpecs().size();
*82d56013Sjoerg  std::vector<LoggedFeatureSpec> FT;
*82d56013Sjoerg
*82d56013Sjoerg  for (size_t I = 0; I < NumberOfFeatures; ++I)
*82d56013Sjoerg    FT.push_back(
*82d56013Sjoerg        {TensorSpec::createSpec<int64_t>(FeatureNameMap.at(I), {1}), None});
*82d56013Sjoerg  if (MUTR && MUTR->outputLoggedFeatureSpecs().size() > 1)
*82d56013Sjoerg    append_range(FT, drop_begin(MUTR->outputLoggedFeatureSpecs()));
*82d56013Sjoerg
*82d56013Sjoerg  DefaultDecisionPos = FT.size();
*82d56013Sjoerg  FT.push_back(
*82d56013Sjoerg      {TensorSpec::createSpec<int64_t>(DefaultDecisionName, {1}), None});
*82d56013Sjoerg
*82d56013Sjoerg  DecisionPos = FT.size();
*82d56013Sjoerg  FT.push_back({TensorSpec::createSpec<int64_t>(DecisionName, {1}), None});
*82d56013Sjoerg
*82d56013Sjoerg  L = std::make_unique<Logger>(
*82d56013Sjoerg      FT, TensorSpec::createSpec<int64_t>(RewardName, {1}),
*82d56013Sjoerg      InlineSizeEstimatorAnalysis::isEvaluatorRequested());
*82d56013Sjoerg}
*82d56013Sjoerg
*82d56013Sjoerg/// Log one inlining event.
*82d56013Sjoergvoid TrainingLogger::logInlineEvent(const InlineEvent &Event,
*82d56013Sjoerg                                    const MLModelRunner &ModelRunner) {
*82d56013Sjoerg  size_t CurrentFeature = 0;
*82d56013Sjoerg  for (; CurrentFeature < NumberOfFeatures; ++CurrentFeature) {
*82d56013Sjoerg    int64_t F = ModelRunner.getFeature(CurrentFeature);
*82d56013Sjoerg    L->logTensorValue(CurrentFeature, &F);
*82d56013Sjoerg  }
*82d56013Sjoerg
*82d56013Sjoerg  for (size_t I = 1; I < OutputCount; ++I) {
*82d56013Sjoerg    const auto &Result = *MUTR->lastEvaluationResult();
*82d56013Sjoerg    auto &Spec = MUTR->outputLoggedFeatureSpecs()[I].Spec;
*82d56013Sjoerg    const char *RawData =
*82d56013Sjoerg        reinterpret_cast<const char *>(Result.getUntypedTensorValue(I));
*82d56013Sjoerg    L->logTensorValue(CurrentFeature, RawData,
*82d56013Sjoerg                      Spec.getElementCount() * Spec.getElementByteSize());
*82d56013Sjoerg    ++CurrentFeature;
*82d56013Sjoerg  }
*82d56013Sjoerg
*82d56013Sjoerg  assert(CurrentFeature == DefaultDecisionPos);
*82d56013Sjoerg  L->logTensorValue(DefaultDecisionPos, &Event.DefaultDecision);
*82d56013Sjoerg  L->logTensorValue(DecisionPos, &Event.AdvisedDecision);
*82d56013Sjoerg  if (InlineSizeEstimatorAnalysis::isEvaluatorRequested())
*82d56013Sjoerg    L->logReward(Event.Reward);
*82d56013Sjoerg
*82d56013Sjoerg  // For debugging / later use
*82d56013Sjoerg  Effects.push_back(Event.Effect);
*82d56013Sjoerg}
*82d56013Sjoerg
*82d56013Sjoergvoid TrainingLogger::print() {
*82d56013Sjoerg  std::error_code EC;
*82d56013Sjoerg  raw_fd_ostream OutFile(LogFileName, EC);
*82d56013Sjoerg  L->print(OutFile);
*82d56013Sjoerg}
*82d56013Sjoerg
*82d56013SjoergDevelopmentModeMLInlineAdvisor::DevelopmentModeMLInlineAdvisor(
*82d56013Sjoerg    Module &M, ModuleAnalysisManager &MAM,
*82d56013Sjoerg    std::unique_ptr<MLModelRunner> ModelRunner,
*82d56013Sjoerg    std::function<bool(CallBase &)> GetDefaultAdvice, bool IsDoingInference,
*82d56013Sjoerg    std::unique_ptr<TrainingLogger> Logger)
*82d56013Sjoerg    : MLInlineAdvisor(M, MAM, std::move(ModelRunner)),
*82d56013Sjoerg      GetDefaultAdvice(GetDefaultAdvice), IsDoingInference(IsDoingInference),
*82d56013Sjoerg      Logger(std::move(Logger)),
*82d56013Sjoerg      InitialNativeSize(isLogging() ? getTotalSizeEstimate() : 0),
*82d56013Sjoerg      CurrentNativeSize(InitialNativeSize) {
*82d56013Sjoerg  // We cannot have the case of neither inference nor logging.
*82d56013Sjoerg  assert(IsDoingInference || isLogging());
*82d56013Sjoerg}
*82d56013Sjoerg
*82d56013SjoergDevelopmentModeMLInlineAdvisor::~DevelopmentModeMLInlineAdvisor() {
*82d56013Sjoerg  if (isLogging())
*82d56013Sjoerg    Logger->print();
*82d56013Sjoerg}
*82d56013Sjoerg
*82d56013SjoergOptional<size_t>
*82d56013SjoergDevelopmentModeMLInlineAdvisor::getNativeSizeEstimate(const Function &F) const {
*82d56013Sjoerg  if (!InlineSizeEstimatorAnalysis::isEvaluatorRequested())
*82d56013Sjoerg    return None;
*82d56013Sjoerg  auto &R =
*82d56013Sjoerg      FAM.getResult<InlineSizeEstimatorAnalysis>(const_cast<Function &>(F));
*82d56013Sjoerg  if (!R) {
*82d56013Sjoerg    F.getParent()->getContext().emitError(
*82d56013Sjoerg        "Native size estimator is not present.");
*82d56013Sjoerg    return 0;
*82d56013Sjoerg  }
*82d56013Sjoerg  return *R;
*82d56013Sjoerg}
*82d56013Sjoerg
*82d56013Sjoergstd::unique_ptr<MLInlineAdvice>
*82d56013SjoergDevelopmentModeMLInlineAdvisor::getMandatoryAdviceImpl(CallBase &CB) {
*82d56013Sjoerg  return std::make_unique<LoggingMLInlineAdvice>(
*82d56013Sjoerg      /*Advisor=*/this,
*82d56013Sjoerg      /*CB=*/CB, /*ORE=*/getCallerORE(CB), /*Recommendation=*/true,
*82d56013Sjoerg      /*Logger=*/*Logger,
*82d56013Sjoerg      /*CallerSizeEstimateBefore=*/getNativeSizeEstimate(*CB.getCaller()),
*82d56013Sjoerg      /*CalleeSizeEstimateBefore=*/
*82d56013Sjoerg      getNativeSizeEstimate(*CB.getCalledFunction()),
*82d56013Sjoerg      /*DefaultDecision=*/true, /*Mandatory*/ true);
*82d56013Sjoerg}
*82d56013Sjoerg
*82d56013Sjoergstd::unique_ptr<MLInlineAdvice>
*82d56013SjoergDevelopmentModeMLInlineAdvisor::getAdviceFromModel(
*82d56013Sjoerg    CallBase &CB, OptimizationRemarkEmitter &ORE) {
*82d56013Sjoerg  if (IsDoingInference && !isLogging())
*82d56013Sjoerg    return MLInlineAdvisor::getAdviceFromModel(CB, ORE);
*82d56013Sjoerg
*82d56013Sjoerg  bool DefaultAdvice = GetDefaultAdvice(CB);
*82d56013Sjoerg  auto Recommendation = IsDoingInference ? ModelRunner->run() : DefaultAdvice;
*82d56013Sjoerg  return std::make_unique<LoggingMLInlineAdvice>(
*82d56013Sjoerg      /*Advisor=*/this,
*82d56013Sjoerg      /*CB=*/CB, /*ORE=*/ORE, /*Recommendation=*/Recommendation,
*82d56013Sjoerg      /*Logger=*/*Logger,
*82d56013Sjoerg      /*CallerSizeEstimateBefore=*/getNativeSizeEstimate(*CB.getCaller()),
*82d56013Sjoerg      /*CalleeSizeEstimateBefore=*/
*82d56013Sjoerg      getNativeSizeEstimate(*CB.getCalledFunction()),
*82d56013Sjoerg      /*DefaultDecision=*/DefaultAdvice);
*82d56013Sjoerg}
*82d56013Sjoerg
*82d56013Sjoergsize_t DevelopmentModeMLInlineAdvisor::getTotalSizeEstimate() {
*82d56013Sjoerg  if (!InlineSizeEstimatorAnalysis::isEvaluatorRequested())
*82d56013Sjoerg    return 0;
*82d56013Sjoerg  size_t Ret = 0;
*82d56013Sjoerg  for (auto &F : M) {
*82d56013Sjoerg    if (F.isDeclaration())
*82d56013Sjoerg      continue;
*82d56013Sjoerg    if (isFunctionDeleted(&F))
*82d56013Sjoerg      continue;
*82d56013Sjoerg    Ret += *getNativeSizeEstimate(F);
*82d56013Sjoerg  }
*82d56013Sjoerg  return Ret;
*82d56013Sjoerg}
*82d56013Sjoerg
*82d56013SjoergModelUnderTrainingRunner::ModelUnderTrainingRunner(LLVMContext &Ctx,
*82d56013Sjoerg                                                   const std::string &ModelPath)
*82d56013Sjoerg    : MLModelRunner(Ctx) {
*82d56013Sjoerg  std::vector<TensorSpec> InputSpecs;
*82d56013Sjoerg  for (size_t I = 0; I < NumberOfFeatures; ++I)
*82d56013Sjoerg    InputSpecs.push_back(
*82d56013Sjoerg        TensorSpec::createSpec<int64_t>(TFFeedPrefix + FeatureNameMap[I], {1}));
*82d56013Sjoerg  append_range(InputSpecs, TrainingOnlyFeatures);
*82d56013Sjoerg  if (auto MaybeOutSpecs =
*82d56013Sjoerg          loadOutputSpecs(Ctx, DecisionName, ModelPath, TFOutputSpecOverride))
*82d56013Sjoerg    OutputSpecs = std::move(*MaybeOutSpecs);
*82d56013Sjoerg  else
*82d56013Sjoerg    return;
*82d56013Sjoerg
*82d56013Sjoerg  Evaluator = std::make_unique<TFModelEvaluator>(
*82d56013Sjoerg      ModelPath, InputSpecs, [&](size_t I) { return OutputSpecs[I].Spec; },
*82d56013Sjoerg      OutputSpecs.size());
*82d56013Sjoerg  if (!Evaluator || !Evaluator->isValid()) {
*82d56013Sjoerg    Ctx.emitError("Failed to create inliner saved model evaluator");
*82d56013Sjoerg    Evaluator.reset();
*82d56013Sjoerg    return;
*82d56013Sjoerg  }
*82d56013Sjoerg}
*82d56013Sjoerg
*82d56013Sjoergbool ModelUnderTrainingRunner::run() {
*82d56013Sjoerg  LastEvaluationResult = Evaluator->evaluate();
*82d56013Sjoerg  if (!LastEvaluationResult.hasValue()) {
*82d56013Sjoerg    Ctx.emitError("Error evaluating model.");
*82d56013Sjoerg    return false;
*82d56013Sjoerg  }
*82d56013Sjoerg  int64_t Decision = *LastEvaluationResult->getTensorValue<int64_t>(0);
*82d56013Sjoerg  return static_cast<bool>(Decision);
*82d56013Sjoerg}
*82d56013Sjoerg
*82d56013Sjoergint64_t ModelUnderTrainingRunner::getFeature(int Index) const {
*82d56013Sjoerg  return *Evaluator->getInput<int64_t>(Index);
*82d56013Sjoerg}
*82d56013Sjoerg
*82d56013Sjoergvoid ModelUnderTrainingRunner::setFeature(FeatureIndex Index, int64_t Value) {
*82d56013Sjoerg  size_t NumericIndex = static_cast<size_t>(Index);
*82d56013Sjoerg  *(Evaluator->getInput<int64_t>(NumericIndex)) = Value;
*82d56013Sjoerg}
*82d56013Sjoerg
*82d56013Sjoergstd::unique_ptr<InlineAdvisor> llvm::getDevelopmentModeAdvisor(
*82d56013Sjoerg    Module &M, ModuleAnalysisManager &MAM,
*82d56013Sjoerg    std::function<bool(CallBase &)> GetDefaultAdvice) {
*82d56013Sjoerg  auto &Ctx = M.getContext();
*82d56013Sjoerg  std::unique_ptr<MLModelRunner> Runner;
*82d56013Sjoerg  ModelUnderTrainingRunner *MUTRPtr = nullptr;
*82d56013Sjoerg  bool IsDoingInference = false;
*82d56013Sjoerg  if (TFModelUnderTrainingPath.empty())
*82d56013Sjoerg    Runner.reset(new NoInferenceModelRunner(Ctx));
*82d56013Sjoerg  else {
*82d56013Sjoerg    auto MUTR = std::make_unique<ModelUnderTrainingRunner>(
*82d56013Sjoerg        Ctx, TFModelUnderTrainingPath);
*82d56013Sjoerg    if (!MUTR || !MUTR->isValid()) {
*82d56013Sjoerg      Ctx.emitError("Could not load the policy model from the provided path");
*82d56013Sjoerg      return nullptr;
*82d56013Sjoerg    }
*82d56013Sjoerg    IsDoingInference = true;
*82d56013Sjoerg    MUTRPtr = MUTR.get();
*82d56013Sjoerg    Runner = std::move(MUTR);
*82d56013Sjoerg  }
*82d56013Sjoerg  std::unique_ptr<TrainingLogger> Logger;
*82d56013Sjoerg  if (!TrainingLog.empty())
*82d56013Sjoerg    Logger = std::make_unique<TrainingLogger>(TrainingLog, MUTRPtr);
*82d56013Sjoerg
*82d56013Sjoerg  return std::make_unique<DevelopmentModeMLInlineAdvisor>(
*82d56013Sjoerg      M, MAM, std::move(Runner), GetDefaultAdvice, IsDoingInference,
*82d56013Sjoerg      std::move(Logger));
*82d56013Sjoerg}
*82d56013Sjoerg#endif // defined(LLVM_HAVE_TF_API)