lib/Analysis/DevelopmentModeInlineAdvisor.cpp

e8d8bef9SDimitry Andric//===- DevelopmentModeInlineAdvisor.cpp - runtime-loadable model runner  --===//
e8d8bef9SDimitry Andric//
349cc55cSDimitry Andric// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
349cc55cSDimitry Andric// See https://llvm.org/LICENSE.txt for license information.
349cc55cSDimitry Andric// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
e8d8bef9SDimitry Andric//
e8d8bef9SDimitry Andric//===----------------------------------------------------------------------===//
e8d8bef9SDimitry Andric//
*c9157d92SDimitry Andric// This file implements a model runner using TFLite, allowing the
e8d8bef9SDimitry Andric// loading of a model from a command line option.
e8d8bef9SDimitry Andric//
e8d8bef9SDimitry Andric//===----------------------------------------------------------------------===//
bdd1243dSDimitry Andric#include "llvm/Analysis/TensorSpec.h"
e8d8bef9SDimitry Andric#include "llvm/Config/config.h"
bdd1243dSDimitry Andric#if defined(LLVM_HAVE_TFLITE)
e8d8bef9SDimitry Andric
04eeddc0SDimitry Andric#include "llvm/ADT/BitVector.h"
e8d8bef9SDimitry Andric#include "llvm/Analysis/CallGraph.h"
e8d8bef9SDimitry Andric#include "llvm/Analysis/InlineSizeEstimatorAnalysis.h"
e8d8bef9SDimitry Andric#include "llvm/Analysis/MLInlineAdvisor.h"
0eae32dcSDimitry Andric#include "llvm/Analysis/ModelUnderTrainingRunner.h"
0eae32dcSDimitry Andric#include "llvm/Analysis/NoInferenceModelRunner.h"
e8d8bef9SDimitry Andric#include "llvm/Analysis/Utils/TFUtils.h"
bdd1243dSDimitry Andric#include "llvm/Analysis/Utils/TrainingLogger.h"
e8d8bef9SDimitry Andric#include "llvm/IR/LLVMContext.h"
e8d8bef9SDimitry Andric#include "llvm/Support/CommandLine.h"
e8d8bef9SDimitry Andric#include "llvm/Support/ManagedStatic.h"
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric#include <vector>
bdd1243dSDimitry Andric#include <optional>
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andricusing namespace llvm;
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andricstatic cl::opt<std::string> TrainingLog(
e8d8bef9SDimitry Andric    "training-log", cl::Hidden,
e8d8bef9SDimitry Andric    cl::desc("Path where the development - mode inlining log is saved."));
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andricstatic cl::opt<std::string> TFModelUnderTrainingPath(
e8d8bef9SDimitry Andric    "ml-inliner-model-under-training", cl::Hidden,
e8d8bef9SDimitry Andric    cl::desc(R"(Path to SavedModel from the previous training iteration.
e8d8bef9SDimitry AndricThe directory is also expected to contain a JSON specification of the
e8d8bef9SDimitry Andricoutputs expected to be logged, where the first entry must be the
e8d8bef9SDimitry Andricinlining decision. The file containing the specification should be
e8d8bef9SDimitry Andriccalled output_spec.json. The expected JSON value is an array of
e8d8bef9SDimitry Andricdictionaries. Each dictionary should have 2 keys:
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric- "tensor_spec, followed by the TensorSpec description of the
e8d8bef9SDimitry Andricoutput; and
e8d8bef9SDimitry Andric- "logging_name", a string indicating the name to use when
e8d8bef9SDimitry Andriclogging the output values.
e8d8bef9SDimitry Andric
e8d8bef9SDimitry AndricExample:
e8d8bef9SDimitry Andric[
e8d8bef9SDimitry Andric  {
e8d8bef9SDimitry Andric    "logging_name" : "some_name",
e8d8bef9SDimitry Andric    "tensor_spec" : {
e8d8bef9SDimitry Andric      "name" : "model_name",
e8d8bef9SDimitry Andric      "port" : 0,
e8d8bef9SDimitry Andric      "shape" : [2, 3],
e8d8bef9SDimitry Andric      "type" : "float"
e8d8bef9SDimitry Andric      }
e8d8bef9SDimitry Andric  }
e8d8bef9SDimitry Andric]
e8d8bef9SDimitry Andric
e8d8bef9SDimitry AndricThe first value must always correspond to the decision.)"));
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andricstatic cl::opt<std::string> TFOutputSpecOverride(
e8d8bef9SDimitry Andric    "ml-inliner-output-spec-override", cl::Hidden,
e8d8bef9SDimitry Andric    cl::desc("Override the path to the output spec json file. See "
e8d8bef9SDimitry Andric             "-ml-inliner-model-under-training documentation for the "
e8d8bef9SDimitry Andric             "specification of that file."));
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andricstatic cl::opt<std::string> TFFeedPrefix("ml-inliner-trained-model-feed-prefix",
e8d8bef9SDimitry Andric                                         cl::Hidden, cl::init("action_"),
e8d8bef9SDimitry Andric                                         cl::desc("Prefix for feature names."));
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andricnamespace {
/// One inlining decision and its outcome, as handed to TrainingLogger.
struct InlineEvent {
  /// The decision the default policy would have taken for this call site.
  int64_t DefaultDecision{0};

  /// The decision that was actually advised. Identical to DefaultDecision
  /// when training off the default policy.
  int64_t AdvisedDecision{0};

  /// Whether inlining really took place. 'false' on an inline error even if
  /// AdvisedDecision was true; otherwise it agrees with AdvisedDecision.
  bool Effect{false};

  /// Size delta caused by the decision: size_after - size_before.
  int64_t Reward{0};
};
e8d8bef9SDimitry Andric
bdd1243dSDimitry Andric/// Collect data we may use for training a model.
e8d8bef9SDimitry Andricclass TrainingLogger final {
e8d8bef9SDimitry Andricpublic:
e8d8bef9SDimitry Andric  TrainingLogger(StringRef LogFileName, const ModelUnderTrainingRunner *MUTR);
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  /// Log one inlining event.
e8d8bef9SDimitry Andric  void logInlineEvent(const InlineEvent &Event,
e8d8bef9SDimitry Andric                      const MLModelRunner &ModelRunner);
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andricprivate:
e8d8bef9SDimitry Andric  StringRef LogFileName;
e8d8bef9SDimitry Andric  const ModelUnderTrainingRunner *const MUTR;
e8d8bef9SDimitry Andric  std::unique_ptr<Logger> L;
04eeddc0SDimitry Andric  BitVector Effects;
e8d8bef9SDimitry Andric  /// Set these 2 clearly OOB, to make sure we set them later.
e8d8bef9SDimitry Andric  size_t DefaultDecisionPos = std::numeric_limits<size_t>::max();
e8d8bef9SDimitry Andric  size_t DecisionPos = std::numeric_limits<size_t>::max();
e8d8bef9SDimitry Andric};
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric/// An extension of the MLInlineAdvisor for the 'development' mode, targeting
e8d8bef9SDimitry Andric/// the offline training scenario. Note that training happens outside of the
e8d8bef9SDimitry Andric/// compiler, this facility is concerned with producing training data ("logs").
e8d8bef9SDimitry Andric/// This InlineAdvisor can operate in the following modes:
e8d8bef9SDimitry Andric///
e8d8bef9SDimitry Andric/// 1) collect logs for the default policy. This is useful for bootstrapping
e8d8bef9SDimitry Andric/// training, which will be considerably faster by starting from a reasonable
e8d8bef9SDimitry Andric/// policy.
e8d8bef9SDimitry Andric///
e8d8bef9SDimitry Andric/// 2) collect logs for the ML policy, using a model from a previous
e8d8bef9SDimitry Andric/// training. Potentially, that model uses internally some small random
e8d8bef9SDimitry Andric/// perturbation of its weights, to induce exploration (setting this up is the
e8d8bef9SDimitry Andric/// responsibility of the training algorithm). The logs would then be used to
e8d8bef9SDimitry Andric/// retrain and improve on this model.
e8d8bef9SDimitry Andric///
e8d8bef9SDimitry Andric/// 3) use the provided model, with no logging. This is useful for end to end
e8d8bef9SDimitry Andric/// validation - the model, in this case, is a release candidate and shouldn't
e8d8bef9SDimitry Andric/// have random perturbations. It is a convenience feature: rather than needing
e8d8bef9SDimitry Andric/// to take the release candidate model and compile it in 'release' mode,
e8d8bef9SDimitry Andric/// validate it, then potentially discard it, it's easier to just pass the model
e8d8bef9SDimitry Andric/// to the compiler, albeit compilation would be slower, as a one-off. Once the
e8d8bef9SDimitry Andric/// model behaves satisfactorily, it can be compiled AOT, for efficiency, in
e8d8bef9SDimitry Andric/// release mode. The expectation is that a well-trained model provides a good
e8d8bef9SDimitry Andric/// policy over a sufficiently diverse codebase, over many changes (i.e.
e8d8bef9SDimitry Andric/// training happens seldom).
e8d8bef9SDimitry Andricclass DevelopmentModeMLInlineAdvisor : public MLInlineAdvisor {
e8d8bef9SDimitry Andricpublic:
e8d8bef9SDimitry Andric  DevelopmentModeMLInlineAdvisor(
e8d8bef9SDimitry Andric      Module &M, ModuleAnalysisManager &MAM,
e8d8bef9SDimitry Andric      std::unique_ptr<MLModelRunner> ModelRunner,
04eeddc0SDimitry Andric      std::function<bool(CallBase &)> GetDefaultAdvice,
e8d8bef9SDimitry Andric      std::unique_ptr<TrainingLogger> Logger);
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  size_t getTotalSizeEstimate();
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  void updateNativeSizeEstimate(int64_t Change) {
e8d8bef9SDimitry Andric    *CurrentNativeSize += Change;
e8d8bef9SDimitry Andric  }
e8d8bef9SDimitry Andric  void resetNativeSize(Function *F) {
fe6060f1SDimitry Andric    PreservedAnalyses PA = PreservedAnalyses::all();
fe6060f1SDimitry Andric    PA.abandon<InlineSizeEstimatorAnalysis>();
fe6060f1SDimitry Andric    FAM.invalidate(*F, PA);
e8d8bef9SDimitry Andric  }
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  std::unique_ptr<MLInlineAdvice>
e8d8bef9SDimitry Andric  getAdviceFromModel(CallBase &CB, OptimizationRemarkEmitter &ORE) override;
e8d8bef9SDimitry Andric
bdd1243dSDimitry Andric  std::optional<size_t> getNativeSizeEstimate(const Function &F) const;
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andricprivate:
e8d8bef9SDimitry Andric  bool isLogging() const { return !!Logger; }
e8d8bef9SDimitry Andric  std::unique_ptr<MLInlineAdvice> getMandatoryAdviceImpl(CallBase &CB) override;
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  const bool IsDoingInference;
e8d8bef9SDimitry Andric  std::unique_ptr<TrainingLogger> Logger;
e8d8bef9SDimitry Andric
bdd1243dSDimitry Andric  const std::optional<int32_t> InitialNativeSize;
bdd1243dSDimitry Andric  std::optional<int32_t> CurrentNativeSize;
e8d8bef9SDimitry Andric};
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric/// A variant of MLInlineAdvice that tracks all non-trivial inlining
e8d8bef9SDimitry Andric/// decisions, for training/logging.
e8d8bef9SDimitry Andricclass LoggingMLInlineAdvice : public MLInlineAdvice {
e8d8bef9SDimitry Andricpublic:
e8d8bef9SDimitry Andric  LoggingMLInlineAdvice(DevelopmentModeMLInlineAdvisor *Advisor, CallBase &CB,
e8d8bef9SDimitry Andric                        OptimizationRemarkEmitter &ORE, bool Recommendation,
e8d8bef9SDimitry Andric                        TrainingLogger &Logger,
bdd1243dSDimitry Andric                        std::optional<size_t> CallerSizeEstimateBefore,
bdd1243dSDimitry Andric                        std::optional<size_t> CalleeSizeEstimateBefore,
e8d8bef9SDimitry Andric                        bool DefaultDecision, bool Mandatory = false)
e8d8bef9SDimitry Andric      : MLInlineAdvice(Advisor, CB, ORE, Recommendation), Logger(Logger),
e8d8bef9SDimitry Andric        CallerSizeEstimateBefore(CallerSizeEstimateBefore),
e8d8bef9SDimitry Andric        CalleeSizeEstimateBefore(CalleeSizeEstimateBefore),
e8d8bef9SDimitry Andric        DefaultDecision(DefaultDecision), Mandatory(Mandatory) {}
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  virtual ~LoggingMLInlineAdvice() = default;
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andricprivate:
e8d8bef9SDimitry Andric  DevelopmentModeMLInlineAdvisor *getAdvisor() const {
e8d8bef9SDimitry Andric    return static_cast<DevelopmentModeMLInlineAdvisor *>(Advisor);
e8d8bef9SDimitry Andric  }
e8d8bef9SDimitry Andric  void recordInliningImpl() override {
e8d8bef9SDimitry Andric    MLInlineAdvice::recordInliningImpl();
e8d8bef9SDimitry Andric    getAdvisor()->resetNativeSize(Caller);
e8d8bef9SDimitry Andric    int Reward = std::numeric_limits<int>::max();
e8d8bef9SDimitry Andric    if (InlineSizeEstimatorAnalysis::isEvaluatorRequested() &&
e8d8bef9SDimitry Andric        !getAdvisor()->isForcedToStop()) {
e8d8bef9SDimitry Andric      int NativeSizeAfter = *getAdvisor()->getNativeSizeEstimate(*Caller) +
e8d8bef9SDimitry Andric                            *CalleeSizeEstimateBefore;
e8d8bef9SDimitry Andric      Reward = NativeSizeAfter -
e8d8bef9SDimitry Andric               (*CallerSizeEstimateBefore + *CalleeSizeEstimateBefore);
e8d8bef9SDimitry Andric      getAdvisor()->updateNativeSizeEstimate(Reward);
e8d8bef9SDimitry Andric    }
e8d8bef9SDimitry Andric    log(Reward, /*Success=*/true);
e8d8bef9SDimitry Andric  }
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  void recordInliningWithCalleeDeletedImpl() override {
e8d8bef9SDimitry Andric    MLInlineAdvice::recordInliningWithCalleeDeletedImpl();
e8d8bef9SDimitry Andric    getAdvisor()->resetNativeSize(Caller);
e8d8bef9SDimitry Andric    if (InlineSizeEstimatorAnalysis::isEvaluatorRequested() &&
e8d8bef9SDimitry Andric        !getAdvisor()->isForcedToStop()) {
e8d8bef9SDimitry Andric      int NativeSizeAfter = *getAdvisor()->getNativeSizeEstimate(*Caller);
e8d8bef9SDimitry Andric      int Reward = NativeSizeAfter -
e8d8bef9SDimitry Andric                   (*CallerSizeEstimateBefore + *CalleeSizeEstimateBefore);
e8d8bef9SDimitry Andric      getAdvisor()->updateNativeSizeEstimate(Reward);
e8d8bef9SDimitry Andric      log(Reward, /*Success=*/true);
349cc55cSDimitry Andric    } else {
349cc55cSDimitry Andric      log(NoReward, /*Success=*/true);
e8d8bef9SDimitry Andric    }
e8d8bef9SDimitry Andric  }
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  void recordUnsuccessfulInliningImpl(const InlineResult &Result) override {
e8d8bef9SDimitry Andric    MLInlineAdvice::recordUnsuccessfulInliningImpl(Result);
e8d8bef9SDimitry Andric    log(NoReward, /*Success=*/false);
e8d8bef9SDimitry Andric  }
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  void recordUnattemptedInliningImpl() override {
e8d8bef9SDimitry Andric    MLInlineAdvice::recordUnattemptedInliningImpl();
e8d8bef9SDimitry Andric    log(NoReward, /*Success=*/false);
e8d8bef9SDimitry Andric  }
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  void log(int64_t Reward, bool Success) {
e8d8bef9SDimitry Andric    if (Mandatory)
e8d8bef9SDimitry Andric      return;
e8d8bef9SDimitry Andric    InlineEvent Event;
e8d8bef9SDimitry Andric    Event.AdvisedDecision = isInliningRecommended();
e8d8bef9SDimitry Andric    Event.DefaultDecision = DefaultDecision;
e8d8bef9SDimitry Andric    Event.Effect = Success;
e8d8bef9SDimitry Andric    Event.Reward = Reward;
e8d8bef9SDimitry Andric    Logger.logInlineEvent(Event, getAdvisor()->getModelRunner());
e8d8bef9SDimitry Andric  }
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  static const int64_t NoReward = 0;
e8d8bef9SDimitry Andric  TrainingLogger &Logger;
bdd1243dSDimitry Andric  const std::optional<size_t> CallerSizeEstimateBefore;
bdd1243dSDimitry Andric  const std::optional<size_t> CalleeSizeEstimateBefore;
e8d8bef9SDimitry Andric  const int64_t DefaultDecision;
e8d8bef9SDimitry Andric  const int64_t Mandatory;
e8d8bef9SDimitry Andric};
e8d8bef9SDimitry Andric
0eae32dcSDimitry Andricstatic const std::vector<TensorSpec> TrainingOnlyFeatures{
e8d8bef9SDimitry Andric    TensorSpec::createSpec<int64_t>(TFFeedPrefix + "inlining_default", {1}),
e8d8bef9SDimitry Andric    TensorSpec::createSpec<float>(TFFeedPrefix + "discount", {1}),
e8d8bef9SDimitry Andric    TensorSpec::createSpec<float>(TFFeedPrefix + "reward", {1}),
e8d8bef9SDimitry Andric    TensorSpec::createSpec<int32_t>(TFFeedPrefix + "step_type", {1})};
0eae32dcSDimitry Andric
0eae32dcSDimitry Andricstatic const std::vector<TensorSpec> getInputFeatures() {
0eae32dcSDimitry Andric  std::vector<TensorSpec> InputSpecs;
0eae32dcSDimitry Andric  for (size_t I = 0; I < NumberOfFeatures; ++I)
81ad6265SDimitry Andric    InputSpecs.push_back(TensorSpec::createSpec<int64_t>(
81ad6265SDimitry Andric        TFFeedPrefix + FeatureMap[I].name(), FeatureMap[I].shape()));
0eae32dcSDimitry Andric  append_range(InputSpecs, TrainingOnlyFeatures);
0eae32dcSDimitry Andric  return InputSpecs;
0eae32dcSDimitry Andric}
0eae32dcSDimitry Andric
e8d8bef9SDimitry Andric} // namespace
e8d8bef9SDimitry Andric
e8d8bef9SDimitry AndricTrainingLogger::TrainingLogger(StringRef LogFileName,
e8d8bef9SDimitry Andric                               const ModelUnderTrainingRunner *MUTR)
e8d8bef9SDimitry Andric    : LogFileName(LogFileName), MUTR(MUTR) {
e8d8bef9SDimitry Andric  // The first output is the inlining decision.
bdd1243dSDimitry Andric  std::vector<TensorSpec> FT(FeatureMap.begin(), FeatureMap.end());
e8d8bef9SDimitry Andric
bdd1243dSDimitry Andric  if (MUTR)
bdd1243dSDimitry Andric    append_range(FT, MUTR->extraOutputsForLoggingSpecs());
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  DefaultDecisionPos = FT.size();
fe013be4SDimitry Andric  FT.push_back(DefaultDecisionSpec);
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  DecisionPos = FT.size();
fe013be4SDimitry Andric  FT.push_back(InlineDecisionSpec);
bdd1243dSDimitry Andric  std::error_code EC;
bdd1243dSDimitry Andric  auto OS = std::make_unique<raw_fd_ostream>(TrainingLog, EC);
bdd1243dSDimitry Andric  if (EC)
bdd1243dSDimitry Andric    dbgs() << (EC.message() + ":" + TrainingLog);
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  L = std::make_unique<Logger>(
bdd1243dSDimitry Andric      std::move(OS), FT, TensorSpec::createSpec<int64_t>(RewardName, {1}),
e8d8bef9SDimitry Andric      InlineSizeEstimatorAnalysis::isEvaluatorRequested());
bdd1243dSDimitry Andric  L->switchContext("");
e8d8bef9SDimitry Andric}
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric/// Log one inlining event.
e8d8bef9SDimitry Andricvoid TrainingLogger::logInlineEvent(const InlineEvent &Event,
e8d8bef9SDimitry Andric                                    const MLModelRunner &ModelRunner) {
bdd1243dSDimitry Andric  L->startObservation();
e8d8bef9SDimitry Andric  size_t CurrentFeature = 0;
bdd1243dSDimitry Andric  for (; CurrentFeature < NumberOfFeatures; ++CurrentFeature)
bdd1243dSDimitry Andric    L->logTensorValue(CurrentFeature,
bdd1243dSDimitry Andric                      reinterpret_cast<const char *>(
bdd1243dSDimitry Andric                          ModelRunner.getTensorUntyped(CurrentFeature)));
e8d8bef9SDimitry Andric
bdd1243dSDimitry Andric  if (MUTR)
bdd1243dSDimitry Andric    for (size_t I = 0; I < MUTR->extraOutputsForLoggingSpecs().size(); ++I) {
e8d8bef9SDimitry Andric      const char *RawData =
bdd1243dSDimitry Andric          reinterpret_cast<const char *>(MUTR->getUntypedExtraOutputValue(I));
bdd1243dSDimitry Andric      L->logTensorValue(CurrentFeature, RawData);
e8d8bef9SDimitry Andric      ++CurrentFeature;
e8d8bef9SDimitry Andric    }
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  assert(CurrentFeature == DefaultDecisionPos);
bdd1243dSDimitry Andric  L->logTensorValue(DefaultDecisionPos,
bdd1243dSDimitry Andric                    reinterpret_cast<const char *>(&Event.DefaultDecision));
bdd1243dSDimitry Andric  L->logTensorValue(DecisionPos,
bdd1243dSDimitry Andric                    reinterpret_cast<const char *>(&Event.AdvisedDecision));
bdd1243dSDimitry Andric  L->endObservation();
e8d8bef9SDimitry Andric  if (InlineSizeEstimatorAnalysis::isEvaluatorRequested())
bdd1243dSDimitry Andric    L->logReward(Event.Reward);
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  // For debugging / later use
e8d8bef9SDimitry Andric  Effects.push_back(Event.Effect);
e8d8bef9SDimitry Andric}
e8d8bef9SDimitry Andric
e8d8bef9SDimitry AndricDevelopmentModeMLInlineAdvisor::DevelopmentModeMLInlineAdvisor(
e8d8bef9SDimitry Andric    Module &M, ModuleAnalysisManager &MAM,
e8d8bef9SDimitry Andric    std::unique_ptr<MLModelRunner> ModelRunner,
04eeddc0SDimitry Andric    std::function<bool(CallBase &)> GetDefaultAdvice,
e8d8bef9SDimitry Andric    std::unique_ptr<TrainingLogger> Logger)
fe013be4SDimitry Andric    : MLInlineAdvisor(M, MAM, std::move(ModelRunner), GetDefaultAdvice),
04eeddc0SDimitry Andric      IsDoingInference(isa<ModelUnderTrainingRunner>(getModelRunner())),
e8d8bef9SDimitry Andric      Logger(std::move(Logger)),
e8d8bef9SDimitry Andric      InitialNativeSize(isLogging() ? getTotalSizeEstimate() : 0),
e8d8bef9SDimitry Andric      CurrentNativeSize(InitialNativeSize) {
e8d8bef9SDimitry Andric  // We cannot have the case of neither inference nor logging.
e8d8bef9SDimitry Andric  assert(IsDoingInference || isLogging());
e8d8bef9SDimitry Andric}
e8d8bef9SDimitry Andric
bdd1243dSDimitry Andricstd::optional<size_t>
e8d8bef9SDimitry AndricDevelopmentModeMLInlineAdvisor::getNativeSizeEstimate(const Function &F) const {
e8d8bef9SDimitry Andric  if (!InlineSizeEstimatorAnalysis::isEvaluatorRequested())
bdd1243dSDimitry Andric    return std::nullopt;
e8d8bef9SDimitry Andric  auto &R =
e8d8bef9SDimitry Andric      FAM.getResult<InlineSizeEstimatorAnalysis>(const_cast<Function &>(F));
e8d8bef9SDimitry Andric  if (!R) {
e8d8bef9SDimitry Andric    F.getParent()->getContext().emitError(
e8d8bef9SDimitry Andric        "Native size estimator is not present.");
e8d8bef9SDimitry Andric    return 0;
e8d8bef9SDimitry Andric  }
e8d8bef9SDimitry Andric  return *R;
e8d8bef9SDimitry Andric}
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andricstd::unique_ptr<MLInlineAdvice>
e8d8bef9SDimitry AndricDevelopmentModeMLInlineAdvisor::getMandatoryAdviceImpl(CallBase &CB) {
e8d8bef9SDimitry Andric  return std::make_unique<LoggingMLInlineAdvice>(
e8d8bef9SDimitry Andric      /*Advisor=*/this,
e8d8bef9SDimitry Andric      /*CB=*/CB, /*ORE=*/getCallerORE(CB), /*Recommendation=*/true,
e8d8bef9SDimitry Andric      /*Logger=*/*Logger,
e8d8bef9SDimitry Andric      /*CallerSizeEstimateBefore=*/getNativeSizeEstimate(*CB.getCaller()),
e8d8bef9SDimitry Andric      /*CalleeSizeEstimateBefore=*/
e8d8bef9SDimitry Andric      getNativeSizeEstimate(*CB.getCalledFunction()),
e8d8bef9SDimitry Andric      /*DefaultDecision=*/true, /*Mandatory*/ true);
e8d8bef9SDimitry Andric}
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andricstd::unique_ptr<MLInlineAdvice>
e8d8bef9SDimitry AndricDevelopmentModeMLInlineAdvisor::getAdviceFromModel(
e8d8bef9SDimitry Andric    CallBase &CB, OptimizationRemarkEmitter &ORE) {
e8d8bef9SDimitry Andric  if (IsDoingInference && !isLogging())
e8d8bef9SDimitry Andric    return MLInlineAdvisor::getAdviceFromModel(CB, ORE);
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  bool DefaultAdvice = GetDefaultAdvice(CB);
0eae32dcSDimitry Andric  auto Recommendation =
0eae32dcSDimitry Andric      IsDoingInference ? static_cast<bool>(ModelRunner->evaluate<int64_t>())
0eae32dcSDimitry Andric                       : DefaultAdvice;
e8d8bef9SDimitry Andric  return std::make_unique<LoggingMLInlineAdvice>(
e8d8bef9SDimitry Andric      /*Advisor=*/this,
e8d8bef9SDimitry Andric      /*CB=*/CB, /*ORE=*/ORE, /*Recommendation=*/Recommendation,
e8d8bef9SDimitry Andric      /*Logger=*/*Logger,
e8d8bef9SDimitry Andric      /*CallerSizeEstimateBefore=*/getNativeSizeEstimate(*CB.getCaller()),
e8d8bef9SDimitry Andric      /*CalleeSizeEstimateBefore=*/
e8d8bef9SDimitry Andric      getNativeSizeEstimate(*CB.getCalledFunction()),
e8d8bef9SDimitry Andric      /*DefaultDecision=*/DefaultAdvice);
e8d8bef9SDimitry Andric}
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andricsize_t DevelopmentModeMLInlineAdvisor::getTotalSizeEstimate() {
e8d8bef9SDimitry Andric  if (!InlineSizeEstimatorAnalysis::isEvaluatorRequested())
e8d8bef9SDimitry Andric    return 0;
e8d8bef9SDimitry Andric  size_t Ret = 0;
e8d8bef9SDimitry Andric  for (auto &F : M) {
e8d8bef9SDimitry Andric    if (F.isDeclaration())
e8d8bef9SDimitry Andric      continue;
e8d8bef9SDimitry Andric    Ret += *getNativeSizeEstimate(F);
e8d8bef9SDimitry Andric  }
e8d8bef9SDimitry Andric  return Ret;
e8d8bef9SDimitry Andric}
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andricstd::unique_ptr<InlineAdvisor> llvm::getDevelopmentModeAdvisor(
e8d8bef9SDimitry Andric    Module &M, ModuleAnalysisManager &MAM,
e8d8bef9SDimitry Andric    std::function<bool(CallBase &)> GetDefaultAdvice) {
e8d8bef9SDimitry Andric  auto &Ctx = M.getContext();
e8d8bef9SDimitry Andric  std::unique_ptr<MLModelRunner> Runner;
e8d8bef9SDimitry Andric  if (TFModelUnderTrainingPath.empty())
0eae32dcSDimitry Andric    Runner.reset(new NoInferenceModelRunner(Ctx, getInputFeatures()));
04eeddc0SDimitry Andric  else
04eeddc0SDimitry Andric    Runner = ModelUnderTrainingRunner::createAndEnsureValid(
04eeddc0SDimitry Andric        Ctx, TFModelUnderTrainingPath, DecisionName, getInputFeatures(),
04eeddc0SDimitry Andric        TFOutputSpecOverride);
04eeddc0SDimitry Andric  if (!Runner)
e8d8bef9SDimitry Andric    return nullptr;
e8d8bef9SDimitry Andric  std::unique_ptr<TrainingLogger> Logger;
e8d8bef9SDimitry Andric  if (!TrainingLog.empty())
04eeddc0SDimitry Andric    Logger = std::make_unique<TrainingLogger>(
04eeddc0SDimitry Andric        TrainingLog, dyn_cast<ModelUnderTrainingRunner>(Runner.get()));
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  return std::make_unique<DevelopmentModeMLInlineAdvisor>(
04eeddc0SDimitry Andric      M, MAM, std::move(Runner), GetDefaultAdvice, std::move(Logger));
e8d8bef9SDimitry Andric}
bdd1243dSDimitry Andric#endif // defined(LLVM_HAVE_TFLITE)