lib/Analysis/DevelopmentModeInlineAdvisor.cpp

e8d8bef9SDimitry Andric//===- DevelopmentModeInlineAdvisor.cpp - runtime-loadable model runner  --===//
e8d8bef9SDimitry Andric//
e8d8bef9SDimitry Andric//                     The LLVM Compiler Infrastructure
e8d8bef9SDimitry Andric//
e8d8bef9SDimitry Andric// This file is distributed under the University of Illinois Open Source
e8d8bef9SDimitry Andric// License. See LICENSE.TXT for details.
e8d8bef9SDimitry Andric//
e8d8bef9SDimitry Andric//===----------------------------------------------------------------------===//
e8d8bef9SDimitry Andric//
e8d8bef9SDimitry Andric// This file implements a model runner using Tensorflow C APIs, allowing the
e8d8bef9SDimitry Andric// loading of a model from a command line option.
e8d8bef9SDimitry Andric//
e8d8bef9SDimitry Andric//===----------------------------------------------------------------------===//
e8d8bef9SDimitry Andric#include "llvm/Config/config.h"
e8d8bef9SDimitry Andric#if defined(LLVM_HAVE_TF_API)
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric#include "llvm/Analysis/CallGraph.h"
e8d8bef9SDimitry Andric#include "llvm/Analysis/InlineSizeEstimatorAnalysis.h"
e8d8bef9SDimitry Andric#include "llvm/Analysis/MLInlineAdvisor.h"
e8d8bef9SDimitry Andric#include "llvm/Analysis/Utils/TFUtils.h"
e8d8bef9SDimitry Andric#include "llvm/IR/LLVMContext.h"
e8d8bef9SDimitry Andric#include "llvm/Support/CommandLine.h"
e8d8bef9SDimitry Andric#include "llvm/Support/ManagedStatic.h"
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric#include <vector>
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andricusing namespace llvm;
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andricstatic cl::opt<std::string> TrainingLog(
e8d8bef9SDimitry Andric    "training-log", cl::Hidden,
e8d8bef9SDimitry Andric    cl::desc("Path where the development - mode inlining log is saved."));
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andricstatic cl::opt<std::string> TFModelUnderTrainingPath(
e8d8bef9SDimitry Andric    "ml-inliner-model-under-training", cl::Hidden,
e8d8bef9SDimitry Andric    cl::desc(R"(Path to SavedModel from the previous training iteration.
e8d8bef9SDimitry AndricThe directory is also expected to contain a JSON specification of the
e8d8bef9SDimitry Andricoutputs expected to be logged, where the first entry must be the
e8d8bef9SDimitry Andricinlining decision. The file containing the specification should be
e8d8bef9SDimitry Andriccalled output_spec.json. The expected JSON value is an array of
e8d8bef9SDimitry Andricdictionaries. Each dictionary should have 2 keys:
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric- "tensor_spec, followed by the TensorSpec description of the
e8d8bef9SDimitry Andricoutput; and
e8d8bef9SDimitry Andric- "logging_name", a string indicating the name to use when
e8d8bef9SDimitry Andriclogging the output values.
e8d8bef9SDimitry Andric
e8d8bef9SDimitry AndricExample:
e8d8bef9SDimitry Andric[
e8d8bef9SDimitry Andric  {
e8d8bef9SDimitry Andric    "logging_name" : "some_name",
e8d8bef9SDimitry Andric    "tensor_spec" : {
e8d8bef9SDimitry Andric      "name" : "model_name",
e8d8bef9SDimitry Andric      "port" : 0,
e8d8bef9SDimitry Andric      "shape" : [2, 3],
e8d8bef9SDimitry Andric      "type" : "float"
e8d8bef9SDimitry Andric      }
e8d8bef9SDimitry Andric  }
e8d8bef9SDimitry Andric]
e8d8bef9SDimitry Andric
e8d8bef9SDimitry AndricThe first value must always correspond to the decision.)"));
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andricstatic cl::opt<std::string> TFOutputSpecOverride(
e8d8bef9SDimitry Andric    "ml-inliner-output-spec-override", cl::Hidden,
e8d8bef9SDimitry Andric    cl::desc("Override the path to the output spec json file. See "
e8d8bef9SDimitry Andric             "-ml-inliner-model-under-training documentation for the "
e8d8bef9SDimitry Andric             "specification of that file."));
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andricstatic cl::opt<std::string> TFFeedPrefix("ml-inliner-trained-model-feed-prefix",
e8d8bef9SDimitry Andric                                         cl::Hidden, cl::init("action_"),
e8d8bef9SDimitry Andric                                         cl::desc("Prefix for feature names."));
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andricnamespace {
/// One inlining decision together with its outcome, as consumed by
/// TrainingLogger.
struct InlineEvent {
  /// The decision the default policy would have taken for this call site.
  int64_t DefaultDecision{0};

  /// The decision that was advised. It coincides with DefaultDecision when
  /// training off the default policy.
  int64_t AdvisedDecision{0};

  /// Whether inlining really took place. It is 'false' when inlining failed
  /// even though AdvisedDecision was true; otherwise it matches
  /// AdvisedDecision.
  bool Effect{false};

  /// The size change attributed to this event: size_after - size_before.
  int64_t Reward{0};
};
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric/// Collect data we may use for training a model, and write it as a textual
e8d8bef9SDimitry Andric/// Tensorflow SequenceExample
e8d8bef9SDimitry Andric/// (https://www.tensorflow.org/api_docs/python/tf/train/SequenceExample)
e8d8bef9SDimitry Andric/// protobuf (https://developers.google.com/protocol-buffers).
e8d8bef9SDimitry Andric/// Because this is a protobuf, we cannot just stream the events as they come.
e8d8bef9SDimitry Andric/// Internally, TrainingLogger stores data in column-major format, because that
e8d8bef9SDimitry Andric/// lines up with how TF SequenceExample represents it.
e8d8bef9SDimitry Andricclass ModelUnderTrainingRunner;
e8d8bef9SDimitry Andricclass TrainingLogger final {
e8d8bef9SDimitry Andricpublic:
e8d8bef9SDimitry Andric  TrainingLogger(StringRef LogFileName, const ModelUnderTrainingRunner *MUTR);
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  /// Log one inlining event.
e8d8bef9SDimitry Andric  void logInlineEvent(const InlineEvent &Event,
e8d8bef9SDimitry Andric                      const MLModelRunner &ModelRunner);
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  /// Print the stored tensors.
e8d8bef9SDimitry Andric  void print();
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andricprivate:
e8d8bef9SDimitry Andric  StringRef LogFileName;
e8d8bef9SDimitry Andric  const ModelUnderTrainingRunner *const MUTR;
e8d8bef9SDimitry Andric  std::unique_ptr<Logger> L;
e8d8bef9SDimitry Andric  std::vector<bool> Effects;
e8d8bef9SDimitry Andric  /// There's at least one output. We'll set this to a different value if MUTR
e8d8bef9SDimitry Andric  /// is avaliable.
e8d8bef9SDimitry Andric  size_t OutputCount = 1;
e8d8bef9SDimitry Andric  /// Set these 2 clearly OOB, to make sure we set them later.
e8d8bef9SDimitry Andric  size_t DefaultDecisionPos = std::numeric_limits<size_t>::max();
e8d8bef9SDimitry Andric  size_t DecisionPos = std::numeric_limits<size_t>::max();
e8d8bef9SDimitry Andric};
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric/// An extension of the MLInlineAdvisor for the 'development' mode, targeting
e8d8bef9SDimitry Andric/// the offline training scenario. Note that training happens outside of the
e8d8bef9SDimitry Andric/// compiler, this facility is concerned with producing training data ("logs").
e8d8bef9SDimitry Andric/// This InlineAdvisor can operate in the following modes:
e8d8bef9SDimitry Andric///
e8d8bef9SDimitry Andric/// 1) collect logs for the default policy. This is useful for bootstrapping
e8d8bef9SDimitry Andric/// training, which will be considerably faster by starting from a reasonable
e8d8bef9SDimitry Andric/// policy.
e8d8bef9SDimitry Andric///
e8d8bef9SDimitry Andric/// 2) collect logs for the ML policy, using a model from a previous
e8d8bef9SDimitry Andric/// training. Potentially, that model uses internally some small random
e8d8bef9SDimitry Andric/// perturbation of its weights, to induce exploration (setting this up is the
e8d8bef9SDimitry Andric/// responsibility of the training algorithm). The logs would then be used to
e8d8bef9SDimitry Andric/// retrain and improve on this model.
e8d8bef9SDimitry Andric///
e8d8bef9SDimitry Andric/// 3) use the provided model, with no logging. This is useful for end to end
e8d8bef9SDimitry Andric/// validation - the model, in this case, is a release candidate and shouldn't
e8d8bef9SDimitry Andric/// have random perturbations. It is a convenience feature: rather than needing
e8d8bef9SDimitry Andric/// to take the release candidate model and compile it in 'release' mode,
e8d8bef9SDimitry Andric/// validate it, then potentially discard it, it's easier to just pass the model
e8d8bef9SDimitry Andric/// to the compiler, albeit compilation would be slower, as a one-off. Once the
e8d8bef9SDimitry Andric/// model behaves satisfactorily, it can be compiled AOT, for efficiency, in
e8d8bef9SDimitry Andric/// release mode. The expectation is that a well-trained model provides a good
e8d8bef9SDimitry Andric/// policy over a sufficiently diverse codebase, over many changes (i.e.
e8d8bef9SDimitry Andric/// training happens seldom).
e8d8bef9SDimitry Andricclass DevelopmentModeMLInlineAdvisor : public MLInlineAdvisor {
e8d8bef9SDimitry Andricpublic:
e8d8bef9SDimitry Andric  DevelopmentModeMLInlineAdvisor(
e8d8bef9SDimitry Andric      Module &M, ModuleAnalysisManager &MAM,
e8d8bef9SDimitry Andric      std::unique_ptr<MLModelRunner> ModelRunner,
e8d8bef9SDimitry Andric      std::function<bool(CallBase &)> GetDefaultAdvice, bool IsDoingInference,
e8d8bef9SDimitry Andric      std::unique_ptr<TrainingLogger> Logger);
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  size_t getTotalSizeEstimate();
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  virtual ~DevelopmentModeMLInlineAdvisor();
e8d8bef9SDimitry Andric  void updateNativeSizeEstimate(int64_t Change) {
e8d8bef9SDimitry Andric    *CurrentNativeSize += Change;
e8d8bef9SDimitry Andric  }
e8d8bef9SDimitry Andric  void resetNativeSize(Function *F) {
*fe6060f1SDimitry Andric    PreservedAnalyses PA = PreservedAnalyses::all();
*fe6060f1SDimitry Andric    PA.abandon<InlineSizeEstimatorAnalysis>();
*fe6060f1SDimitry Andric    FAM.invalidate(*F, PA);
e8d8bef9SDimitry Andric  }
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  std::unique_ptr<MLInlineAdvice>
e8d8bef9SDimitry Andric  getAdviceFromModel(CallBase &CB, OptimizationRemarkEmitter &ORE) override;
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  Optional<size_t> getNativeSizeEstimate(const Function &F) const;
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andricprivate:
e8d8bef9SDimitry Andric  bool isLogging() const { return !!Logger; }
e8d8bef9SDimitry Andric  std::unique_ptr<MLInlineAdvice> getMandatoryAdviceImpl(CallBase &CB) override;
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  std::function<bool(CallBase &)> GetDefaultAdvice;
e8d8bef9SDimitry Andric  const bool IsDoingInference;
e8d8bef9SDimitry Andric  std::unique_ptr<TrainingLogger> Logger;
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  const Optional<int32_t> InitialNativeSize;
e8d8bef9SDimitry Andric  Optional<int32_t> CurrentNativeSize;
e8d8bef9SDimitry Andric};
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric/// A variant of MLInlineAdvice that tracks all non-trivial inlining
e8d8bef9SDimitry Andric/// decisions, for training/logging.
e8d8bef9SDimitry Andricclass LoggingMLInlineAdvice : public MLInlineAdvice {
e8d8bef9SDimitry Andricpublic:
e8d8bef9SDimitry Andric  LoggingMLInlineAdvice(DevelopmentModeMLInlineAdvisor *Advisor, CallBase &CB,
e8d8bef9SDimitry Andric                        OptimizationRemarkEmitter &ORE, bool Recommendation,
e8d8bef9SDimitry Andric                        TrainingLogger &Logger,
e8d8bef9SDimitry Andric                        Optional<size_t> CallerSizeEstimateBefore,
e8d8bef9SDimitry Andric                        Optional<size_t> CalleeSizeEstimateBefore,
e8d8bef9SDimitry Andric                        bool DefaultDecision, bool Mandatory = false)
e8d8bef9SDimitry Andric      : MLInlineAdvice(Advisor, CB, ORE, Recommendation), Logger(Logger),
e8d8bef9SDimitry Andric        CallerSizeEstimateBefore(CallerSizeEstimateBefore),
e8d8bef9SDimitry Andric        CalleeSizeEstimateBefore(CalleeSizeEstimateBefore),
e8d8bef9SDimitry Andric        DefaultDecision(DefaultDecision), Mandatory(Mandatory) {}
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  virtual ~LoggingMLInlineAdvice() = default;
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andricprivate:
e8d8bef9SDimitry Andric  DevelopmentModeMLInlineAdvisor *getAdvisor() const {
e8d8bef9SDimitry Andric    return static_cast<DevelopmentModeMLInlineAdvisor *>(Advisor);
e8d8bef9SDimitry Andric  }
e8d8bef9SDimitry Andric  void recordInliningImpl() override {
e8d8bef9SDimitry Andric    MLInlineAdvice::recordInliningImpl();
e8d8bef9SDimitry Andric    getAdvisor()->resetNativeSize(Caller);
e8d8bef9SDimitry Andric    int Reward = std::numeric_limits<int>::max();
e8d8bef9SDimitry Andric    if (InlineSizeEstimatorAnalysis::isEvaluatorRequested() &&
e8d8bef9SDimitry Andric        !getAdvisor()->isForcedToStop()) {
e8d8bef9SDimitry Andric      int NativeSizeAfter = *getAdvisor()->getNativeSizeEstimate(*Caller) +
e8d8bef9SDimitry Andric                            *CalleeSizeEstimateBefore;
e8d8bef9SDimitry Andric      Reward = NativeSizeAfter -
e8d8bef9SDimitry Andric               (*CallerSizeEstimateBefore + *CalleeSizeEstimateBefore);
e8d8bef9SDimitry Andric      getAdvisor()->updateNativeSizeEstimate(Reward);
e8d8bef9SDimitry Andric    }
e8d8bef9SDimitry Andric    log(Reward, /*Success=*/true);
e8d8bef9SDimitry Andric  }
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  void recordInliningWithCalleeDeletedImpl() override {
e8d8bef9SDimitry Andric    MLInlineAdvice::recordInliningWithCalleeDeletedImpl();
e8d8bef9SDimitry Andric    getAdvisor()->resetNativeSize(Caller);
e8d8bef9SDimitry Andric    if (InlineSizeEstimatorAnalysis::isEvaluatorRequested() &&
e8d8bef9SDimitry Andric        !getAdvisor()->isForcedToStop()) {
e8d8bef9SDimitry Andric      int NativeSizeAfter = *getAdvisor()->getNativeSizeEstimate(*Caller);
e8d8bef9SDimitry Andric      int Reward = NativeSizeAfter -
e8d8bef9SDimitry Andric                   (*CallerSizeEstimateBefore + *CalleeSizeEstimateBefore);
e8d8bef9SDimitry Andric      getAdvisor()->updateNativeSizeEstimate(Reward);
e8d8bef9SDimitry Andric      log(Reward, /*Success=*/true);
e8d8bef9SDimitry Andric    }
e8d8bef9SDimitry Andric  }
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  void recordUnsuccessfulInliningImpl(const InlineResult &Result) override {
e8d8bef9SDimitry Andric    MLInlineAdvice::recordUnsuccessfulInliningImpl(Result);
e8d8bef9SDimitry Andric    log(NoReward, /*Success=*/false);
e8d8bef9SDimitry Andric  }
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  void recordUnattemptedInliningImpl() override {
e8d8bef9SDimitry Andric    MLInlineAdvice::recordUnattemptedInliningImpl();
e8d8bef9SDimitry Andric    log(NoReward, /*Success=*/false);
e8d8bef9SDimitry Andric  }
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  void log(int64_t Reward, bool Success) {
e8d8bef9SDimitry Andric    if (Mandatory)
e8d8bef9SDimitry Andric      return;
e8d8bef9SDimitry Andric    InlineEvent Event;
e8d8bef9SDimitry Andric    Event.AdvisedDecision = isInliningRecommended();
e8d8bef9SDimitry Andric    Event.DefaultDecision = DefaultDecision;
e8d8bef9SDimitry Andric    Event.Effect = Success;
e8d8bef9SDimitry Andric    Event.Reward = Reward;
e8d8bef9SDimitry Andric    Logger.logInlineEvent(Event, getAdvisor()->getModelRunner());
e8d8bef9SDimitry Andric  }
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  static const int64_t NoReward = 0;
e8d8bef9SDimitry Andric  TrainingLogger &Logger;
e8d8bef9SDimitry Andric  const Optional<size_t> CallerSizeEstimateBefore;
e8d8bef9SDimitry Andric  const Optional<size_t> CalleeSizeEstimateBefore;
e8d8bef9SDimitry Andric  const int64_t DefaultDecision;
e8d8bef9SDimitry Andric  const int64_t Mandatory;
e8d8bef9SDimitry Andric};
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric/// A pseudo model runner. We use it to store feature values when collecting
e8d8bef9SDimitry Andric/// logs for the default policy, but never ask it to 'run'.
e8d8bef9SDimitry Andricclass NoInferenceModelRunner : public MLModelRunner {
e8d8bef9SDimitry Andricpublic:
e8d8bef9SDimitry Andric  NoInferenceModelRunner(LLVMContext &Ctx)
e8d8bef9SDimitry Andric      : MLModelRunner(Ctx), Features(NumberOfFeatures) {}
e8d8bef9SDimitry Andric  void setFeature(FeatureIndex Index, int64_t Value) override {
e8d8bef9SDimitry Andric    Features[static_cast<int>(Index)] = Value;
e8d8bef9SDimitry Andric  }
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  int64_t getFeature(int Index) const override { return Features[Index]; }
e8d8bef9SDimitry Andric  bool run() override {
e8d8bef9SDimitry Andric    llvm_unreachable("We shouldn't call run on this model runner.");
e8d8bef9SDimitry Andric  }
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andricprivate:
e8d8bef9SDimitry Andric  InlineFeatures Features;
e8d8bef9SDimitry Andric};
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric/// ModelUnderTrainingRunner - training mode implementation. It uses TF C APIs
e8d8bef9SDimitry Andric/// to dynamically load and evaluate a TF SavedModel
e8d8bef9SDimitry Andric/// (https://www.tensorflow.org/guide/saved_model). Runtime performance is
e8d8bef9SDimitry Andric/// sacrificed for ease of use while training.
e8d8bef9SDimitry Andricclass ModelUnderTrainingRunner final : public MLModelRunner {
e8d8bef9SDimitry Andricpublic:
e8d8bef9SDimitry Andric  ModelUnderTrainingRunner(LLVMContext &Ctx, const std::string &ModelPath);
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  bool run() override;
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  // Disallows copy and assign.
e8d8bef9SDimitry Andric  ModelUnderTrainingRunner(const ModelUnderTrainingRunner &) = delete;
e8d8bef9SDimitry Andric  ModelUnderTrainingRunner &
e8d8bef9SDimitry Andric  operator=(const ModelUnderTrainingRunner &) = delete;
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  void setFeature(FeatureIndex Index, int64_t Value) override;
e8d8bef9SDimitry Andric  int64_t getFeature(int Index) const override;
e8d8bef9SDimitry Andric  bool isValid() const { return !!Evaluator; }
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  const std::vector<LoggedFeatureSpec> &outputLoggedFeatureSpecs() const {
e8d8bef9SDimitry Andric    return OutputSpecs;
e8d8bef9SDimitry Andric  }
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  const Optional<TFModelEvaluator::EvaluationResult> &
e8d8bef9SDimitry Andric  lastEvaluationResult() const {
e8d8bef9SDimitry Andric    return LastEvaluationResult;
e8d8bef9SDimitry Andric  }
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andricprivate:
e8d8bef9SDimitry Andric  std::unique_ptr<TFModelEvaluator> Evaluator;
e8d8bef9SDimitry Andric  std::vector<LoggedFeatureSpec> OutputSpecs;
e8d8bef9SDimitry Andric  Optional<TFModelEvaluator::EvaluationResult> LastEvaluationResult;
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  // The training framework needs some additional features.
e8d8bef9SDimitry Andric  const std::vector<TensorSpec> TrainingOnlyFeatures{
e8d8bef9SDimitry Andric      TensorSpec::createSpec<int64_t>(TFFeedPrefix + "inlining_default", {1}),
e8d8bef9SDimitry Andric      TensorSpec::createSpec<float>(TFFeedPrefix + "discount", {1}),
e8d8bef9SDimitry Andric      TensorSpec::createSpec<float>(TFFeedPrefix + "reward", {1}),
e8d8bef9SDimitry Andric      TensorSpec::createSpec<int32_t>(TFFeedPrefix + "step_type", {1})};
e8d8bef9SDimitry Andric};
e8d8bef9SDimitry Andric} // namespace
e8d8bef9SDimitry Andric
e8d8bef9SDimitry AndricTrainingLogger::TrainingLogger(StringRef LogFileName,
e8d8bef9SDimitry Andric                               const ModelUnderTrainingRunner *MUTR)
e8d8bef9SDimitry Andric    : LogFileName(LogFileName), MUTR(MUTR) {
e8d8bef9SDimitry Andric  // The first output is the inlining decision.
e8d8bef9SDimitry Andric  if (MUTR)
e8d8bef9SDimitry Andric    OutputCount = MUTR->outputLoggedFeatureSpecs().size();
e8d8bef9SDimitry Andric  std::vector<LoggedFeatureSpec> FT;
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  for (size_t I = 0; I < NumberOfFeatures; ++I)
e8d8bef9SDimitry Andric    FT.push_back(
e8d8bef9SDimitry Andric        {TensorSpec::createSpec<int64_t>(FeatureNameMap.at(I), {1}), None});
e8d8bef9SDimitry Andric  if (MUTR && MUTR->outputLoggedFeatureSpecs().size() > 1)
e8d8bef9SDimitry Andric    append_range(FT, drop_begin(MUTR->outputLoggedFeatureSpecs()));
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  DefaultDecisionPos = FT.size();
e8d8bef9SDimitry Andric  FT.push_back(
e8d8bef9SDimitry Andric      {TensorSpec::createSpec<int64_t>(DefaultDecisionName, {1}), None});
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  DecisionPos = FT.size();
e8d8bef9SDimitry Andric  FT.push_back({TensorSpec::createSpec<int64_t>(DecisionName, {1}), None});
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  L = std::make_unique<Logger>(
e8d8bef9SDimitry Andric      FT, TensorSpec::createSpec<int64_t>(RewardName, {1}),
e8d8bef9SDimitry Andric      InlineSizeEstimatorAnalysis::isEvaluatorRequested());
e8d8bef9SDimitry Andric}
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric/// Log one inlining event.
e8d8bef9SDimitry Andricvoid TrainingLogger::logInlineEvent(const InlineEvent &Event,
e8d8bef9SDimitry Andric                                    const MLModelRunner &ModelRunner) {
e8d8bef9SDimitry Andric  size_t CurrentFeature = 0;
e8d8bef9SDimitry Andric  for (; CurrentFeature < NumberOfFeatures; ++CurrentFeature) {
e8d8bef9SDimitry Andric    int64_t F = ModelRunner.getFeature(CurrentFeature);
*fe6060f1SDimitry Andric    L->logInt64Value(CurrentFeature, &F);
e8d8bef9SDimitry Andric  }
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  for (size_t I = 1; I < OutputCount; ++I) {
e8d8bef9SDimitry Andric    const auto &Result = *MUTR->lastEvaluationResult();
e8d8bef9SDimitry Andric    const char *RawData =
e8d8bef9SDimitry Andric        reinterpret_cast<const char *>(Result.getUntypedTensorValue(I));
*fe6060f1SDimitry Andric    L->logSpecifiedTensorValue(CurrentFeature, RawData);
e8d8bef9SDimitry Andric    ++CurrentFeature;
e8d8bef9SDimitry Andric  }
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  assert(CurrentFeature == DefaultDecisionPos);
*fe6060f1SDimitry Andric  L->logInt64Value(DefaultDecisionPos, &Event.DefaultDecision);
*fe6060f1SDimitry Andric  L->logInt64Value(DecisionPos, &Event.AdvisedDecision);
e8d8bef9SDimitry Andric  if (InlineSizeEstimatorAnalysis::isEvaluatorRequested())
*fe6060f1SDimitry Andric    L->logInt64Reward(Event.Reward);
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  // For debugging / later use
e8d8bef9SDimitry Andric  Effects.push_back(Event.Effect);
e8d8bef9SDimitry Andric}
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andricvoid TrainingLogger::print() {
e8d8bef9SDimitry Andric  std::error_code EC;
e8d8bef9SDimitry Andric  raw_fd_ostream OutFile(LogFileName, EC);
e8d8bef9SDimitry Andric  L->print(OutFile);
e8d8bef9SDimitry Andric}
e8d8bef9SDimitry Andric
e8d8bef9SDimitry AndricDevelopmentModeMLInlineAdvisor::DevelopmentModeMLInlineAdvisor(
e8d8bef9SDimitry Andric    Module &M, ModuleAnalysisManager &MAM,
e8d8bef9SDimitry Andric    std::unique_ptr<MLModelRunner> ModelRunner,
e8d8bef9SDimitry Andric    std::function<bool(CallBase &)> GetDefaultAdvice, bool IsDoingInference,
e8d8bef9SDimitry Andric    std::unique_ptr<TrainingLogger> Logger)
e8d8bef9SDimitry Andric    : MLInlineAdvisor(M, MAM, std::move(ModelRunner)),
e8d8bef9SDimitry Andric      GetDefaultAdvice(GetDefaultAdvice), IsDoingInference(IsDoingInference),
e8d8bef9SDimitry Andric      Logger(std::move(Logger)),
e8d8bef9SDimitry Andric      InitialNativeSize(isLogging() ? getTotalSizeEstimate() : 0),
e8d8bef9SDimitry Andric      CurrentNativeSize(InitialNativeSize) {
e8d8bef9SDimitry Andric  // We cannot have the case of neither inference nor logging.
e8d8bef9SDimitry Andric  assert(IsDoingInference || isLogging());
e8d8bef9SDimitry Andric}
e8d8bef9SDimitry Andric
e8d8bef9SDimitry AndricDevelopmentModeMLInlineAdvisor::~DevelopmentModeMLInlineAdvisor() {
e8d8bef9SDimitry Andric  if (isLogging())
e8d8bef9SDimitry Andric    Logger->print();
e8d8bef9SDimitry Andric}
e8d8bef9SDimitry Andric
e8d8bef9SDimitry AndricOptional<size_t>
e8d8bef9SDimitry AndricDevelopmentModeMLInlineAdvisor::getNativeSizeEstimate(const Function &F) const {
e8d8bef9SDimitry Andric  if (!InlineSizeEstimatorAnalysis::isEvaluatorRequested())
e8d8bef9SDimitry Andric    return None;
e8d8bef9SDimitry Andric  auto &R =
e8d8bef9SDimitry Andric      FAM.getResult<InlineSizeEstimatorAnalysis>(const_cast<Function &>(F));
e8d8bef9SDimitry Andric  if (!R) {
e8d8bef9SDimitry Andric    F.getParent()->getContext().emitError(
e8d8bef9SDimitry Andric        "Native size estimator is not present.");
e8d8bef9SDimitry Andric    return 0;
e8d8bef9SDimitry Andric  }
e8d8bef9SDimitry Andric  return *R;
e8d8bef9SDimitry Andric}
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andricstd::unique_ptr<MLInlineAdvice>
e8d8bef9SDimitry AndricDevelopmentModeMLInlineAdvisor::getMandatoryAdviceImpl(CallBase &CB) {
e8d8bef9SDimitry Andric  return std::make_unique<LoggingMLInlineAdvice>(
e8d8bef9SDimitry Andric      /*Advisor=*/this,
e8d8bef9SDimitry Andric      /*CB=*/CB, /*ORE=*/getCallerORE(CB), /*Recommendation=*/true,
e8d8bef9SDimitry Andric      /*Logger=*/*Logger,
e8d8bef9SDimitry Andric      /*CallerSizeEstimateBefore=*/getNativeSizeEstimate(*CB.getCaller()),
e8d8bef9SDimitry Andric      /*CalleeSizeEstimateBefore=*/
e8d8bef9SDimitry Andric      getNativeSizeEstimate(*CB.getCalledFunction()),
e8d8bef9SDimitry Andric      /*DefaultDecision=*/true, /*Mandatory*/ true);
e8d8bef9SDimitry Andric}
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andricstd::unique_ptr<MLInlineAdvice>
e8d8bef9SDimitry AndricDevelopmentModeMLInlineAdvisor::getAdviceFromModel(
e8d8bef9SDimitry Andric    CallBase &CB, OptimizationRemarkEmitter &ORE) {
e8d8bef9SDimitry Andric  if (IsDoingInference && !isLogging())
e8d8bef9SDimitry Andric    return MLInlineAdvisor::getAdviceFromModel(CB, ORE);
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  bool DefaultAdvice = GetDefaultAdvice(CB);
e8d8bef9SDimitry Andric  auto Recommendation = IsDoingInference ? ModelRunner->run() : DefaultAdvice;
e8d8bef9SDimitry Andric  return std::make_unique<LoggingMLInlineAdvice>(
e8d8bef9SDimitry Andric      /*Advisor=*/this,
e8d8bef9SDimitry Andric      /*CB=*/CB, /*ORE=*/ORE, /*Recommendation=*/Recommendation,
e8d8bef9SDimitry Andric      /*Logger=*/*Logger,
e8d8bef9SDimitry Andric      /*CallerSizeEstimateBefore=*/getNativeSizeEstimate(*CB.getCaller()),
e8d8bef9SDimitry Andric      /*CalleeSizeEstimateBefore=*/
e8d8bef9SDimitry Andric      getNativeSizeEstimate(*CB.getCalledFunction()),
e8d8bef9SDimitry Andric      /*DefaultDecision=*/DefaultAdvice);
e8d8bef9SDimitry Andric}
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andricsize_t DevelopmentModeMLInlineAdvisor::getTotalSizeEstimate() {
e8d8bef9SDimitry Andric  if (!InlineSizeEstimatorAnalysis::isEvaluatorRequested())
e8d8bef9SDimitry Andric    return 0;
e8d8bef9SDimitry Andric  size_t Ret = 0;
e8d8bef9SDimitry Andric  for (auto &F : M) {
e8d8bef9SDimitry Andric    if (F.isDeclaration())
e8d8bef9SDimitry Andric      continue;
e8d8bef9SDimitry Andric    if (isFunctionDeleted(&F))
e8d8bef9SDimitry Andric      continue;
e8d8bef9SDimitry Andric    Ret += *getNativeSizeEstimate(F);
e8d8bef9SDimitry Andric  }
e8d8bef9SDimitry Andric  return Ret;
e8d8bef9SDimitry Andric}
e8d8bef9SDimitry Andric
e8d8bef9SDimitry AndricModelUnderTrainingRunner::ModelUnderTrainingRunner(LLVMContext &Ctx,
e8d8bef9SDimitry Andric                                                   const std::string &ModelPath)
e8d8bef9SDimitry Andric    : MLModelRunner(Ctx) {
e8d8bef9SDimitry Andric  std::vector<TensorSpec> InputSpecs;
e8d8bef9SDimitry Andric  for (size_t I = 0; I < NumberOfFeatures; ++I)
e8d8bef9SDimitry Andric    InputSpecs.push_back(
e8d8bef9SDimitry Andric        TensorSpec::createSpec<int64_t>(TFFeedPrefix + FeatureNameMap[I], {1}));
e8d8bef9SDimitry Andric  append_range(InputSpecs, TrainingOnlyFeatures);
e8d8bef9SDimitry Andric  if (auto MaybeOutSpecs =
e8d8bef9SDimitry Andric          loadOutputSpecs(Ctx, DecisionName, ModelPath, TFOutputSpecOverride))
e8d8bef9SDimitry Andric    OutputSpecs = std::move(*MaybeOutSpecs);
e8d8bef9SDimitry Andric  else
e8d8bef9SDimitry Andric    return;
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  Evaluator = std::make_unique<TFModelEvaluator>(
e8d8bef9SDimitry Andric      ModelPath, InputSpecs, [&](size_t I) { return OutputSpecs[I].Spec; },
e8d8bef9SDimitry Andric      OutputSpecs.size());
e8d8bef9SDimitry Andric  if (!Evaluator || !Evaluator->isValid()) {
e8d8bef9SDimitry Andric    Ctx.emitError("Failed to create inliner saved model evaluator");
e8d8bef9SDimitry Andric    Evaluator.reset();
e8d8bef9SDimitry Andric    return;
e8d8bef9SDimitry Andric  }
e8d8bef9SDimitry Andric}
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andricbool ModelUnderTrainingRunner::run() {
e8d8bef9SDimitry Andric  LastEvaluationResult = Evaluator->evaluate();
e8d8bef9SDimitry Andric  if (!LastEvaluationResult.hasValue()) {
e8d8bef9SDimitry Andric    Ctx.emitError("Error evaluating model.");
e8d8bef9SDimitry Andric    return false;
e8d8bef9SDimitry Andric  }
e8d8bef9SDimitry Andric  int64_t Decision = *LastEvaluationResult->getTensorValue<int64_t>(0);
e8d8bef9SDimitry Andric  return static_cast<bool>(Decision);
e8d8bef9SDimitry Andric}
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andricint64_t ModelUnderTrainingRunner::getFeature(int Index) const {
e8d8bef9SDimitry Andric  return *Evaluator->getInput<int64_t>(Index);
e8d8bef9SDimitry Andric}
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andricvoid ModelUnderTrainingRunner::setFeature(FeatureIndex Index, int64_t Value) {
e8d8bef9SDimitry Andric  size_t NumericIndex = static_cast<size_t>(Index);
e8d8bef9SDimitry Andric  *(Evaluator->getInput<int64_t>(NumericIndex)) = Value;
e8d8bef9SDimitry Andric}
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andricstd::unique_ptr<InlineAdvisor> llvm::getDevelopmentModeAdvisor(
e8d8bef9SDimitry Andric    Module &M, ModuleAnalysisManager &MAM,
e8d8bef9SDimitry Andric    std::function<bool(CallBase &)> GetDefaultAdvice) {
e8d8bef9SDimitry Andric  auto &Ctx = M.getContext();
e8d8bef9SDimitry Andric  std::unique_ptr<MLModelRunner> Runner;
e8d8bef9SDimitry Andric  ModelUnderTrainingRunner *MUTRPtr = nullptr;
e8d8bef9SDimitry Andric  bool IsDoingInference = false;
e8d8bef9SDimitry Andric  if (TFModelUnderTrainingPath.empty())
e8d8bef9SDimitry Andric    Runner.reset(new NoInferenceModelRunner(Ctx));
e8d8bef9SDimitry Andric  else {
e8d8bef9SDimitry Andric    auto MUTR = std::make_unique<ModelUnderTrainingRunner>(
e8d8bef9SDimitry Andric        Ctx, TFModelUnderTrainingPath);
e8d8bef9SDimitry Andric    if (!MUTR || !MUTR->isValid()) {
e8d8bef9SDimitry Andric      Ctx.emitError("Could not load the policy model from the provided path");
e8d8bef9SDimitry Andric      return nullptr;
e8d8bef9SDimitry Andric    }
e8d8bef9SDimitry Andric    IsDoingInference = true;
e8d8bef9SDimitry Andric    MUTRPtr = MUTR.get();
e8d8bef9SDimitry Andric    Runner = std::move(MUTR);
e8d8bef9SDimitry Andric  }
e8d8bef9SDimitry Andric  std::unique_ptr<TrainingLogger> Logger;
e8d8bef9SDimitry Andric  if (!TrainingLog.empty())
e8d8bef9SDimitry Andric    Logger = std::make_unique<TrainingLogger>(TrainingLog, MUTRPtr);
e8d8bef9SDimitry Andric
e8d8bef9SDimitry Andric  return std::make_unique<DevelopmentModeMLInlineAdvisor>(
e8d8bef9SDimitry Andric      M, MAM, std::move(Runner), GetDefaultAdvice, IsDoingInference,
e8d8bef9SDimitry Andric      std::move(Logger));
e8d8bef9SDimitry Andric}
e8d8bef9SDimitry Andric#endif // defined(LLVM_HAVE_TF_API)