doxygen/ReleaseModeModelRunner_8h_source.html

//===- ReleaseModeModelRunner.h - Fast, precompiled model runner  ---------===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//

// This file implements a model runner wrapping an AOT compiled ML model.

// Only inference is supported.

//

//===----------------------------------------------------------------------===//


#ifndef LLVM_ANALYSIS_RELEASEMODEMODELRUNNER_H

#define LLVM_ANALYSIS_RELEASEMODEMODELRUNNER_H


#include "llvm/ADT/StringExtras.h"

#include "llvm/Analysis/MLModelRunner.h"

#include "llvm/Analysis/TensorSpec.h"

#include "llvm/Support/ErrorHandling.h"

#include "llvm/Support/MD5.h"


#include <memory>


namespace llvm {


/// ReleaseModeModelRunner - production mode implementation of the

/// MLModelRunner. It uses an AOT-compiled SavedModel for efficient execution.

struct EmbeddedModelRunnerOptions {

  /// Feed and Fetch feature prefixes - i.e. a feature named "foo" will be

  /// looked up as {FeedPrefix}_foo; and the output named "bar" will be looked

  /// up as {FetchPrefix}_bar

  StringRef FeedPrefix = "feed_";

  StringRef FetchPrefix = "fetch_";


  /// ModelSelector is the name (recognized by the AOT-ed model) of a sub-model

  /// to use. "" is allowed if the model doesn't support sub-models.

  StringRef ModelSelector = "";


  EmbeddedModelRunnerOptions &setFeedPrefix(StringRef Value) {

    FeedPrefix = Value;

    return *this;

  }

  EmbeddedModelRunnerOptions &setFetchPrefix(StringRef Value) {

    FetchPrefix = Value;

    return *this;

  }

  EmbeddedModelRunnerOptions &setModelSelector(StringRef Value) {

    ModelSelector = Value;

    return *this;

  }

};


template <class TGen>

class ReleaseModeModelRunner final : public MLModelRunner {

public:

  /// FeatureNames' type should be an indexed collection of std::string, like

  /// std::array or std::vector, that has a size() method.

  template <class FType>

  ReleaseModeModelRunner(LLVMContext &Ctx, const FType &InputSpec,

                         StringRef DecisionName,

                         const EmbeddedModelRunnerOptions &Options = {})

      : MLModelRunner(Ctx, MLModelRunner::Kind::Release, InputSpec.size() + 1),

        CompiledModel(std::make_unique<TGen>()) {

    assert(CompiledModel && "The CompiledModel should be valid");

    // Set up the model_selector past all the InputSpecs in all cases.

    //   - if the model doesn't have such a feature, but the user requested it,

    //   we report error. Same if the model supports it but the user didn't

    //   specify it

    //   - finally, we compute the MD5 hash of the user input and set the value

    //   of the model selector to {high, low}

    bool InputIsPresent = true;

    populateTensor(InputSpec.size(),

                   TensorSpec::createSpec<uint64_t>("model_selector", {2}),

                   Options.FeedPrefix, InputIsPresent);


    // If we hit the "report an error" cases outlined above, continue with the

    // set up in case there's some custom diagnostics handler installed and it

    // doesn't promptly exit.

    if (Options.ModelSelector.empty() && InputIsPresent)

      Ctx.emitError(

          "A model selector was not specified but the underlying model "

          "requires selecting one because it exposes a model_selector input");

    uint64_t High = 0;

    uint64_t Low = 0;

    if (!Options.ModelSelector.empty()) {

      if (!InputIsPresent)

        Ctx.emitError("A model selector was specified but the underlying model "

                      "does not expose a model_selector input");

      const auto Hash = MD5::hash(arrayRefFromStringRef(Options.ModelSelector));

      High = Hash.high();

      Low = Hash.low();

    }

    getTensor<uint64_t>(InputSpec.size())[0] = High;

    getTensor<uint64_t>(InputSpec.size())[1] = Low;

    // At this point, the model selector is set up. If the user didn't provide

    // one, but the model has a model_selector, it'll be set to (0, 0) which

    // the composite model should treat as error as part of its implementation

    // (but that should only matter if there is a custom handler that doesn't

    // exit on error)

    for (size_t I = 0; I < InputSpec.size(); ++I)

      populateTensor(I, InputSpec[I], Options.FeedPrefix, InputIsPresent);


    ResultIndex = CompiledModel->LookupResultIndex(Options.FetchPrefix.str() +

                                                   DecisionName.str());

    assert(ResultIndex >= 0 && "Cannot find DecisionName in inlining model");

  }


  virtual ~ReleaseModeModelRunner() = default;


  static bool classof(const MLModelRunner *R) {

    return R->getKind() == MLModelRunner::Kind::Release;

  }


private:

  // fetch the model-provided buffer for the given Spec, or let MLModelRunner

  // create a scratch buffer. Indicate back to the caller if the model had that

  // input in the first place.

  void populateTensor(size_t Pos, const TensorSpec &Spec, StringRef Prefix,

                      bool &InputIsPresent) {

    const int Index =

        CompiledModel->LookupArgIndex((Prefix + Spec.name()).str());

    void *Buffer = nullptr;

    InputIsPresent = Index >= 0;

    if (InputIsPresent)

      Buffer = CompiledModel->arg_data(Index);

    setUpBufferForTensor(Pos, Spec, Buffer);

  }


  void *evaluateUntyped() override {

    CompiledModel->Run();

    return CompiledModel->result_data(ResultIndex);

  }


  int32_t ResultIndex = -1;

  std::unique_ptr<TGen> CompiledModel;

};


/// A mock class satisfying the interface expected by ReleaseModeModelRunner for

/// its `TGen` parameter. Useful to avoid conditional compilation complexity, as

/// a compile-time replacement for a real AOT-ed model.

class NoopSavedModelImpl final {

#define NOOP_MODEL_ERRMSG                                                      \

  "The mock AOT-ed saved model is a compile-time stub and should not be "      \

  "called."


public:

  NoopSavedModelImpl() = default;

  int LookupArgIndex(const std::string &) { llvm_unreachable(NOOP_MODEL_ERRMSG); }

  int LookupResultIndex(const std::string &) { llvm_unreachable(NOOP_MODEL_ERRMSG); }

  void Run() { llvm_unreachable(NOOP_MODEL_ERRMSG); }

  void *result_data(int) { llvm_unreachable(NOOP_MODEL_ERRMSG); }

  void *arg_data(int) { llvm_unreachable(NOOP_MODEL_ERRMSG); }

#undef NOOP_MODEL_ERRMSG

};


template <class T> bool isEmbeddedModelEvaluatorValid() { return true; }


template <> inline bool isEmbeddedModelEvaluatorValid<NoopSavedModelImpl>() {

  return false;

}

} // namespace llvm


#endif // LLVM_ANALYSIS_RELEASEMODEMODELRUNNER_H

Options
static LVOptions Options
Definition: LVOptions.cpp:25

I
#define I(x, y, z)
Definition: MD5.cpp:58

MD5.h

MLModelRunner.h

High
uint64_t High
Definition: NVVMIntrRange.cpp:52

NOOP_MODEL_ERRMSG
#define NOOP_MODEL_ERRMSG
Definition: ReleaseModeModelRunner.h:143

assert
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())

StringExtras.h
This file contains some functions that are useful when dealing with strings.

TensorSpec.h

llvm::LLVMContext
This is an important class for using LLVM in a threaded context.
Definition: LLVMContext.h:67

llvm::LLVMContext::emitError
void emitError(uint64_t LocCookie, const Twine &ErrorStr)
emitError - Emit an error message to the currently installed error handler with optional location inf...
Definition: LLVMContext.cpp:286

llvm::MD5::hash
static MD5Result hash(ArrayRef< uint8_t > Data)
Computes the hash for a given bytes.
Definition: MD5.cpp:291

llvm::MLModelRunner
MLModelRunner interface: abstraction of a mechanism for evaluating a ML model.
Definition: MLModelRunner.h:26

llvm::MLModelRunner::Kind::Release
@ Release

llvm::MLModelRunner::setUpBufferForTensor
void setUpBufferForTensor(size_t Index, const TensorSpec &Spec, void *Buffer)
Definition: MLModelRunner.h:63

llvm::MLModelRunner::Ctx
LLVMContext & Ctx
Definition: MLModelRunner.h:72

llvm::NoopSavedModelImpl
A mock class satisfying the interface expected by ReleaseModeModelRunner for its TGen parameter.
Definition: ReleaseModeModelRunner.h:142

llvm::NoopSavedModelImpl::LookupArgIndex
int LookupArgIndex(const std::string &)
Definition: ReleaseModeModelRunner.h:149

llvm::NoopSavedModelImpl::Run
void Run()
Definition: ReleaseModeModelRunner.h:151

llvm::NoopSavedModelImpl::arg_data
void * arg_data(int)
Definition: ReleaseModeModelRunner.h:153

llvm::NoopSavedModelImpl::result_data
void * result_data(int)
Definition: ReleaseModeModelRunner.h:152

llvm::NoopSavedModelImpl::NoopSavedModelImpl
NoopSavedModelImpl()=default

llvm::NoopSavedModelImpl::LookupResultIndex
int LookupResultIndex(const std::string &)
Definition: ReleaseModeModelRunner.h:150

llvm::ReleaseModeModelRunner
Definition: ReleaseModeModelRunner.h:55

llvm::ReleaseModeModelRunner::ReleaseModeModelRunner
ReleaseModeModelRunner(LLVMContext &Ctx, const FType &InputSpec, StringRef DecisionName, const EmbeddedModelRunnerOptions &Options={})
FeatureNames' type should be an indexed collection of std::string, like std::array or std::vector,...
Definition: ReleaseModeModelRunner.h:60

llvm::ReleaseModeModelRunner::classof
static bool classof(const MLModelRunner *R)
Definition: ReleaseModeModelRunner.h:111

llvm::ReleaseModeModelRunner::~ReleaseModeModelRunner
virtual ~ReleaseModeModelRunner()=default

llvm::StringRef
StringRef - Represent a constant reference to a string, i.e.
Definition: StringRef.h:50

llvm::TensorSpec
Definition: TensorSpec.h:62

llvm::Value
LLVM Value Representation.
Definition: Value.h:74

uint64_t

ErrorHandling.h

llvm_unreachable
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
Definition: ErrorHandling.h:143

llvm::dwarf::Index
Index
Definition: Dwarf.h:875

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18

llvm::ThreadPriority::Low
@ Low
Lower the current thread's priority such that it does not affect foreground tasks significantly.

llvm::isEmbeddedModelEvaluatorValid
bool isEmbeddedModelEvaluatorValid()
Definition: ReleaseModeModelRunner.h:157

llvm::isEmbeddedModelEvaluatorValid< NoopSavedModelImpl >
bool isEmbeddedModelEvaluatorValid< NoopSavedModelImpl >()
Definition: ReleaseModeModelRunner.h:159

llvm::DecisionName
const char *const DecisionName
Definition: MLInlineAdvisor.cpp:121

llvm::EmbeddedModelRunnerOptions
ReleaseModeModelRunner - production mode implementation of the MLModelRunner.
Definition: ReleaseModeModelRunner.h:29

llvm::EmbeddedModelRunnerOptions::FetchPrefix
StringRef FetchPrefix
Definition: ReleaseModeModelRunner.h:34

llvm::EmbeddedModelRunnerOptions::setFeedPrefix
EmbeddedModelRunnerOptions & setFeedPrefix(StringRef Value)
Definition: ReleaseModeModelRunner.h:40

llvm::EmbeddedModelRunnerOptions::FeedPrefix
StringRef FeedPrefix
Feed and Fetch feature prefixes - i.e.
Definition: ReleaseModeModelRunner.h:33

llvm::EmbeddedModelRunnerOptions::setModelSelector
EmbeddedModelRunnerOptions & setModelSelector(StringRef Value)
Definition: ReleaseModeModelRunner.h:48

llvm::EmbeddedModelRunnerOptions::ModelSelector
StringRef ModelSelector
ModelSelector is the name (recognized by the AOT-ed model) of a sub-model to use.
Definition: ReleaseModeModelRunner.h:38

llvm::EmbeddedModelRunnerOptions::setFetchPrefix
EmbeddedModelRunnerOptions & setFetchPrefix(StringRef Value)
Definition: ReleaseModeModelRunner.h:44

llvm::Spec
Definition: FunctionSpecialization.h:121