Details | Last modification | View Log | RSS feed
| Rev | Author | Line No. | Line | 
|---|---|---|---|
| 14 | pmbaty | 1 | //===- ReleaseModeModelRunner.h - Fast, precompiled model runner  ---------===// | 
| 2 | // | ||
| 3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. | ||
| 4 | // See https://llvm.org/LICENSE.txt for license information. | ||
| 5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception | ||
| 6 | // | ||
| 7 | //===----------------------------------------------------------------------===// | ||
| 8 | // | ||
| 9 | // This file implements a model runner wrapping an AOT compiled ML model. | ||
| 10 | // Only inference is supported. | ||
| 11 | // | ||
| 12 | //===----------------------------------------------------------------------===// | ||
| 13 | |||
| 14 | #ifndef LLVM_ANALYSIS_RELEASEMODEMODELRUNNER_H | ||
| 15 | #define LLVM_ANALYSIS_RELEASEMODEMODELRUNNER_H | ||
| 16 | |||
| 17 | #include "llvm/Analysis/MLModelRunner.h" | ||
| 18 | #include "llvm/Analysis/TensorSpec.h" | ||
| 19 | #include "llvm/Support/ErrorHandling.h" | ||
| 20 | |||
| 21 | #include <memory> | ||
| 22 | #include <vector> | ||
| 23 | |||
| 24 | namespace llvm { | ||
| 25 | |||
| 26 | /// ReleaseModeModelRunner - production mode implementation of the | ||
| 27 | /// MLModelRunner. It uses an AOT-compiled SavedModel for efficient execution. | ||
| 28 | template <class TGen> | ||
| 29 | class ReleaseModeModelRunner final : public MLModelRunner { | ||
| 30 | public: | ||
| 31 |   /// FeatureNames' type should be an indexed collection of std::string, like | ||
| 32 |   /// std::array or std::vector, that has a size() method. | ||
| 33 | template <class FType> | ||
| 34 | ReleaseModeModelRunner(LLVMContext &Ctx, const FType &InputSpec, | ||
| 35 | StringRef DecisionName, StringRef FeedPrefix = "feed_", | ||
| 36 | StringRef FetchPrefix = "fetch_") | ||
| 37 | : MLModelRunner(Ctx, MLModelRunner::Kind::Release, InputSpec.size()), | ||
| 38 | CompiledModel(std::make_unique<TGen>()) { | ||
| 39 | assert(CompiledModel && "The CompiledModel should be valid"); | ||
| 40 | |||
| 41 | for (size_t I = 0; I < InputSpec.size(); ++I) { | ||
| 42 | const int Index = | ||
| 43 | CompiledModel->LookupArgIndex(FeedPrefix.str() + InputSpec[I].name()); | ||
| 44 | void *Buffer = nullptr; | ||
| 45 | if (Index >= 0) | ||
| 46 | Buffer = CompiledModel->arg_data(Index); | ||
| 47 | setUpBufferForTensor(I, InputSpec[I], Buffer); | ||
| 48 |     } | ||
| 49 | |||
| 50 | ResultIndex = CompiledModel->LookupResultIndex(FetchPrefix.str() + | ||
| 51 | DecisionName.str()); | ||
| 52 | assert(ResultIndex >= 0 && "Cannot find DecisionName in inlining model"); | ||
| 53 |   } | ||
| 54 | |||
| 55 | virtual ~ReleaseModeModelRunner() = default; | ||
| 56 | |||
| 57 | static bool classof(const MLModelRunner *R) { | ||
| 58 | return R->getKind() == MLModelRunner::Kind::Release; | ||
| 59 |   } | ||
| 60 | |||
| 61 | private: | ||
| 62 | void *evaluateUntyped() override { | ||
| 63 | CompiledModel->Run(); | ||
| 64 | return CompiledModel->result_data(ResultIndex); | ||
| 65 |   } | ||
| 66 | |||
| 67 | int32_t ResultIndex = -1; | ||
| 68 | std::unique_ptr<TGen> CompiledModel; | ||
| 69 | }; | ||
| 70 | |||
| 71 | /// A mock class satisfying the interface expected by ReleaseModeModelRunner for | ||
| 72 | /// its `TGen` parameter. Useful to avoid conditional compilation complexity, as | ||
| 73 | /// a compile-time replacement for a real AOT-ed model. | ||
| 74 | class NoopSavedModelImpl final { | ||
| 75 | #define NOOP_MODEL_ERRMSG                                                      \ | ||
| 76 |   "The mock AOT-ed saved model is a compile-time stub and should not be "      \ | ||
| 77 |   "called." | ||
| 78 | |||
| 79 | public: | ||
| 80 | NoopSavedModelImpl() = default; | ||
| 81 | int LookupArgIndex(const std::string &) { llvm_unreachable(NOOP_MODEL_ERRMSG); } | ||
| 82 | int LookupResultIndex(const std::string &) { llvm_unreachable(NOOP_MODEL_ERRMSG); } | ||
| 83 | void Run() { llvm_unreachable(NOOP_MODEL_ERRMSG); } | ||
| 84 | void *result_data(int) { llvm_unreachable(NOOP_MODEL_ERRMSG); } | ||
| 85 | void *arg_data(int) { llvm_unreachable(NOOP_MODEL_ERRMSG); } | ||
| 86 | #undef NOOP_MODEL_ERRMSG | ||
| 87 | }; | ||
| 88 | } // namespace llvm | ||
| 89 | |||
| 90 | #endif // LLVM_ANALYSIS_RELEASEMODEMODELRUNNER_H |