Path: contrib/llvm-project/llvm/lib/Analysis/DevelopmentModeInlineAdvisor.cpp
//===- DevelopmentModeInlineAdvisor.cpp - runtime-loadable model runner --===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
//
// This file implements a model runner using TFLite, allowing the
// loading of a model from a command line option.
//
//===----------------------------------------------------------------------===//
#include "llvm/Analysis/TensorSpec.h"
#include "llvm/Config/config.h"
#if defined(LLVM_HAVE_TFLITE)

#include "llvm/ADT/BitVector.h"
#include "llvm/Analysis/CallGraph.h"
#include "llvm/Analysis/InlineSizeEstimatorAnalysis.h"
#include "llvm/Analysis/MLInlineAdvisor.h"
#include "llvm/Analysis/ModelUnderTrainingRunner.h"
#include "llvm/Analysis/NoInferenceModelRunner.h"
#include "llvm/Analysis/Utils/TFUtils.h"
#include "llvm/Analysis/Utils/TrainingLogger.h"
#include "llvm/IR/LLVMContext.h"
#include "llvm/IR/Module.h"
#include "llvm/Support/CommandLine.h"
#include "llvm/Support/ManagedStatic.h"

#include <limits>
#include <optional>
#include <vector>

using namespace llvm;

static cl::opt<std::string> TrainingLog(
    "training-log", cl::Hidden,
    cl::desc("Path where the development-mode inlining log is saved."));

static cl::opt<std::string> TFModelUnderTrainingPath(
    "ml-inliner-model-under-training", cl::Hidden,
    cl::desc(R"(Path to SavedModel from the previous training iteration.
The directory is also expected to contain a JSON specification of the
outputs expected to be logged, where the first entry must be the
inlining decision. The file containing the specification should be
called output_spec.json. The expected JSON value is an array of
dictionaries. Each dictionary should have 2 keys:

- "tensor_spec", followed by the TensorSpec description of the
  output; and
- "logging_name", a string indicating the name to use when
  logging the output values.

Example:
[
  {
    "logging_name" : "some_name",
    "tensor_spec" : {
      "name" : "model_name",
      "port" : 0,
      "shape" : [2, 3],
      "type" : "float"
    }
  }
]

The first value must always correspond to the decision.)"));

static cl::opt<std::string> TFOutputSpecOverride(
    "ml-inliner-output-spec-override", cl::Hidden,
    cl::desc("Override the path to the output spec json file. See "
             "-ml-inliner-model-under-training documentation for the "
             "specification of that file."));

static cl::opt<std::string> TFFeedPrefix("ml-inliner-trained-model-feed-prefix",
                                         cl::Hidden, cl::init("action_"),
                                         cl::desc("Prefix for feature names."));
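
// Illustrative usage (editor's sketch, not part of the upstream file): with
// the development-mode advisor selected via -enable-ml-inliner=development
// (a flag defined elsewhere in LLVM), a hypothetical log-collection run over
// the default policy could look like:
//
//   opt -enable-ml-inliner=development -passes='default<O2>' \
//       -training-log=/tmp/inline.log input.bc -o /dev/null
//
// Adding -ml-inliner-model-under-training=<saved_model_dir> would instead
// collect logs under the model-under-training's policy; see the mode
// descriptions on DevelopmentModeMLInlineAdvisor below.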

namespace {
/// An InlineEvent, used by TrainingLogger.
struct InlineEvent {
  /// What the default policy's decision would have been.
  int64_t DefaultDecision = 0;

  /// What we advised. When training off the default policy, this is the same
  /// as DefaultDecision.
  int64_t AdvisedDecision = 0;

  /// What actually happened. This would be 'false' in the case of an inline
  /// error, even if AdvisedDecision were true; otherwise it agrees with
  /// AdvisedDecision.
  bool Effect = false;

  /// What the change in size was: size_after - size_before.
  int64_t Reward = 0;
};

/// Collect data we may use for training a model.
class TrainingLogger final {
public:
  TrainingLogger(StringRef LogFileName, const ModelUnderTrainingRunner *MUTR);

  /// Log one inlining event.
  void logInlineEvent(const InlineEvent &Event,
                      const MLModelRunner &ModelRunner);

private:
  StringRef LogFileName;
  const ModelUnderTrainingRunner *const MUTR;
  std::unique_ptr<Logger> L;
  BitVector Effects;
  /// Set these two clearly out-of-bounds, to make sure we set them later.
  size_t DefaultDecisionPos = std::numeric_limits<size_t>::max();
  size_t DecisionPos = std::numeric_limits<size_t>::max();
};
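
// Editor's sketch of the resulting log schema (derived from the constructor
// further below, not from upstream documentation): each observation is laid
// out as
//
//   [ FeatureMap tensors... | extra model outputs (when MUTR is set)... |
//     default decision | advised decision ]
//
// with a reward (the native size delta) additionally recorded per observation
// when the size estimator is enabled. DefaultDecisionPos and DecisionPos are
// therefore simply the indices of the last two columns.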

/// An extension of the MLInlineAdvisor for the 'development' mode, targeting
/// the offline training scenario. Note that training happens outside of the
/// compiler; this facility is concerned with producing training data ("logs").
/// This InlineAdvisor can operate in the following modes:
///
/// 1) collect logs for the default policy. This is useful for bootstrapping
/// training, which will be considerably faster by starting from a reasonable
/// policy.
///
/// 2) collect logs for the ML policy, using a model from a previous
/// training. Potentially, that model internally uses some small random
/// perturbation of its weights to induce exploration (setting this up is the
/// responsibility of the training algorithm). The logs would then be used to
/// retrain and improve on this model.
///
/// 3) use the provided model, with no logging. This is useful for end-to-end
/// validation - the model, in this case, is a release candidate and shouldn't
/// have random perturbations. It is a convenience feature: rather than needing
/// to take the release candidate model and compile it in 'release' mode,
/// validate it, then potentially discard it, it's easier to just pass the
/// model to the compiler, even though compilation would be slower, as a
/// one-off. Once the model behaves satisfactorily, it can be compiled AOT, for
/// efficiency, in release mode. The expectation is that a well-trained model
/// provides a good policy over a sufficiently diverse codebase, over many
/// changes (i.e., training happens seldom).
class DevelopmentModeMLInlineAdvisor : public MLInlineAdvisor {
public:
  DevelopmentModeMLInlineAdvisor(
      Module &M, ModuleAnalysisManager &MAM,
      std::unique_ptr<MLModelRunner> ModelRunner,
      std::function<bool(CallBase &)> GetDefaultAdvice,
      std::unique_ptr<TrainingLogger> Logger);

  size_t getTotalSizeEstimate();

  void updateNativeSizeEstimate(int64_t Change) {
    *CurrentNativeSize += Change;
  }
  void resetNativeSize(Function *F) {
    PreservedAnalyses PA = PreservedAnalyses::all();
    PA.abandon<InlineSizeEstimatorAnalysis>();
    FAM.invalidate(*F, PA);
  }

  std::unique_ptr<MLInlineAdvice>
  getAdviceFromModel(CallBase &CB, OptimizationRemarkEmitter &ORE) override;

  std::optional<size_t> getNativeSizeEstimate(const Function &F) const;

private:
  bool isLogging() const { return !!Logger; }
  std::unique_ptr<MLInlineAdvice> getMandatoryAdviceImpl(CallBase &CB) override;

  const bool IsDoingInference;
  std::unique_ptr<TrainingLogger> Logger;

  const std::optional<int32_t> InitialNativeSize;
  std::optional<int32_t> CurrentNativeSize;
};
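
// Editor's note on how the three modes above map onto the flags in this file,
// as implemented by getDevelopmentModeAdvisor at the bottom:
//
//   mode 1: only -training-log is set - a NoInferenceModelRunner gathers
//           features and advice comes from the default policy;
//   mode 2: both -training-log and -ml-inliner-model-under-training are
//           set - the model under training decides, and decisions are logged;
//   mode 3: only -ml-inliner-model-under-training is set - inference with no
//           logging.
//
// At least one of the two flags must be given; the constructor asserts
// IsDoingInference || isLogging().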

/// A variant of MLInlineAdvice that tracks all non-trivial inlining
/// decisions, for training/logging.
class LoggingMLInlineAdvice : public MLInlineAdvice {
public:
  LoggingMLInlineAdvice(DevelopmentModeMLInlineAdvisor *Advisor, CallBase &CB,
                        OptimizationRemarkEmitter &ORE, bool Recommendation,
                        TrainingLogger &Logger,
                        std::optional<size_t> CallerSizeEstimateBefore,
                        std::optional<size_t> CalleeSizeEstimateBefore,
                        bool DefaultDecision, bool Mandatory = false)
      : MLInlineAdvice(Advisor, CB, ORE, Recommendation), Logger(Logger),
        CallerSizeEstimateBefore(CallerSizeEstimateBefore),
        CalleeSizeEstimateBefore(CalleeSizeEstimateBefore),
        DefaultDecision(DefaultDecision), Mandatory(Mandatory) {}

  virtual ~LoggingMLInlineAdvice() = default;

private:
  DevelopmentModeMLInlineAdvisor *getAdvisor() const {
    return static_cast<DevelopmentModeMLInlineAdvisor *>(Advisor);
  }
  void recordInliningImpl() override {
    MLInlineAdvice::recordInliningImpl();
    getAdvisor()->resetNativeSize(Caller);
    int Reward = std::numeric_limits<int>::max();
    if (InlineSizeEstimatorAnalysis::isEvaluatorRequested() &&
        !getAdvisor()->isForcedToStop()) {
      int NativeSizeAfter = *getAdvisor()->getNativeSizeEstimate(*Caller) +
                            *CalleeSizeEstimateBefore;
      Reward = NativeSizeAfter -
               (*CallerSizeEstimateBefore + *CalleeSizeEstimateBefore);
      getAdvisor()->updateNativeSizeEstimate(Reward);
    }
    log(Reward, /*Success=*/true);
  }

  void recordInliningWithCalleeDeletedImpl() override {
    MLInlineAdvice::recordInliningWithCalleeDeletedImpl();
    getAdvisor()->resetNativeSize(Caller);
    if (InlineSizeEstimatorAnalysis::isEvaluatorRequested() &&
        !getAdvisor()->isForcedToStop()) {
      int NativeSizeAfter = *getAdvisor()->getNativeSizeEstimate(*Caller);
      int Reward = NativeSizeAfter -
                   (*CallerSizeEstimateBefore + *CalleeSizeEstimateBefore);
      getAdvisor()->updateNativeSizeEstimate(Reward);
      log(Reward, /*Success=*/true);
    } else {
      log(NoReward, /*Success=*/true);
    }
  }

  void recordUnsuccessfulInliningImpl(const InlineResult &Result) override {
    MLInlineAdvice::recordUnsuccessfulInliningImpl(Result);
    log(NoReward, /*Success=*/false);
  }

  void recordUnattemptedInliningImpl() override {
    MLInlineAdvice::recordUnattemptedInliningImpl();
    log(NoReward, /*Success=*/false);
  }

  void log(int64_t Reward, bool Success) {
    if (Mandatory)
      return;
    InlineEvent Event;
    Event.AdvisedDecision = isInliningRecommended();
    Event.DefaultDecision = DefaultDecision;
    Event.Effect = Success;
    Event.Reward = Reward;
    Logger.logInlineEvent(Event, getAdvisor()->getModelRunner());
  }

  static const int64_t NoReward = 0;
  TrainingLogger &Logger;
  const std::optional<size_t> CallerSizeEstimateBefore;
  const std::optional<size_t> CalleeSizeEstimateBefore;
  const int64_t DefaultDecision;
  const int64_t Mandatory;
};
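
// Editor's worked example (illustrative numbers): with the size estimator
// enabled, suppose the caller was estimated at 100 and the callee at 40
// before inlining, and the caller re-estimates at 120 afterwards with the
// callee deleted. recordInliningWithCalleeDeletedImpl then computes
// Reward = 120 - (100 + 40) = -20; a negative reward means the estimated
// total native size shrank.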

static const std::vector<TensorSpec> TrainingOnlyFeatures{
    TensorSpec::createSpec<float>(TFFeedPrefix + "discount", {1}),
    TensorSpec::createSpec<float>(TFFeedPrefix + "reward", {1}),
    TensorSpec::createSpec<int32_t>(TFFeedPrefix + "step_type", {1})};

static const std::vector<TensorSpec> getInputFeatures() {
  std::vector<TensorSpec> InputSpecs;
  for (size_t I = 0; I < NumberOfFeatures; ++I)
    InputSpecs.push_back(TensorSpec::createSpec<int64_t>(
        TFFeedPrefix + FeatureMap[I].name(), FeatureMap[I].shape()));
  append_range(InputSpecs, TrainingOnlyFeatures);
  return InputSpecs;
}

} // namespace

TrainingLogger::TrainingLogger(StringRef LogFileName,
                               const ModelUnderTrainingRunner *MUTR)
    : LogFileName(LogFileName), MUTR(MUTR) {
  // The first output is the inlining decision.
  std::vector<TensorSpec> FT(FeatureMap.begin(), FeatureMap.end());

  if (MUTR)
    append_range(FT, MUTR->extraOutputsForLoggingSpecs());

  DefaultDecisionPos = FT.size();
  FT.push_back(DefaultDecisionSpec);

  DecisionPos = FT.size();
  FT.push_back(InlineDecisionSpec);
  std::error_code EC;
  auto OS = std::make_unique<raw_fd_ostream>(TrainingLog, EC);
  if (EC)
    dbgs() << (EC.message() + ":" + TrainingLog);

  L = std::make_unique<Logger>(
      std::move(OS), FT, TensorSpec::createSpec<int64_t>(RewardName, {1}),
      InlineSizeEstimatorAnalysis::isEvaluatorRequested());
  L->switchContext("");
}

/// Log one inlining event.
void TrainingLogger::logInlineEvent(const InlineEvent &Event,
                                    const MLModelRunner &ModelRunner) {
  L->startObservation();
  size_t CurrentFeature = 0;
  for (; CurrentFeature < NumberOfFeatures; ++CurrentFeature)
    L->logTensorValue(CurrentFeature,
                      reinterpret_cast<const char *>(
                          ModelRunner.getTensorUntyped(CurrentFeature)));

  if (MUTR)
    for (size_t I = 0; I < MUTR->extraOutputsForLoggingSpecs().size(); ++I) {
      const char *RawData =
          reinterpret_cast<const char *>(MUTR->getUntypedExtraOutputValue(I));
      L->logTensorValue(CurrentFeature, RawData);
      ++CurrentFeature;
    }

  assert(CurrentFeature == DefaultDecisionPos);
  L->logTensorValue(DefaultDecisionPos,
                    reinterpret_cast<const char *>(&Event.DefaultDecision));
  L->logTensorValue(DecisionPos,
                    reinterpret_cast<const char *>(&Event.AdvisedDecision));
  L->endObservation();
  if (InlineSizeEstimatorAnalysis::isEvaluatorRequested())
    L->logReward(Event.Reward);

  // For debugging / later use.
  Effects.push_back(Event.Effect);
}

DevelopmentModeMLInlineAdvisor::DevelopmentModeMLInlineAdvisor(
    Module &M, ModuleAnalysisManager &MAM,
    std::unique_ptr<MLModelRunner> ModelRunner,
    std::function<bool(CallBase &)> GetDefaultAdvice,
    std::unique_ptr<TrainingLogger> Logger)
    : MLInlineAdvisor(M, MAM, std::move(ModelRunner), GetDefaultAdvice),
      IsDoingInference(isa<ModelUnderTrainingRunner>(getModelRunner())),
      Logger(std::move(Logger)),
      InitialNativeSize(isLogging() ? getTotalSizeEstimate() : 0),
      CurrentNativeSize(InitialNativeSize) {
  // We cannot have the case of neither inference nor logging.
  assert(IsDoingInference || isLogging());
}

std::optional<size_t>
DevelopmentModeMLInlineAdvisor::getNativeSizeEstimate(const Function &F) const {
  if (!InlineSizeEstimatorAnalysis::isEvaluatorRequested())
    return std::nullopt;
  auto &R =
      FAM.getResult<InlineSizeEstimatorAnalysis>(const_cast<Function &>(F));
  if (!R) {
    F.getParent()->getContext().emitError(
        "Native size estimator is not present.");
    return 0;
  }
  return *R;
}

std::unique_ptr<MLInlineAdvice>
DevelopmentModeMLInlineAdvisor::getMandatoryAdviceImpl(CallBase &CB) {
  return std::make_unique<LoggingMLInlineAdvice>(
      /*Advisor=*/this,
      /*CB=*/CB, /*ORE=*/getCallerORE(CB), /*Recommendation=*/true,
      /*Logger=*/*Logger,
      /*CallerSizeEstimateBefore=*/getNativeSizeEstimate(*CB.getCaller()),
      /*CalleeSizeEstimateBefore=*/
      getNativeSizeEstimate(*CB.getCalledFunction()),
      /*DefaultDecision=*/true, /*Mandatory=*/true);
}

std::unique_ptr<MLInlineAdvice>
DevelopmentModeMLInlineAdvisor::getAdviceFromModel(
    CallBase &CB, OptimizationRemarkEmitter &ORE) {
  if (IsDoingInference && !isLogging())
    return MLInlineAdvisor::getAdviceFromModel(CB, ORE);

  bool DefaultAdvice = GetDefaultAdvice(CB);
  auto Recommendation =
      IsDoingInference ? static_cast<bool>(ModelRunner->evaluate<int64_t>())
                       : DefaultAdvice;
  return std::make_unique<LoggingMLInlineAdvice>(
      /*Advisor=*/this,
      /*CB=*/CB, /*ORE=*/ORE, /*Recommendation=*/Recommendation,
      /*Logger=*/*Logger,
      /*CallerSizeEstimateBefore=*/getNativeSizeEstimate(*CB.getCaller()),
      /*CalleeSizeEstimateBefore=*/
      getNativeSizeEstimate(*CB.getCalledFunction()),
      /*DefaultDecision=*/DefaultAdvice);
}

size_t DevelopmentModeMLInlineAdvisor::getTotalSizeEstimate() {
  if (!InlineSizeEstimatorAnalysis::isEvaluatorRequested())
    return 0;
  size_t Ret = 0;
  for (auto &F : M) {
    if (F.isDeclaration())
      continue;
    Ret += *getNativeSizeEstimate(F);
  }
  return Ret;
}

std::unique_ptr<InlineAdvisor> llvm::getDevelopmentModeAdvisor(
    Module &M, ModuleAnalysisManager &MAM,
    std::function<bool(CallBase &)> GetDefaultAdvice) {
  auto &Ctx = M.getContext();
  std::unique_ptr<MLModelRunner> Runner;
  if (TFModelUnderTrainingPath.empty())
    Runner.reset(new NoInferenceModelRunner(Ctx, getInputFeatures()));
  else
    Runner = ModelUnderTrainingRunner::createAndEnsureValid(
        Ctx, TFModelUnderTrainingPath, DecisionName, getInputFeatures(),
        TFOutputSpecOverride);
  if (!Runner)
    return nullptr;
  std::unique_ptr<TrainingLogger> Logger;
  if (!TrainingLog.empty())
    Logger = std::make_unique<TrainingLogger>(
        TrainingLog, dyn_cast<ModelUnderTrainingRunner>(Runner.get()));

  return std::make_unique<DevelopmentModeMLInlineAdvisor>(
      M, MAM, std::move(Runner), GetDefaultAdvice, std::move(Logger));
}
#endif // defined(LLVM_HAVE_TFLITE)