runtime/onert/core/src/exec/train/TrainableExecutor.h


1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109

/*
 * Copyright (c) 2023 Samsung Electronics Co., Ltd. All Rights Reserved
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

#ifndef __ONERT_EXEC_TRAIN_TRAINABLE_EXECUTOR_H_
#define __ONERT_EXEC_TRAIN_TRAINABLE_EXECUTOR_H_

#include "exec/IExecutor.h"

#include "../ExecutionObservee.h"
#include "../../compiler/train/TensorRegistries.h"

#include "backend/train/TrainableBackendContext.h"
#include "compiler/train/TrainableCodeMap.h"
#include "compiler/train/LoweredTrainableGraph.h"
#include "ir/Index.h"
#include "util/TracingCtx.h"

namespace onert
{
namespace exec
{
namespace train
{

class TrainableExecutor : public IExecutor
{
public:
  /**
   * @brief Construct a new TrainableExecutor object
   * @param lowered_graph LoweredTrainableGraph object
   * @param tensor_builders Tensor builders that are currently used
   * @param code_map @c ir::Operation and its code map
   */
  TrainableExecutor(std::unique_ptr<compiler::train::LoweredTrainableGraph> lowered_graph,
                    backend::train::TrainableBackendContexts &&backend_contexts,
                    const compiler::train::TensorRegistries &tensor_regs,
                    compiler::train::TrainableCodeMap &&code_map,
                    const std::vector<ir::OperationIndex> &order,
                    const util::TracingCtx *tracing_ctx);

public:
  const ir::Graph &graph() const final { return _trainable_graph.graph(); }

  void execute(const IODescription &desc) override { forward(desc, false); };

  void execute(const std::vector<backend::IPortableTensor *> &inputs,
               const std::vector<backend::IPortableTensor *> &outputs) override;

  void forward(const IODescription &desc, bool training);
  void backward(const IODescription &desc, uint32_t training_step);

  // Used only in Dataflow and Parallel Executors
  void setIndexedRanks(std::shared_ptr<ir::OperationIndexMap<int64_t>> ranks) final
  {
    _indexed_ranks = std::move(ranks);
  };

  void addObserver(std::unique_ptr<IExecutionObserver> ref) { _subject.add(std::move(ref)); };

  const std::vector<backend::builtin::IOTensor *> &getInputTensors() const override
  {
    return _input_tensors;
  }

  const std::vector<backend::builtin::IOTensor *> &getOutputTensors() const override
  {
    return _output_tensors;
  }

  float getLoss(const ir::IOIndex &pred_io_ind) const;

  backend::train::TrainableBackendContexts &getBackendContexts() { return _backend_contexts; }

private:
  void forwardImpl(bool training);
  void backwardImpl(uint32_t training_step);

private:
  std::vector<compiler::train::TrainableCodeAndInfo> _code;
  ExecutionObservee _subject;
  std::shared_ptr<ir::OperationIndexMap<int64_t>> _indexed_ranks;
  std::unique_ptr<compiler::train::LoweredTrainableGraph> _lowered_graph;
  backend::train::TrainableBackendContexts _backend_contexts;
  const ir::train::TrainableGraph &_trainable_graph;
  compiler::train::TensorRegistries _tensor_regs;
  std::vector<backend::builtin::IOTensor *> _input_tensors;
  std::vector<backend::builtin::IOTensor *> _output_tensors;
  std::mutex _mutex;
  const util::TracingCtx *_tracing_ctx;
};

} // namespace train
} // namespace exec
} // namespace onert

#endif // __ONERT_EXEC_TRAIN_TRAINABLE_EXECUTOR_H_