1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
|
/*
* Copyright (c) 2020 Samsung Electronics Co., Ltd. All Rights Reserved
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#include "IfLayer.h"
#include <backend/ITensor.h>
#include "exec/ExecutorBase.h"
#include <misc/polymorphic_downcast.h>
#include "PermuteLayer.h"
namespace onert
{
namespace backend
{
namespace controlflow
{
namespace kernel
{
// Constructs an If kernel that, at run time, selects and executes either the
// "then" or "else" subgraph based on the value of a condition tensor.
//
// @param cond_tensor            Condition tensor; its buffer is read as a bool in run()
// @param input_tensors          Tensors copied into the selected subgraph's inputs
// @param output_tensors         Tensors receiving the selected subgraph's outputs
// @param output_indices         Operand indices of this operation's outputs in @c graph
// @param graph                  Graph containing this If operation (used to check output usage)
// @param outputs_dyn_alloc_info Dynamic-allocation info for the output tensors
// @param then_subg_index        Subgraph executed when the condition is true
// @param else_subg_index        Subgraph executed when the condition is false
// @param executor_map           Map from subgraph index to executor; looked up lazily in run()
//
// NOTE(review): input_tensors/output_tensors are taken by value (const vector,
// no '&') — likely an accidental copy, but the signature must match IfLayer.h,
// so it cannot be changed here alone.
IfLayer::IfLayer(const std::shared_ptr<backend::ITensor> &cond_tensor,
                 const std::vector<std::shared_ptr<backend::ITensor>> input_tensors,
                 const std::vector<std::shared_ptr<backend::ITensor>> output_tensors,
                 const ir::OperandIndexSequence &output_indices, const ir::Graph &graph,
                 const exec::DynAllocInfoMap &outputs_dyn_alloc_info,
                 const ir::SubgraphIndex &then_subg_index, const ir::SubgraphIndex &else_subg_index,
                 exec::ExecutorMap *executor_map)
    : _cond_tensor{cond_tensor}, _input_tensors{input_tensors}, _output_tensors{output_tensors},
      _output_indices{output_indices}, _graph{graph},
      _outputs_dyn_alloc_info{outputs_dyn_alloc_info}, _then_subg_index{then_subg_index},
      _else_subg_index{else_subg_index}, _executor_map{executor_map}
{
  // At this point, executor_map may not have executors of then subg and else subg
}
void IfLayer::run()
{
// Check condition
// // If true
// // // Copy _input_tensors -> then subg's inputs
// // // Run then subg
// // // Copy outputs of then subg -> _output_tensors
// // Else
// // // Copy _input_tensors -> else subg's inputs if false
// // // Run else subg
// // // Copy outputs of else subg -> _output_tensors
auto getResultCond = [](backend::ITensor *tensor) -> bool {
bool ret = false;
tensor->access([&](ITensor &tensor) { ret = *reinterpret_cast<bool *>(tensor.buffer()); });
return ret;
};
exec::ExecutorBase *subg_exec = nullptr;
if (getResultCond(_cond_tensor.get()))
{
subg_exec = nnfw::misc::polymorphic_downcast<exec::ExecutorBase *>(
_executor_map->at(_then_subg_index).get());
}
else
{
subg_exec = nnfw::misc::polymorphic_downcast<exec::ExecutorBase *>(
_executor_map->at(_else_subg_index).get());
}
const auto &subg_graph = subg_exec->graph();
std::vector<std::shared_ptr<backend::ITensor>> src_tensors;
std::vector<std::shared_ptr<backend::ITensor>> dst_tensors;
// Add tensors used in subgraph or contained in outputs of subgraph
assert(subg_graph.getInputs().size() == _input_tensors.size());
assert(subg_graph.getInputs().size() == subg_exec->getInputTensors().size());
for (uint32_t i = 0; i < subg_graph.getInputs().size(); ++i)
{
const auto &subg_input_index = subg_graph.getInputs().at(i);
const auto &subg_input = subg_graph.operands().at(subg_input_index);
if (subg_input.getUses().size() > 0 || subg_graph.getOutputs().contains(subg_input_index))
{
src_tensors.emplace_back(_input_tensors.at(i));
dst_tensors.emplace_back(subg_exec->getInputTensors().at(i));
}
}
const auto &subg_inputs_dyn_alloc_info = subg_exec->getInputsDynamicAllocInfo();
const auto permute_op_input_to_subg_input =
std::make_shared<PermuteLayer>(src_tensors, dst_tensors, subg_inputs_dyn_alloc_info);
// Add tensors used as output of operation or contained in outputs of operation
src_tensors.clear();
dst_tensors.clear();
assert(_output_indices.size() == subg_exec->getOutputTensors().size());
assert(_output_indices.size() == _output_tensors.size());
for (uint32_t i = 0; i < _output_indices.size(); ++i)
{
const auto &output_index = _output_indices.at(i);
const auto &output = _graph.operands().at(output_index);
if (output.getUses().size() > 0 || _graph.getOutputs().contains(output_index))
{
src_tensors.emplace_back(subg_exec->getOutputTensors().at(i));
dst_tensors.emplace_back(_output_tensors.at(i));
}
}
const auto permute_subg_output_to_op_output =
std::make_shared<PermuteLayer>(src_tensors, dst_tensors, _outputs_dyn_alloc_info);
// Remove copying of unused tensor
permute_op_input_to_subg_input->prepare();
permute_subg_output_to_op_output->prepare();
// Copy & run
subg_exec->execute(_input_tensors, permute_op_input_to_subg_input);
permute_subg_output_to_op_output->run();
}
} // namespace kernel
} // namespace controlflow
} // namespace backend
} // namespace onert
|