summaryrefslogtreecommitdiff
path: root/runtimes/neurun/src/kernel/acl_cl/TensorConvertToCommonLayer.cc
blob: 985524bc3f5dfd9a42557abc56cf5b5a837df9c1 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
/*
 * Copyright (c) 2018 Samsung Electronics Co., Ltd. All Rights Reserved
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

//
// THIS FILE IS UNUSED BUT LEFT FOR FUTURE REFERNCE
//

#if 0

#include "TensorConvertToCommonLayer.h"

#include "backend/acl_cl/feature/View.h"
#include "internal/nnapi/feature/View.h"

#include <util/feature/IndexIterator.h>
#include <arm_compute/runtime/CL/CLScheduler.h>

namespace neurun
{
namespace kernel
{
namespace acl_cl
{

bool TensorConvertToCommonLayer::convert()
{
  auto outputBuffer = _outputTensor->buffer();
  auto outputSize = _outputTensor->info()->total_size();

  auto &queue = ::arm_compute::CLScheduler::get().queue();

  _inputTensor->map(queue);

  if (_tensorShape.rank() == 2)
  {
    const auto len = _tensorShape.dim(1);

    auto base = reinterpret_cast<float *>(outputBuffer);

    for (int32_t n = 0; n < len; ++n)
    {
      auto from = reinterpret_cast<const float *>(
          _inputTensor->ptr_to_element(::arm_compute::Coordinates{n}));
      auto into = base + n;

      *into = *from;
    }
  }
  else if (_tensorShape.rank() == 4)
  {
    auto featureShape = _tensorShape.asFeature();

    const ::internal::arm_compute::feature::View<float> from{_inputTensor};
    ::internal::nnapi::feature::View<float> into{featureShape, outputBuffer, outputSize};

    ::nnfw::util::feature::iterate(featureShape)
        << [&](uint32_t batch, uint32_t ch, uint32_t row, uint32_t col) {
             const auto value = from.at(batch, ch, row, col);
             into.at(batch, ch, row, col) = value;
           };
  }

  _inputTensor->unmap(queue);
}

void TensorConvertToCommonLayer::configure(::arm_compute::ICLTensor *inputTensor,
                                           ::internal::common::Tensor *outputTensor,
                                           const ::neurun::graph::operand::Shape &tensorShape)
{
  _inputTensor = inputTensor;
  _outputTensor = outputTensor;
  _tensorShape = tensorShape;
}

void TensorConvertToCommonLayer::run() { convert(); }

} // namespace acl_cl
} // namespace kernel
} // namespace neurun

#endif