summaryrefslogtreecommitdiff
path: root/runtime/onert/core/src/exec/feature/nchw/Reader.h
blob: d5e3cb97cef73cbc670579d7f9c283397b0bda01 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
/*
 * Copyright (c) 2019 Samsung Electronics Co., Ltd. All Rights Reserved
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

#ifndef __ONERT_EXEC_FEATURE_NCHW_READER_H__
#define __ONERT_EXEC_FEATURE_NCHW_READER_H__

#include "../Reader.h"

#include <cassert>

#include "backend/ITensor.h"
#include "ir/Shape.h"

namespace onert
{
namespace exec
{
namespace feature
{
namespace nchw
{

template <typename T> class Reader : public feature::Reader<T>
{
public:
  using Strides = ir::FeatureShape;
  // Construct for buffer and strides
  Reader(const ir::FeatureShape &shape, const Strides &strides, const T *ptr, size_t len)
    : _shape{shape}, _strides{strides}, _ptr{reinterpret_cast<const uint8_t *>(ptr)}, _len{len}
  {
    UNUSED_RELEASE(len); // Workaround for unused variable in release mode
    assert(len == static_cast<size_t>(strides.N != 0
                                        ? shape.N * strides.N
                                        : strides.C != 0 ? shape.C * strides.C
                                                         : strides.H != 0 ? shape.H * strides.H
                                                                          : shape.W * strides.W));
  }

  // Construct for backend tensor
  Reader(backend::ITensor *tensor)
    : _ptr{tensor->buffer() + tensor->calcOffset({0, 0, 0, 0})}, _len{tensor->total_size()}
  {
    assert(tensor->layout() == ir::Layout::NCHW);

    const auto start_offset = tensor->calcOffset({0, 0, 0, 0});
    auto shape = tensor->getShape();
    _strides.W = shape.dim(3) == 1 ? 0 : tensor->calcOffset({0, 0, 0, 1}) - start_offset;
    _strides.H = shape.dim(2) == 1 ? 0 : tensor->calcOffset({0, 0, 1, 0}) - start_offset;
    _strides.C = shape.dim(1) == 1 ? 0 : tensor->calcOffset({0, 1, 0, 0}) - start_offset;
    _strides.N = shape.dim(0) == 1 ? 0 : tensor->calcOffset({1, 0, 0, 0}) - start_offset;

    _shape.W = shape.dim(3);
    _shape.H = shape.dim(2);
    _shape.C = shape.dim(1);
    _shape.N = shape.dim(0);
  }

public:
  T at(uint32_t batch, uint32_t ch, uint32_t row, uint32_t col) const final
  {
    return getRef(batch, ch, row, col);
  }
  T at(uint32_t ch, uint32_t row, uint32_t col) const final { return getRef(0, ch, row, col); }

protected:
  const T &getRef(uint32_t batch, uint32_t ch, uint32_t row, uint32_t col) const
  {
    const auto offset = feature_index_to_byte_offset(batch, ch, row, col);

    const T *ptr = reinterpret_cast<const T *>(_ptr + offset);

    return *ptr;
  }

private:
  size_t feature_index_to_byte_offset(uint32_t batch, uint32_t ch, uint32_t row, uint32_t col) const
  {
    assert(1u * _shape.N > batch); // shape.N > batch
    assert(1u * _shape.C > ch);    // shape.C > ch
    assert(1u * _shape.H > row);   // shape.H > row
    assert(1u * _shape.W > col);   // shape.W > col

    uint32_t res = 0;
    res += batch * _strides.N;
    res += ch * _strides.C;
    res += row * _strides.H;
    res += col * _strides.W;

    return res;
  }

private:
  // TODO Remove _shape
  ir::FeatureShape _shape;
  Strides _strides;
  const uint8_t *_ptr;
  size_t _len;
};

} // namespace nchw
} // namespace feature
} // namespace exec
} // namespace onert

#endif // __ONERT_EXEC_FEATURE_NCHW_READER_H__