summaryrefslogtreecommitdiff
path: root/runtimes/neurun/src/backend/acl_cl/Swizzle.h
blob: 838e57162c801580596d936089d2bfbf3bde290d (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
/*
 * Copyright (c) 2018 Samsung Electronics Co., Ltd. All Rights Reserved
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *    http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

#ifndef __NEURUN_BACKEND_ACL_CL_SWIZZLE_H__
#define __NEURUN_BACKEND_ACL_CL_SWIZZLE_H__

#include <cassert>
#include <cstddef>
#include <cstdint>

namespace neurun
{
namespace backend
{
namespace acl_cl
{

class ARMComputeAxis
{
public:
  ARMComputeAxis() = default;

public:
  explicit ARMComputeAxis(uint32_t value) : _value{value}
  {
    // DO NOTHING
  }

public:
  uint32_t value(void) const { return _value; }

private:
  uint32_t _value;
};

// Convert T/F Lite / NNAPI axis (based on ...NHWC) to ARMCompute axis (WHCN...)
inline ARMComputeAxis ToARMComputeAxis(uint32_t rank, uint32_t axis)
{
  assert(rank > axis);
  const ARMComputeAxis reversed{(rank - axis) - 1};

  if (rank < 4)
  {
    return reversed;
  }

  // DEPTH
  if (0 == reversed.value())
  {
    return ARMComputeAxis{2};
  }
  // WIDTH
  if (1 == reversed.value())
  {
    return ARMComputeAxis{0};
  }
  // HEIGHT
  if (2 == reversed.value())
  {
    return ARMComputeAxis{1};
  }

  // ELSE
  return reversed;
}

template <typename T> inline T ReorderBits(T in, size_t numOfBits)
{
  assert(numOfBits > 0);
  T out = 0;
  for (int32_t i = numOfBits - 1; i >= 0; --i)
  {
    const uint32_t toShift = numOfBits - ToARMComputeAxis(numOfBits, i).value() - 1;
    out += ((in & 1) << toShift);
    in >>= 1;
  }
  return out;
}

} // namespace acl_cl
} // namespace backend
} // namespace neurun

#endif // __NEURUN_BACKEND_ACL_CL_SWIZZLE_H__