compiler/locomotiv/src/Node/DepthwiseFilterEncode.test.cpp


1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90

/*
 * Copyright (c) 2019 Samsung Electronics Co., Ltd. All Rights Reserved
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *    http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

#include "NodeExecution.h"

#include "locomotiv/NodeData.h"
#include "NodeDataImpl.h"
#include "NodeDomain.h"

#include <loco/IR/PermutingCodec.h>

#include <nncc/core/ADT/tensor/Shape.h>
#include <nncc/core/ADT/tensor/Buffer.h>
#include <nncc/core/ADT/tensor/LexicalLayout.h>
#include <nncc/core/ADT/tensor/IndexEnumerator.h>

#include <gtest/gtest.h>

using nncc::core::ADT::tensor::Index;
using nncc::core::ADT::tensor::Shape;
using nncc::core::ADT::tensor::LexicalLayout;
using nncc::core::ADT::tensor::make_buffer;
using nncc::core::ADT::tensor::IndexEnumerator;

TEST(NodeExecution_DepthwiseFilterEncode, f32)
{
  const uint32_t H = 2;
  const uint32_t W = 3;
  const uint32_t C = 4;
  const uint32_t M = 5;

  auto g = loco::make_graph();

  // Pull
  auto pull = g->nodes()->create<loco::Pull>();
  pull->dtype(loco::DataType::FLOAT32);

  // Make and assign "MHWC" data to pull node
  auto pull_buf = make_buffer<float, LexicalLayout>(Shape{M, H, W, C});
  float f = 1;
  for (IndexEnumerator e{pull_buf.shape()}; e.valid(); e.advance())
  {
    pull_buf.at(e.current()) = f;
    f += 0.1f; // Doesn't matter what it is
  }
  auto pull_data = locomotiv::make_data(pull_buf);
  locomotiv::annot_data(pull, std::move(pull_data));
  locomotiv::annot_domain(pull, loco::Domain::Tensor);

  // Encoder to correctly read input tensor as MHWC
  auto encoder = std::unique_ptr<loco::PermutingEncoder<loco::Domain::DepthwiseFilter>>(
      new loco::PermutingEncoder<loco::Domain::DepthwiseFilter>);
  encoder->perm()->axis(loco::DepthwiseFilterAxis::Multiplier) = 0;
  encoder->perm()->axis(loco::DepthwiseFilterAxis::Height) = 1;
  encoder->perm()->axis(loco::DepthwiseFilterAxis::Width) = 2;
  encoder->perm()->axis(loco::DepthwiseFilterAxis::Depth) = 3;

  // DepthwiseFilterEncode
  auto enc = g->nodes()->create<loco::DepthwiseFilterEncode>();
  enc->input(pull);
  enc->encoder(std::move(encoder));

  locomotiv::NodeExecution::get().run(enc);

  auto enc_data = locomotiv::annot_data(enc);
  ASSERT_NE(enc_data, nullptr);
  ASSERT_EQ(enc_data->dtype(), loco::DataType::FLOAT32);
  ASSERT_EQ(*(enc_data->shape()), (Shape{H, W, C, M})); // locomotiv depthwise filter is HWCM
  auto enc_buf = enc_data->as_f32_bufptr();
  for (uint32_t h = 0; h < H; ++h)
    for (uint32_t w = 0; w < W; ++w)
      for (uint32_t c = 0; c < C; ++c)
        for (uint32_t m = 0; m < M; ++m)
          ASSERT_FLOAT_EQ(pull_buf.at(Index{m, h, w, c}), enc_buf->at(Index{h, w, c, m}));

  ASSERT_EQ(locomotiv::annot_domain(enc), loco::Domain::DepthwiseFilter);
}