plain/documentation/graph__resnet50_8cpp_source.xhtml

 /*
  * Copyright (c) 2017-2018 ARM Limited.
  *
  * SPDX-License-Identifier: MIT
  *
  * Permission is hereby granted, free of charge, to any person obtaining a copy
  * of this software and associated documentation files (the "Software"), to
  * deal in the Software without restriction, including without limitation the
  * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
  * sell copies of the Software, and to permit persons to whom the Software is
  * furnished to do so, subject to the following conditions:
  *
  * The above copyright notice and this permission notice shall be included in all
  * copies or substantial portions of the Software.
  *
  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
  * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
  * SOFTWARE.
  */
 #include "arm_compute/graph.h"
 #include "support/ToolchainSupport.h"
 #include "utils/GraphUtils.h"
 #include "utils/Utils.h"

 #include <cstdlib>

 using namespace arm_compute::utils;
 using namespace arm_compute::graph::frontend;
 using namespace arm_compute::graph_utils;

 /** Example that builds and runs a ResNet50 network using the graph stream frontend.
  *
  * Positional command-line arguments (all optional):
  *   [target] [path_to_data] [image] [labels] [fast_math_hint]
  */
 class GraphResNet50Example : public Example
 {
 public:
     /** Parses the command line, assembles the ResNet50 graph and finalizes it.
      *
      * @param[in] argc Number of command-line arguments
      * @param[in] argv Command-line arguments:
      *                 argv[1] target (0 NEON, 1 OpenCL, 2 OpenCL with Tuner; defaults to 0),
      *                 argv[2] path to the trainable data,
      *                 argv[3] input image,
      *                 argv[4] text file with labels,
      *                 argv[5] fast math hint (0 disables fast math, any other integer enables it)
      */
     void do_setup(int argc, char **argv) override
     {
         std::string data_path; /* Path to the trainable data */
         std::string image;     /* Image data */
         std::string label;     /* Label data */

         // Create a preprocessor object
         const std::array<float, 3> mean_rgb{ { 122.68f, 116.67f, 104.01f } };
         std::unique_ptr<IPreprocessor> preprocessor = arm_compute::support::cpp14::make_unique<CaffePreproccessor>(mean_rgb,
                                                                                                                    false /* Do not convert to BGR */);

         // Set target. 0 (NEON), 1 (OpenCL), 2 (OpenCL with Tuner). By default it is NEON
         const int    target         = argc > 1 ? static_cast<int>(std::strtol(argv[1], nullptr, 10)) : 0;
         Target       target_hint    = set_target_hint(target);
         FastMathHint fast_math_hint = FastMathHint::DISABLED;

         // Parse arguments: every missing trailing argument prints the remaining usage and falls back to a default
         if(argc < 2)
         {
             // Print help
             std::cout << "Usage: " << argv[0] << " [target] [path_to_data] [image] [labels] [fast_math_hint]\n\n";
             std::cout << "No data folder provided: using random values\n\n";
         }
         else if(argc == 2)
         {
             std::cout << "Usage: " << argv[0] << " " << argv[1] << " [path_to_data] [image] [labels] [fast_math_hint]\n\n";
             std::cout << "No data folder provided: using random values\n\n";
         }
         else if(argc == 3)
         {
             data_path = argv[2];
             std::cout << "Usage: " << argv[0] << " " << argv[1] << " " << argv[2] << " [image] [labels] [fast_math_hint]\n\n";
             std::cout << "No image provided: using random values\n\n";
         }
         else if(argc == 4)
         {
             data_path = argv[2];
             image     = argv[3];
             std::cout << "Usage: " << argv[0] << " " << argv[1] << " " << argv[2] << " " << argv[3] << " [labels] [fast_math_hint]\n\n";
             std::cout << "No text file with labels provided: skipping output accessor\n\n";
         }
         else if(argc == 5)
         {
             data_path = argv[2];
             image     = argv[3];
             label     = argv[4];
             std::cout << "Usage: " << argv[0] << " " << argv[1] << " " << argv[2] << " " << argv[3] << " " << argv[4] << " [fast_math_hint]\n\n";
             std::cout << "No fast math info provided: disabling fast math\n\n";
         }
         else
         {
             data_path = argv[2];
             image     = argv[3];
             label     = argv[4];
             // strtol only accepts base 0 or 2..36; parse the flag as a decimal integer
             fast_math_hint = (std::strtol(argv[5], nullptr, 10) == 0) ? FastMathHint::DISABLED : FastMathHint::ENABLED;
         }

         // Stem: 7x7 convolution (stride 2) + batch normalization + ReLU + 3x3 max pooling (stride 2)
         graph << target_hint
               << fast_math_hint
               << InputLayer(TensorDescriptor(TensorShape(224U, 224U, 3U, 1U), DataType::F32),
                             get_input_accessor(image, std::move(preprocessor), false /* Do not convert to BGR */))
               << ConvolutionLayer(
                   7U, 7U, 64U,
                   get_weights_accessor(data_path, "/cnn_data/resnet50_model/conv1_weights.npy"),
                   std::unique_ptr<arm_compute::graph::ITensorAccessor>(nullptr),
                   PadStrideInfo(2, 2, 3, 3))
               .set_name("conv1/convolution")
               << BatchNormalizationLayer(
                   get_weights_accessor(data_path, "/cnn_data/resnet50_model/conv1_BatchNorm_moving_mean.npy"),
                   get_weights_accessor(data_path, "/cnn_data/resnet50_model/conv1_BatchNorm_moving_variance.npy"),
                   get_weights_accessor(data_path, "/cnn_data/resnet50_model/conv1_BatchNorm_gamma.npy"),
                   get_weights_accessor(data_path, "/cnn_data/resnet50_model/conv1_BatchNorm_beta.npy"),
                   0.0000100099996416f)
               .set_name("conv1/BatchNorm")
               << ActivationLayer(ActivationLayerInfo(ActivationLayerInfo::ActivationFunction::RELU)).set_name("conv1/Relu")
               << PoolingLayer(PoolingLayerInfo(PoolingType::MAX, 3, PadStrideInfo(2, 2, 0, 1, 0, 1, DimensionRoundingType::FLOOR))).set_name("pool1/MaxPool");

         // Four residual blocks with 3, 4, 6 and 3 bottleneck units respectively
         add_residual_block(data_path, "block1", 64, 3, 2);
         add_residual_block(data_path, "block2", 128, 4, 2);
         add_residual_block(data_path, "block3", 256, 6, 2);
         add_residual_block(data_path, "block4", 512, 3, 1);

         // Head: average pooling, 1x1 convolution producing 1000 outputs, flatten and softmax
         graph << PoolingLayer(PoolingLayerInfo(PoolingType::AVG)).set_name("pool5")
               << ConvolutionLayer(
                   1U, 1U, 1000U,
                   get_weights_accessor(data_path, "/cnn_data/resnet50_model/logits_weights.npy"),
                   get_weights_accessor(data_path, "/cnn_data/resnet50_model/logits_biases.npy"),
                   PadStrideInfo(1, 1, 0, 0))
               .set_name("logits/convolution")
               << FlattenLayer().set_name("predictions/Reshape")
               << SoftmaxLayer().set_name("predictions/Softmax")
               << OutputLayer(get_output_accessor(label, 5));

         // Finalize graph; the tuner is only requested for target 2 (OpenCL with Tuner)
         GraphConfig config;
         config.use_tuner = (target == 2);
         graph.finalize(target_hint, config);
     }

     /** Runs the graph assembled by do_setup(). */
     void do_run() override
     {
         // Run graph
         graph.run();
     }

 private:
     Stream graph{ 0, "ResNet50" };

     /** Appends a residual block made of @p num_units bottleneck units to the graph.
      *
      * Every unit is a 1x1 -> 3x3 -> 1x1 convolution chain, each convolution followed by batch
      * normalization, that is added to a shortcut branch and then passed through a ReLU.
      *
      * The shortcut branch is:
      *  - first unit: a 1x1 convolution with batch normalization,
      *  - a later unit whose 3x3 convolution is strided: a 1x1 max pooling with the same stride,
      *  - otherwise: a sub-stream with no layers added.
      *
      * @param[in] data_path  Path to the trainable data, forwarded to get_weights_accessor()
      * @param[in] name       Block name, used to build both the weight file paths and the layer names
      * @param[in] base_depth Number of kernels of the first two convolutions; the last convolution and
      *                       the shortcut convolution use four times this value
      * @param[in] num_units  Number of bottleneck units to append
      * @param[in] stride     Stride of the 3x3 convolution in the last unit; all other units use stride 1
      */
     void add_residual_block(const std::string &data_path, const std::string &name, unsigned int base_depth, unsigned int num_units, unsigned int stride)
     {
         for(unsigned int i = 0; i < num_units; ++i)
         {
             // Weight files are addressed with '_' separators, layer names with '/' separators; units are 1-based
             std::stringstream unit_path_ss;
             unit_path_ss << "/cnn_data/resnet50_model/" << name << "_unit_" << (i + 1) << "_bottleneck_v1_";
             std::stringstream unit_name_ss;
             unit_name_ss << name << "/unit" << (i + 1) << "/bottleneck_v1/";

             std::string unit_path = unit_path_ss.str();
             std::string unit_name = unit_name_ss.str();

             // Only the last unit of the block applies the requested stride
             unsigned int middle_stride = 1;

             if(i == (num_units - 1))
             {
                 middle_stride = stride;
             }

             // Residual branch: conv1 (1x1) -> conv2 (3x3, possibly strided) -> conv3 (1x1)
             SubStream right(graph);
             right << ConvolutionLayer(
                       1U, 1U, base_depth,
                       get_weights_accessor(data_path, unit_path + "conv1_weights.npy"),
                       std::unique_ptr<arm_compute::graph::ITensorAccessor>(nullptr),
                       PadStrideInfo(1, 1, 0, 0))
                   .set_name(unit_name + "conv1/convolution")
                   << BatchNormalizationLayer(
                       get_weights_accessor(data_path, unit_path + "conv1_BatchNorm_moving_mean.npy"),
                       get_weights_accessor(data_path, unit_path + "conv1_BatchNorm_moving_variance.npy"),
                       get_weights_accessor(data_path, unit_path + "conv1_BatchNorm_gamma.npy"),
                       get_weights_accessor(data_path, unit_path + "conv1_BatchNorm_beta.npy"),
                       0.0000100099996416f)
                   .set_name(unit_name + "conv1/BatchNorm")
                   << ActivationLayer(ActivationLayerInfo(ActivationLayerInfo::ActivationFunction::RELU)).set_name(unit_name + "conv1/Relu")

                   << ConvolutionLayer(
                       3U, 3U, base_depth,
                       get_weights_accessor(data_path, unit_path + "conv2_weights.npy"),
                       std::unique_ptr<arm_compute::graph::ITensorAccessor>(nullptr),
                       PadStrideInfo(middle_stride, middle_stride, 1, 1))
                   .set_name(unit_name + "conv2/convolution")
                   << BatchNormalizationLayer(
                       get_weights_accessor(data_path, unit_path + "conv2_BatchNorm_moving_mean.npy"),
                       get_weights_accessor(data_path, unit_path + "conv2_BatchNorm_moving_variance.npy"),
                       get_weights_accessor(data_path, unit_path + "conv2_BatchNorm_gamma.npy"),
                       get_weights_accessor(data_path, unit_path + "conv2_BatchNorm_beta.npy"),
                       0.0000100099996416f)
                   .set_name(unit_name + "conv2/BatchNorm")
                   // Named after conv2 so the node does not share its name with the conv1 activation
                   << ActivationLayer(ActivationLayerInfo(ActivationLayerInfo::ActivationFunction::RELU)).set_name(unit_name + "conv2/Relu")

                   << ConvolutionLayer(
                       1U, 1U, base_depth * 4,
                       get_weights_accessor(data_path, unit_path + "conv3_weights.npy"),
                       std::unique_ptr<arm_compute::graph::ITensorAccessor>(nullptr),
                       PadStrideInfo(1, 1, 0, 0))
                   .set_name(unit_name + "conv3/convolution")
                   << BatchNormalizationLayer(
                       get_weights_accessor(data_path, unit_path + "conv3_BatchNorm_moving_mean.npy"),
                       get_weights_accessor(data_path, unit_path + "conv3_BatchNorm_moving_variance.npy"),
                       get_weights_accessor(data_path, unit_path + "conv3_BatchNorm_gamma.npy"),
                       get_weights_accessor(data_path, unit_path + "conv3_BatchNorm_beta.npy"),
                       0.0000100099996416f)
                   // Named after conv3 so the node does not share its name with the conv2 batch normalization
                   .set_name(unit_name + "conv3/BatchNorm");

             if(i == 0)
             {
                 // First unit: 1x1 convolution shortcut producing base_depth * 4 feature maps.
                 // NOTE(review): this shortcut always uses stride 1, while the residual branch uses `stride`
                 // when num_units == 1 and stride > 1; no caller in this file hits that case - confirm before reuse.
                 SubStream left(graph);
                 left << ConvolutionLayer(
                          1U, 1U, base_depth * 4,
                          get_weights_accessor(data_path, unit_path + "shortcut_weights.npy"),
                          std::unique_ptr<arm_compute::graph::ITensorAccessor>(nullptr),
                          PadStrideInfo(1, 1, 0, 0))
                      .set_name(unit_name + "shortcut/convolution")
                      << BatchNormalizationLayer(
                          get_weights_accessor(data_path, unit_path + "shortcut_BatchNorm_moving_mean.npy"),
                          get_weights_accessor(data_path, unit_path + "shortcut_BatchNorm_moving_variance.npy"),
                          get_weights_accessor(data_path, unit_path + "shortcut_BatchNorm_gamma.npy"),
                          get_weights_accessor(data_path, unit_path + "shortcut_BatchNorm_beta.npy"),
                          0.0000100099996416f)
                      .set_name(unit_name + "shortcut/BatchNorm");

                 graph << BranchLayer(BranchMergeMethod::ADD, std::move(left), std::move(right)).set_name(unit_name + "add");
             }
             else if(middle_stride > 1)
             {
                 // Strided unit: the shortcut is a 1x1 max pooling using the same stride as the 3x3 convolution
                 SubStream left(graph);
                 left << PoolingLayer(PoolingLayerInfo(PoolingType::MAX, 1, PadStrideInfo(middle_stride, middle_stride, 0, 0), true)).set_name(unit_name + "shortcut/MaxPool");

                 graph << BranchLayer(BranchMergeMethod::ADD, std::move(left), std::move(right)).set_name(unit_name + "add");
             }
             else
             {
                 // Remaining units: no layers are added to the shortcut sub-stream
                 SubStream left(graph);
                 graph << BranchLayer(BranchMergeMethod::ADD, std::move(left), std::move(right)).set_name(unit_name + "add");
             }

             graph << ActivationLayer(ActivationLayerInfo(ActivationLayerInfo::ActivationFunction::RELU)).set_name(unit_name + "Relu");
         }
     }
 };

 /** Main program for ResNet50
  *
  * @param[in] argc Number of arguments
  * @param[in] argv Arguments, forwarded unchanged to the example runner
  *
  * @return The value returned by arm_compute::utils::run_example()
  */
 int main(int argc, char **argv)
 {
     const int exit_status = arm_compute::utils::run_example<GraphResNet50Example>(argc, argv);
     return exit_status;
 }
arm_compute::graph::frontend::BranchLayer
Branch Layer.
Definition: Layers.h:435

arm_compute::graph::frontend::PoolingLayer
Pooling Layer.
Definition: Layers.h:336

arm_compute::graph_utils::set_target_hint
graph::Target set_target_hint(int target)
Utility function to return the TargetHint.
Definition: GraphUtils.h:370

arm_compute::graph::frontend::SubStream
Sub stream class.
Definition: SubStream.h:47

ToolchainSupport.h

arm_compute::ActivationLayerInfo::ActivationFunction::RELU
Rectifier ( \( f(x) = \max(0, x) \) )

arm_compute::graph_utils::get_output_accessor
std::unique_ptr< graph::ITensorAccessor > get_output_accessor(const std::string &labels_path, size_t top_n=5, std::ostream &output_stream=std::cout)
Generates appropriate output accessor according to the specified labels_path.
Definition: GraphUtils.h:330

Utils.h

arm_compute::DimensionRoundingType::FLOOR
Floor rounding.

arm_compute::Format::F32
1 channel, 1 F32 per channel

main
int main(int argc, char **argv)
Main program for ResNet50.
Definition: graph_resnet50.cpp:257

arm_compute::graph::frontend::InputLayer
Input Layer.
Definition: Layers.h:45

GraphUtils.h

graph.h

arm_compute::utils::Example
Abstract Example class.
Definition: Utils.h:62

arm_compute::graph_utils::get_input_accessor
std::unique_ptr< graph::ITensorAccessor > get_input_accessor(const std::string &ppm_path, std::unique_ptr< IPreprocessor > preprocessor=nullptr, bool bgr=true)
Generates appropriate input accessor according to the specified ppm_path.
Definition: GraphUtils.h:299

arm_compute::FixedPointOp::ADD
Addition.

arm_compute::graph::frontend::ActivationLayer
Activation Layer.
Definition: Layers.h:94

arm_compute::graph::Target
Target
Definition: Types.h:84

arm_compute::graph::frontend::ConvolutionLayer
Convolution Layer.
Definition: Layers.h:158

arm_compute::graph::FastMathHint
FastMathHint
Enable or disable fast math for Convolution layer.
Definition: Types.h:118

arm_compute::utils
Definition: Cast.h:31

arm_compute::graph_utils
Definition: GraphUtils.h:41

arm_compute::graph::frontend::SoftmaxLayer
Softmax Layer.
Definition: Layers.h:411

arm_compute::PoolingType::AVG
Average Pooling.

arm_compute::graph::frontend::OutputLayer
Output Layer.
Definition: Layers.h:70

arm_compute::graph_utils::get_weights_accessor
std::unique_ptr< graph::ITensorAccessor > get_weights_accessor(const std::string &path, const std::string &data_file, DataLayout file_layout=DataLayout::NCHW)
Generates appropriate weights accessor according to the specified path.
Definition: GraphUtils.h:275

arm_compute::graph::frontend::Stream
Stream frontend class to construct simple graphs in a stream fashion.
Definition: Stream.h:45

arm_compute::graph::frontend
Definition: ILayer.h:31

arm_compute::graph::frontend::BatchNormalizationLayer
Batchnormalization Layer.
Definition: Layers.h:118

arm_compute::NonLinearFilterFunction::MAX
Non linear dilate.

arm_compute::graph::frontend::FlattenLayer
Flatten Layer.
Definition: Layers.h:264

arm_compute::graph::frontend::ILayer::set_name
ILayer & set_name(std::string name)
Sets the name of the layer.
Definition: ILayer.h:55