diff options
Diffstat (limited to 'runtimes/libs/srcn/src/conv_winograd_batch.h')
-rw-r--r-- | runtimes/libs/srcn/src/conv_winograd_batch.h | 67 |
1 files changed, 67 insertions, 0 deletions
diff --git a/runtimes/libs/srcn/src/conv_winograd_batch.h b/runtimes/libs/srcn/src/conv_winograd_batch.h new file mode 100644 index 000000000..8cf4428bb --- /dev/null +++ b/runtimes/libs/srcn/src/conv_winograd_batch.h @@ -0,0 +1,67 @@ +/* + * Copyright (c) 2019 Samsung Electronics Co., Ltd. All Rights Reserved + * + * Licensed under the Apache License, Version 2.0 (the "License"); + * you may not use this file except in compliance with the License. + * You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +#ifndef __NNFW_SRCN_CONV_WINOGRAD_BATCH_H__ +#define __NNFW_SRCN_CONV_WINOGRAD_BATCH_H__ + +#include "srcn/conv_type.h" +#include "winograd.h" +#include "sgemm_singlethread.h" + +namespace nnfw +{ +namespace srcn +{ + +class conv_winograd_batch +{ +public: + conv_winograd_batch(const convMat_t &in_mat, convMat_t &out_mat, const convParams_t &in_param, + convType_t conv_type, const float *winograd_weight, int num_threads); + ~conv_winograd_batch(); + + void run(); + +private: + void param_init(); + void compute_sgemm(sgemmType_t major_type, sgemmTrans_t ltrans, sgemmTrans_t rtrans, const int m, + const int n, const int k, const float *lhs_data, const float *rhs_data, + float *res_data); + void winograd_input_im2col(float *col_buff); + void winograd_output_col2im(const float *col_buff); + void compute_winograd(); + + const convMat_t in_mat_; + convMat_t out_mat_; + const convParams_t in_param_; + convType_t conv_type_; + const float *winograd_weight_; + const int num_threads_; + + int tile_w_in_; + int tile_h_in_; + int tile_w_out_; + int tile_h_out_; + int ntiles_w_; + int ntiles_h_; + + int error_; +}; + +} // namespace srcn +} // namespace nnfw + +#endif // __NNFW_SRCN_CONV_WINOGRAD_BATCH_H__ |