diff options
Diffstat (limited to 'compute/ncnn/src/srcn/conv_sgemm_multithreads.h')
-rw-r--r-- | compute/ncnn/src/srcn/conv_sgemm_multithreads.h | 86 |
1 files changed, 86 insertions, 0 deletions
diff --git a/compute/ncnn/src/srcn/conv_sgemm_multithreads.h b/compute/ncnn/src/srcn/conv_sgemm_multithreads.h new file mode 100644 index 000000000..9c9ce7437 --- /dev/null +++ b/compute/ncnn/src/srcn/conv_sgemm_multithreads.h @@ -0,0 +1,86 @@ +/* + * Copyright (c) 2019 Samsung Electronics Co., Ltd. All Rights Reserved + * + * Licensed under the Apache License, Version 2.0 (the "License"); + * you may not use this file except in compliance with the License. + * You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +#ifndef __NNFW_SRCN_CONV_SGEMM_MULTITHREADS_H__ +#define __NNFW_SRCN_CONV_SGEMM_MULTITHREADS_H__ + +#include "ncnn/srcn/conv_type.h" +#include "common.h" + +namespace nnfw +{ +namespace srcn +{ + +class conv_sgemm_multithreads +{ +public: + conv_sgemm_multithreads(const convMat_t &in_mat, const convMat_t &weights_mat, convMat_t &out_mat, + const convParams_t &in_param, int num_threads, convType_t conv_type); + ~conv_sgemm_multithreads(); + + void run(); + +private: + void param_init(); + + void compute_rowmajor_colshard(); + void compute_rowmajor_rowshard(); + void compute_colmajor_colshard(); + void compute_colmajor_rowshard(); + + const convMat_t in_mat_; + const convMat_t weights_mat_; + convMat_t out_mat_; + const convParams_t in_param_; + convType_t conv_type_; + int num_threads_; + + int m_; + int n_; +#ifdef WITH_DPU + int np_; +#endif + int k_; + + int bm_; + int bn_; + int bk_; + + int rm_; + int rn_; + int rk_; + + int nm_; + int nn_; + int nk_; + + int mr_; + int nr_; + + int need_im2col_; + shardType_t shard_type_; + + float *prhs_buffer_; + float *plhs_buffer_; + + int error_; +}; + +} // namespace srcn +} // namespace nnfw + +#endif // __NNFW_SRCN_CONV_SGEMM_MULTITHREADS_H__ |