/third_party/mindspore/mindspore/lite/src/runtime/kernel/arm/fp32/ |
D | convolution_slidewindow_fp32.cc | 47 int oc_block_num = UP_DIV(output_channel, oc_tile_); in Init() local 48 int pack_weight_size = oc_block_num * oc_tile_ * input_channel * kernel_plane; in Init() 142 int oc_block_num = UP_DIV(out_channel, oc_tile_); in InitTmpBuffer() local 146 oc_block_num * oc_tile_ * sizeof(float))); in InitTmpBuffer() 194 int oc_block_num = UP_DIV(output_channel, oc_tile_); in PackWeight() local 197 PackNHWCToNXHWCXFp32(kernel_h, kernel_w, output_channel, oc_block_num, input_channel, in PackWeight() 210 int oc_block_num = UP_DIV(output_channel, oc_tile_); in MallocWeightBiasData() local 211 int pack_weight_size = oc_block_num * oc_tile_ * input_channel * kernel_plane; in MallocWeightBiasData() 222 bias_data_ = malloc(oc_block_num * oc_tile_ * sizeof(float)); in MallocWeightBiasData() 227 memset(bias_data_, 0, oc_block_num * oc_tile_ * sizeof(float)); in MallocWeightBiasData()
|
D | adder_fp32.cc | 78 int oc_block_num = UP_DIV(out_channel, C4NUM); in InitWeightBias() local 79 int pack_weight_size = oc_block_num * oc_block * in_channel * kernel_plane; in InitWeightBias() 91 CHECK_LESS_RETURN(MAX_MALLOC_SIZE, oc_block_num * oc_block * sizeof(float)); in InitWeightBias() 92 bias_data_ = reinterpret_cast<float *>(malloc(oc_block_num * oc_block * sizeof(float))); in InitWeightBias() 97 memset(bias_data_, 0, oc_block_num * oc_block * sizeof(float)); in InitWeightBias()
|
D | convolution_fp32.cc | 85 size_t oc_block_num = UP_ROUND(out_channel, OC_BLOCK); in Init() local 87 size_t pack_weight_size = oc_block_num * in_channel * kernel_plane; in Init() 207 size_t oc_block_num = UP_ROUND(out_channel, OC_BLOCK); in MallocWeightBiasData() local 209 size_t pack_weight_size = oc_block_num * in_channel * kernel_plane; in MallocWeightBiasData() 220 bias_data_ = malloc(oc_block_num * sizeof(float)); in MallocWeightBiasData() 226 memset(bias_data_, 0, oc_block_num * sizeof(float)); in MallocWeightBiasData()
|
D | matmul_fp32_base.cc | 421 int oc_block_num = UP_DIV(out_channel, col_tile_); in InitTmpOutBuffer() local 424 params_->batch * params_->row_ * oc_block_num * col_tile_ * static_cast<int>(sizeof(float)))); in InitTmpOutBuffer()
|
D | lstm_fp32.cc | 311 int oc_block_num = UP_DIV(out_channel, state_col_tile_); in MallocRunBuffer() local 314 …ms_context_->allocator->Malloc(lstm_param_->batch_ * oc_block_num * state_col_tile_ * sizeof(float… in MallocRunBuffer()
|
/third_party/mindspore/mindspore/lite/src/runtime/kernel/arm/fp16/ |
D | convolution_winograd_fp16.cc | 41 int oc_block_num = UP_DIV(out_channel, col_tile_); in MallocWeightBiasData() local 43 …auto trans_matrix_data_size = input_unit_ * input_unit_ * in_channel * oc_block_num * col_tile_ * … in MallocWeightBiasData() 71 bias_data_ = malloc(oc_block_num * col_tile_ * sizeof(float16_t)); in MallocWeightBiasData() 77 memset(bias_data_, 0, oc_block_num * col_tile_ * sizeof(float16_t)); in MallocWeightBiasData() 155 int oc_block_num = UP_DIV(out_channel, col_tile_); in Init() local 156 …auto trans_matrix_data_size = input_unit_ * input_unit_ * in_channel * oc_block_num * col_tile_ * … in Init()
|
/third_party/mindspore/mindspore/lite/micro/coder/opcoders/nnacl/fp32/ |
D | convolution_fp32_coder.cc | 70 int oc_block_num = UP_ROUND(out_channel, oc_block); in InitWeightBias() local 71 int pack_weight_size = oc_block_num * in_channel * kernel_plane; in InitWeightBias() 95 auto bias_data_size = static_cast<size_t>(oc_block_num * sizeof(float)); in InitWeightBias()
|
D | convolution_winograd_fp32_coder.cc | 131 int oc_block_num = UP_DIV(out_channel, C8NUM); in InitWeightBias() local 133 int trans_matrix_data_size = input_unit_ * input_unit_ * in_channel * oc_block_num * oc_block; in InitWeightBias()
|
/third_party/mindspore/mindspore/ccsrc/backend/kernel_compiler/cpu/nnacl/fp32/ |
D | pack_fp32.c | 162 void PackNHWCToNXHWCXFp32(int kernel_h, int kernel_w, int output_channel, int oc_block_num, int inp… in PackNHWCToNXHWCXFp32() argument 171 if (oc_block8 != oc_block_num) { in PackNHWCToNXHWCXFp32() 173 oc_remainder_step = (oc_block_num - oc_block8) * C8NUM; in PackNHWCToNXHWCXFp32() 234 void SWPackNHWCToNXHWCXFp32(int kernel_h, int kernel_w, int output_channel, int oc_block_num, int i… in SWPackNHWCToNXHWCXFp32() argument 238 for (int i = 0; i < oc_block_num; i += oc_block) { in SWPackNHWCToNXHWCXFp32() 239 oc_block = MSMIN(C4NUM, oc_block_num - i); // max_tile = 4 in SWPackNHWCToNXHWCXFp32() 433 int oc_block_num = UP_DIV(channel, C8NUM); in PackNHWCToCXHWNXFp32() local 435 for (int i = 0, oc_block = 0; i < oc_block_num; i += oc_block) { in PackNHWCToCXHWNXFp32() 436 oc_block = MSMIN(C3NUM, oc_block_num - i); in PackNHWCToCXHWNXFp32() 483 int oc_block_num = UP_DIV(channel, C8NUM); in PackNHWCToCXHWNXFp32() [all …]
|
D | pack_fp32.h | 64 void PackNHWCToNXHWCXFp32(int kernel_h, int kernel_w, int output_channel, int oc_block_num, int inp… 67 void SWPackNHWCToNXHWCXFp32(int kernel_h, int kernel_w, int output_channel, int oc_block_num, int i…
|
/third_party/mindspore/mindspore/ccsrc/backend/kernel_compiler/cpu/nnacl/base/ |
D | minimal_filtering_generator.c | 261 int oc_block_num = UP_DIV(batch, oc_block); in WinogradWeightTransform() local 263 int block_num_stride = block_stride * oc_block_num; in WinogradWeightTransform()
|
/third_party/mindspore/mindspore/ccsrc/backend/kernel_compiler/cpu/nnacl/fp16/ |
D | winograd_transform_fp16.c | 211 int oc_block_num = UP_DIV(filter_batch, oc_block); in WinogradWeightTransformFp16() local 213 int block_num_stride = block_stride * oc_block_num; in WinogradWeightTransformFp16()
|