Searched refs:col_block (Results 1 – 3 of 3) sorted by relevance
/third_party/mindspore/mindspore/ccsrc/backend/kernel_compiler/cpu/nnacl/fp32/ |
D | matmul_fp32.c | 668 int col_block = C4NUM; in RowMajor2Col32Major() local 669 for (int i = 0; i < col_block_num; i += col_block) { in RowMajor2Col32Major() 670 col_block = MSMIN(C4NUM, col_block_num - i); // max_tile = 4 in RowMajor2Col32Major() 672 int col_remainder = MSMIN(C8NUM * col_block, col - i * C8NUM); in RowMajor2Col32Major() 678 dst_ptr += col_block * C8NUM; in RowMajor2Col32Major() 1075 int col_block = C32NUM; in MatVecMulAvxFp32() local 1085 for (int col_index = 0; col_index < cur_col; col_index += col_block) { in MatVecMulAvxFp32() 1086 col_block = cur_col - col_index < col_block ? cur_col - col_index : col_block; in MatVecMulAvxFp32() 1087 …kernel[(col_block >> 3) - 1](c + col_index, a, b + col_index * depth, bias_data, act_flag, 1, col_… in MatVecMulAvxFp32() 1090 bias_data += col_block; in MatVecMulAvxFp32() [all …]
|
D | matmul_fp32.h | 86 size_t row_block, size_t col_block, size_t col_algin, size_t deep); 90 size_t row_block, size_t col_block, size_t col_algin, size_t deep); 92 size_t row_block, size_t col_block, size_t col_algin, size_t deep); 94 size_t row_block, size_t col_block, size_t col_algin, size_t deep); 96 size_t row_block, size_t col_block, size_t col_algin, size_t deep); 101 size_t row_block, size_t col_block, size_t col_algin, size_t deep);
|
/third_party/mindspore/mindspore/ccsrc/backend/kernel_compiler/cpu/nnacl/intrinsics/avx/ |
D | DeconvMatMulAvx.c | 144 int col_block = UP_DIV(col / plane, C8NUM); in DeconvMatmulAvx() local 146 for (int col_tmp = 0; col_tmp < col_block; col_tmp += col_num) { in DeconvMatmulAvx() 147 col_num = MSMIN(C3NUM, col_block - col_tmp); in DeconvMatmulAvx()
|