Searched refs:tile_n (Results 1 – 4 of 4) sorted by relevance
/third_party/mindspore/mindspore/ccsrc/backend/kernel_compiler/cpu/nnacl/fp16/ |
D | conv_fp16.c | 27 const int tile_n = 16; in ConvFp16() local 29 const int tile_n = 12; in ConvFp16() 32 NNACL_CHECK_ZERO_RETURN(tile_n); in ConvFp16() 34 int block_per_thread = UP_DIV(UP_DIV(output_hw, tile_n), conv_param->thread_num_); in ConvFp16() 36 int start_hw = start_block * tile_n; in ConvFp16() 37 int end_hw = MSMIN(output_hw, (start_block + block_per_thread) * tile_n); in ConvFp16() 41 int out_stride = conv_param->output_channel_ * tile_n; in ConvFp16() 43 packed_input += task_id * deep * tile_n; in ConvFp16() 44 col_major_input += task_id * deep * tile_n; in ConvFp16() 45 size_t input_size = deep * tile_n * sizeof(float16_t); in ConvFp16() [all …]
|
/third_party/mindspore/mindspore/lite/test/ut/src/runtime/kernel/arm/common/ |
D | pack_tests.cc | 73 int tile_n = 8; in TEST_F() local 75 int output_tile_count = UP_DIV(output_count, tile_n); in TEST_F() 81 int packed_input_size = output_tile_count * tile_n * unit_size; in TEST_F() 90 int start_index = thread_id * tile_n; in TEST_F() 91 int real_cal_num = (output_count - start_index) < tile_n ? (output_count - tile_n) : tile_n; in TEST_F() 93 … reinterpret_cast<float *>(packed_input) + thread_id * unit_size * tile_n + gemm_in_batch_offset; in TEST_F() 136 int tile_n = 16; in TEST_F() local 138 int output_tile_count = UP_DIV(output_count, tile_n); in TEST_F() 144 int packed_input_size = output_tile_count * tile_n * unit_size; in TEST_F() 153 int start_index = thread_id * tile_n; in TEST_F() [all …]
|
/third_party/mindspore/mindspore/ccsrc/backend/kernel_compiler/cpu/nnacl/int8/ |
D | conv_int8.c | 24 int tile_n = conv_param->tile_num_; in ConvInt8() local 26 NNACL_CHECK_ZERO_RETURN(tile_n); in ConvInt8() 27 int output_tile_count = UP_DIV(output_count, tile_n); in ConvInt8() 46 input_sum_offset = tile_n * up_round_oc; in ConvInt8() 49 input_sum_offset = tile_n; in ConvInt8() 57 int start_index = thread_id * tile_n; in ConvInt8() 58 … int real_cal_num = (output_count - start_index) < tile_n ? (output_count - start_index) : tile_n; in ConvInt8() 60 int8_t *gemm_input = packed_input + task_id * unit_size * tile_n; in ConvInt8() 61 int8_t *matmul = matmul_input + task_id * kernel_plane * in_channel * tile_n; in ConvInt8() 62 …(matmul, conv_param->conv_quant_arg_.input_quant_args_[0].zp_, kernel_plane * in_channel * tile_n); in ConvInt8() [all …]
|
/third_party/mesa3d/src/gallium/drivers/freedreno/ |
D | freedreno_gmem.c | 289 int tile_n[npipes]; in gmem_stateobj_init() local 385 memset(tile_n, 0, sizeof(tile_n)); in gmem_stateobj_init() 409 tile->n = !is_a20x(screen) ? tile_n[p]++ in gmem_stateobj_init()
|