/external/gemmlowp/meta/ |
D | multi_thread_gemm.h | 29 std::uint8_t* PrepareGemmTask(const Params& params, int kernel_m, int kernel_n, in PrepareGemmTask() argument 53 task, kernel_m, kernel_n, kernel_k); in PrepareGemmTask() 58 int kernel_m, int kernel_n, int kernel_k, in PrepareGemmTasks() argument 81 params, kernel_m, kernel_n, kernel_k, scratch, i * m_chunk, m_chunk, in PrepareGemmTasks() 85 PrepareGemmTask<Executor, Params>(params, kernel_m, kernel_n, kernel_k, in PrepareGemmTasks() 92 params, kernel_m, kernel_n, kernel_k, scratch, 0, params.m, in PrepareGemmTasks() 96 PrepareGemmTask<Executor, Params>(params, kernel_m, kernel_n, kernel_k, in PrepareGemmTasks() 104 template <typename Executor, typename Params, int kernel_m, int kernel_n, 110 Gemm<Executor, Params, kernel_m, kernel_n, kernel_k>(params); in Run() 119 int kernel_m, int kernel_n, int kernel_k> [all …]
|
D | single_thread_gemm.h | 24 template <typename Executor, typename Params, int kernel_m, int kernel_n, 31 static int EstimateScratchSize(const P& params, int kernel_m, int kernel_n, in EstimateScratchSize() argument 35 params.left_stream, kernel_m, kernel_k); in EstimateScratchSize() 220 static int EstimateScratchSize(const P& params, int kernel_m, int kernel_n, in EstimateScratchSize() argument 222 const int lhs_chunks = ((params.m + kernel_m - 1) / kernel_m); in EstimateScratchSize() 226 params.left_stream, kernel_m, kernel_k); in EstimateScratchSize() 441 static int EstimateScratchSize(const P& params, int kernel_m, int kernel_n, in EstimateScratchSize() argument 490 static int EstimateScratchSize(const P& params, int kernel_m, int kernel_n, in EstimateScratchSize() argument 676 template <typename Executor, typename Params, int kernel_m, int kernel_n, 679 internal::Dispatch3DStage1<Executor, Params, kernel_m, kernel_n, kernel_k, [all …]
|
D | base.h | 101 typename OutputStream, int kernel_m, int kernel_n, int pack_size>
|
/external/gemmlowp/meta/generators/ |
D | quantized_mul_kernels_common.py | 53 def Prepare(self, emitter, registers, kernel_m, kernel_n, lhs, rhs): argument 58 lhs_offset = _ReadParams(emitter, registers, lhs, kernel_m, 4) 71 self.lhs_offsets = _Duplicate(emitter, registers, kernel_m, lhs_offset) 130 def Prepare(self, emitter, registers, kernel_m, kernel_n, lhs, rhs): argument 134 lhs_offset = _ReadParams(emitter, registers, lhs, kernel_m, 4) 136 self.lhs_offsets = _Duplicate(emitter, registers, kernel_m, lhs_offset) 162 def Prepare(self, emitter, registers, kernel_m, kernel_n, lhs, rhs): argument 166 lhs_offset = _ReadParams(emitter, registers, lhs, kernel_m, 4) 171 self.lhs_offsets = _Duplicate(emitter, registers, kernel_m, lhs_offset) 205 def Prepare(self, emitter, registers, kernel_m, unused_kernel_n, argument [all …]
|
D | common.py | 94 def SpecializeMulKernel(self, in_type, out_type, kernel_m, kernel_n, argument 98 in_type, out_type, self.kernel_name, self.output_stream_name, kernel_m, 111 self.EmitMultiply(in_type, out_type, kernel_m, kernel_n, pack_size)
|