Home
last modified time | relevance | path

Searched refs:kernel_m (Results 1 – 5 of 5) sorted by relevance

/external/gemmlowp/meta/
Dmulti_thread_gemm.h29 std::uint8_t* PrepareGemmTask(const Params& params, int kernel_m, int kernel_n, in PrepareGemmTask() argument
53 task, kernel_m, kernel_n, kernel_k); in PrepareGemmTask()
58 int kernel_m, int kernel_n, int kernel_k, in PrepareGemmTasks() argument
81 params, kernel_m, kernel_n, kernel_k, scratch, i * m_chunk, m_chunk, in PrepareGemmTasks()
85 PrepareGemmTask<Executor, Params>(params, kernel_m, kernel_n, kernel_k, in PrepareGemmTasks()
92 params, kernel_m, kernel_n, kernel_k, scratch, 0, params.m, in PrepareGemmTasks()
96 PrepareGemmTask<Executor, Params>(params, kernel_m, kernel_n, kernel_k, in PrepareGemmTasks()
104 template <typename Executor, typename Params, int kernel_m, int kernel_n,
110 Gemm<Executor, Params, kernel_m, kernel_n, kernel_k>(params); in Run()
119 int kernel_m, int kernel_n, int kernel_k>
[all …]
Dsingle_thread_gemm.h24 template <typename Executor, typename Params, int kernel_m, int kernel_n,
31 static int EstimateScratchSize(const P& params, int kernel_m, int kernel_n, in EstimateScratchSize() argument
35 params.left_stream, kernel_m, kernel_k); in EstimateScratchSize()
220 static int EstimateScratchSize(const P& params, int kernel_m, int kernel_n, in EstimateScratchSize() argument
222 const int lhs_chunks = ((params.m + kernel_m - 1) / kernel_m); in EstimateScratchSize()
226 params.left_stream, kernel_m, kernel_k); in EstimateScratchSize()
441 static int EstimateScratchSize(const P& params, int kernel_m, int kernel_n, in EstimateScratchSize() argument
490 static int EstimateScratchSize(const P& params, int kernel_m, int kernel_n, in EstimateScratchSize() argument
676 template <typename Executor, typename Params, int kernel_m, int kernel_n,
679 internal::Dispatch3DStage1<Executor, Params, kernel_m, kernel_n, kernel_k,
[all …]
Dbase.h101 typename OutputStream, int kernel_m, int kernel_n, int pack_size>
/external/gemmlowp/meta/generators/
Dquantized_mul_kernels_common.py53 def Prepare(self, emitter, registers, kernel_m, kernel_n, lhs, rhs): argument
58 lhs_offset = _ReadParams(emitter, registers, lhs, kernel_m, 4)
71 self.lhs_offsets = _Duplicate(emitter, registers, kernel_m, lhs_offset)
130 def Prepare(self, emitter, registers, kernel_m, kernel_n, lhs, rhs): argument
134 lhs_offset = _ReadParams(emitter, registers, lhs, kernel_m, 4)
136 self.lhs_offsets = _Duplicate(emitter, registers, kernel_m, lhs_offset)
162 def Prepare(self, emitter, registers, kernel_m, kernel_n, lhs, rhs): argument
166 lhs_offset = _ReadParams(emitter, registers, lhs, kernel_m, 4)
171 self.lhs_offsets = _Duplicate(emitter, registers, kernel_m, lhs_offset)
205 def Prepare(self, emitter, registers, kernel_m, unused_kernel_n, argument
[all …]
Dcommon.py94 def SpecializeMulKernel(self, in_type, out_type, kernel_m, kernel_n, argument
98 in_type, out_type, self.kernel_name, self.output_stream_name, kernel_m,
111 self.EmitMultiply(in_type, out_type, kernel_m, kernel_n, pack_size)