Searched refs:packed_rhs (Results 1 – 5 of 5) sorted by relevance
/external/gemmlowp/internal/ |
D | single_thread_gemm.h | 117 PackedSideBlock<typename KernelFormat::Rhs> packed_rhs(Side::Rhs, allocator, in SingleThreadGemm() 127 PackRhs(&packed_rhs, rhs); in SingleThreadGemm() 139 PackRhs(&packed_rhs, rhs.block(0, c, depth, cs)); in SingleThreadGemm() 142 Compute(kernel, block_params, &packed_result, packed_lhs, packed_rhs, in SingleThreadGemm() 147 packed_lhs.sums_of_each_slice(), packed_rhs.sums_of_each_slice(), in SingleThreadGemm()
|
D | multi_thread_gemm.h | 453 packed_rhs(_packed_rhs), in GemmWithPackedRhsTask() 482 Compute(kernel, block_params, &packed_result, packed_lhs, packed_rhs, in Run() 489 packed_lhs.sums_of_each_slice(), packed_rhs.sums_of_each_slice(), in Run() 501 const PackedRhs packed_rhs; member 653 PackedSideBlock<typename KernelFormat::Rhs> packed_rhs(Side::Rhs, allocator, in MultiThreadGemm() 662 PackRhs(&packed_rhs, rhs.block(0, c, depth, cs)); in MultiThreadGemm() 680 new TaskType(context, kernel, lhs_block, packed_rhs, result, in MultiThreadGemm()
|
D | compute.h | 108 const PackedRhs& packed_rhs, int depth) { in Compute() argument 111 kernel, block_params, packed_result, packed_lhs, packed_rhs); in Compute()
|
/external/gemmlowp/meta/ |
D | single_thread_gemm.h | 115 std::uint8_t* packed_rhs = in ExecuteDispatch3D() local 120 std::uint8_t* packed_rhs_chunk = packed_rhs; in ExecuteDispatch3D() 165 packed_rhs_chunk = packed_rhs; in ExecuteDispatch3D() 197 packed_rhs_chunk = packed_rhs; in ExecuteDispatch3D() 301 std::uint8_t* packed_rhs = params.scratch; in ExecuteDispatch3D() local 349 reinterpret_cast<InType*>(packed_rhs)); in ExecuteDispatch3D() 356 reinterpret_cast<const InType*>(packed_rhs), in ExecuteDispatch3D() 365 reinterpret_cast<const InType*>(packed_rhs), in ExecuteDispatch3D() 381 reinterpret_cast<InType*>(packed_rhs)); in ExecuteDispatch3D() 388 reinterpret_cast<const InType*>(packed_rhs), in ExecuteDispatch3D() [all …]
|
/external/gemmlowp/doc/ |
D | design.md | 124 PackRhs(&packed_rhs, rhs.block(0, c, depth, cs)); 127 Compute(kernel, block_params, &packed_result, packed_lhs, packed_rhs); 130 UnpackResult(&result_block, packed_result, packed_lhs, packed_rhs, depth,
|