Home
last modified time | relevance | path

Searched refs:KernelFormat (Results 1 – 14 of 14) sorted by relevance

/external/gemmlowp/internal/
Dblock_params.h45 template <typename KernelFormat>
48 FindL2BlockSizes<KernelFormat>(rows, cols, depth, num_threads, in Init()
51 FindL1BlockSizes<KernelFormat>(l2_rows, l2_cols, l2_depth, l1_bytes_to_use, in Init()
55 template <typename KernelFormat>
65 std::max(1, RoundUp<KernelFormat::kRows>(rows) / num_threads); in FindL2BlockSizes()
80 RoundUp<KernelFormat::kCols>(CeilQuotient(cols, min_l2_cols_blocks)); in FindL2BlockSizes()
87 l2_rows = RoundUp<KernelFormat::kRows>(per_thread_rows); in FindL2BlockSizes()
94 l2_rows = RoundUp<KernelFormat::kRows>( in FindL2BlockSizes()
103 template <typename KernelFormat>
112 assert(rows % KernelFormat::kRows == 0); in FindL1BlockSizes()
[all …]
Dunpack.h89 template <typename KernelFormat, typename RegisterBlockType,
101 using KernelLhsInputScalar = typename KernelFormat::Lhs::InputScalar; in UnpackResultBlock()
102 using KernelLhsScalar = typename KernelFormat::Lhs::Scalar; in UnpackResultBlock()
103 using KernelRhsInputScalar = typename KernelFormat::Rhs::InputScalar; in UnpackResultBlock()
104 using KernelRhsScalar = typename KernelFormat::Rhs::Scalar; in UnpackResultBlock()
129 template <typename KernelFormat, typename ResultBlockType,
187 UnpackResultBlock<KernelFormat, Int32x8x4>( in UnpackResult()
200 UnpackResultBlock<KernelFormat, Int32x4x4>( in UnpackResult()
212 UnpackResultBlock<KernelFormat, Int32x1x4>( in UnpackResult()
229 UnpackResultBlock<KernelFormat, Int32x8x4>( in UnpackResult()
[all …]
Dkernel_neon.h35 typedef KernelFormat<KernelSideFormat<CellFormat<4, 2>, 3>,
295 typedef KernelFormat<
670 typedef KernelFormat<
932 typedef KernelFormat<
944 typedef KernelFormat<
1284 typedef KernelFormat<
1292 typedef KernelFormat<KernelSideFormat<CellFormat<4, 2>, 3>,
1666 typedef KernelFormat<KernelSideFormat<CellFormat<4, 4, CellOrder::WidthMajor>, 3>,
Dsingle_thread_gemm.h62 template <typename KernelFormat, typename InputScalar, typename OutputScalar,
92 block_params.Init<KernelFormat>( in SingleThreadGemm()
115 PackedSideBlock<typename KernelFormat::Lhs> packed_lhs(Side::Lhs, allocator, in SingleThreadGemm()
117 PackedSideBlock<typename KernelFormat::Rhs> packed_rhs(Side::Rhs, allocator, in SingleThreadGemm()
145 UnpackResult<KernelFormat>( in SingleThreadGemm()
Dmulti_thread_gemm.h462 template <typename KernelFormat, typename InputScalar, typename OutputScalar,
467 typedef PackedSideBlock<typename KernelFormat::Lhs> PackedLhs;
468 typedef PackedSideBlock<typename KernelFormat::Rhs> PackedRhs;
515 UnpackResult<KernelFormat>( in Run()
632 template <typename KernelFormat, typename InputScalar, typename OutputScalar,
658 const int thread_count = HowManyThreads<KernelFormat::kRows>( in MultiThreadGemm()
661 return SingleThreadGemm<KernelFormat, InputScalar, OutputScalar, in MultiThreadGemm()
677 block_params.Init<KernelFormat>( in MultiThreadGemm()
681 PackedSideBlock<typename KernelFormat::Rhs> packed_rhs(Side::Rhs, allocator, in MultiThreadGemm()
698 rows, RoundUp<KernelFormat::kRows>(rows * (n + 1) / task_count)); in MultiThreadGemm()
[all …]
Dkernel_sse.h33 typedef KernelFormat<
208 typedef KernelFormat<
Dkernel_msa.h45 typedef KernelFormat<KernelSideFormat<CellFormat<4, 2, CellOrder::WidthMajor>, 3>,
282 typedef KernelFormat<
Dkernel_avx.h32 typedef KernelFormat<KernelSideFormat<CellFormat<8, 2, CellOrder::WidthMajor>, 3>,
Dkernel_default.h104 typedef ReferenceKernel<KernelFormat<
Dkernel.h171 struct KernelFormat { struct
Dcompute.h32 typedef KernelFormat<KernelLhsFormat, KernelRhsFormat> Format;
/external/gemmlowp/standalone/
Dneon-gemm-kernel-benchmark.cc233 struct KernelFormat { struct
329 typedef KernelFormat<
518 typedef KernelFormat<
636 typedef KernelFormat<
882 typedef KernelFormat<
967 typedef KernelFormat<
1054 typedef KernelFormat<
1140 typedef KernelFormat<
1226 typedef KernelFormat<
1369 typedef KernelFormat<
[all …]
/external/gemmlowp/test/
Dtest.cc1613 ReferenceKernel<KernelFormat<KernelSideFormat<CellFormat<1, 1>, 1>, in TestKernels()
1618 ReferenceKernel<KernelFormat<KernelSideFormat<CellFormat<4, 2>, 1>, in TestKernels()
1623 ReferenceKernel<KernelFormat<KernelSideFormat<CellFormat<4, 2>, 4>, in TestKernels()
1627 test_gemm_kernel<ReferenceKernel<KernelFormat< in TestKernels()
1631 test_gemm_kernel<ReferenceKernel<KernelFormat< in TestKernels()
1635 test_gemm_kernel<ReferenceKernel<KernelFormat< in TestKernels()
1639 test_gemm_kernel<ReferenceKernel<KernelFormat< in TestKernels()
1643 test_gemm_kernel<ReferenceKernel<KernelFormat< in TestKernels()
1647 test_gemm_kernel<ReferenceKernel<KernelFormat< in TestKernels()
/external/gemmlowp/doc/
Dkernel.md37 typedef KernelFormat<KernelSideFormat<CellFormat<4, 2>, 3>,