Home
last modified time | relevance | path

Searched refs:kCols (Results 1 – 21 of 21) sorted by relevance

/external/ruy/ruy/
Dpack_x86.h81 RUY_DCHECK_EQ((end_col - start_col) % Layout::kCols, 0);
82 RUY_DCHECK_EQ(start_col % Layout::kCols, 0);
84 Scalar zerobuf[Layout::kCols * Layout::kRows];
86 Layout::kCols * Layout::kRows * sizeof(Scalar));
88 block_col += Layout::kCols) {
94 static constexpr int block_col_mask = ~(Layout::kCols - 1); // High bits.
128 RUY_DCHECK_EQ((end_col - start_col) % Layout::kCols, 0);
129 RUY_DCHECK_EQ(start_col % Layout::kCols, 0);
131 Scalar zerobuf[Layout::kCols * Layout::kRows];
133 Layout::kCols * Layout::kRows * sizeof(Scalar));
[all …]
Dkernel.h109 static_assert(is_pot(LhsLayout::kCols), "");
111 static_assert(is_pot(RhsLayout::kCols), "");
120 RUY_DCHECK_LT(end_row, dst->layout.rows + LhsLayout::kCols);
121 RUY_DCHECK_EQ((end_row - start_row) % LhsLayout::kCols, 0);
124 RUY_DCHECK_LT(end_col, dst->layout.cols + RhsLayout::kCols);
125 RUY_DCHECK_EQ((end_col - start_col) % RhsLayout::kCols, 0);
129 for (int col = start_col; col < end_col; col += RhsLayout::kCols) {
130 int block_end_col = std::min(col + RhsLayout::kCols, end_col);
131 for (int row = start_row; row < end_row; row += LhsLayout::kCols) {
132 int block_end_row = std::min(row + LhsLayout::kCols, end_row);
[all …]
Dkernel_arm.h64 KernelParams8bit<LhsLayout::kCols, RhsLayout::kCols> params;
92 KernelParams8bit<LhsLayout::kCols, RhsLayout::kCols> params;
116 KernelParams8bit<LhsLayout::kCols, RhsLayout::kCols> params;
148 KernelParamsFloat<LhsLayout::kCols, RhsLayout::kCols> params;
197 KernelParamsFloat<LhsLayout::kCols, RhsLayout::kCols> params;
Dkernel_x86.h51 KernelParams8bit<LhsLayout::kCols, RhsLayout::kCols> params;
76 KernelParamsFloat<LhsLayout::kCols, RhsLayout::kCols> params;
102 KernelParams8bit<LhsLayout::kCols, RhsLayout::kCols> params;
127 KernelParamsFloat<LhsLayout::kCols, RhsLayout::kCols> params;
152 KernelParamsFloat<LhsLayout::kCols, RhsLayout::kCols> params;
177 KernelParams8bit<LhsLayout::kCols, RhsLayout::kCols> params;
Dperchannel_buffers_reallocation_test.cc81 static_assert(KernelType::LhsLayout::kCols == 16, ""); in TestPerChannelBuffersReallocation()
90 static_assert(KernelType::RhsLayout::kCols == 8, ""); in TestPerChannelBuffersReallocation()
Dpack_avx512.cc69 RUY_DCHECK_EQ(Layout::kCols, 16);
77 packed_ptr[Layout::kCols * Layout::kRows * k + j] = packed_zero_point;
108 RUY_DCHECK_EQ(Layout::kCols, 16);
643 RUY_DCHECK_EQ(kHalfBlockOffset * 2, Layout::kRows * Layout::kCols);
648 RUY_DCHECK_EQ(Layout::kCols, 16);
658 kNumRowChunks * Layout::kCols * Layout::kRows;
695 memcpy(packed_ptr + Layout::kCols * non_trailing_rows, trailing_buf,
696 Layout::kCols * trailing_rows * sizeof(std::int8_t));
Dmat.h468 static constexpr int kCols = tCols; member
476 ret.cols = FixedKernelLayout::kCols; in ToKernelLayout()
485 constexpr int FixedKernelLayout<tOrder, tRows, tCols>::kCols;
Dpack_avx2_fma.cc72 RUY_DCHECK_EQ(Layout::kCols, 8);
552 RUY_DCHECK_EQ(Layout::kCols, 8);
562 kNumRowChunks * Layout::kCols * Layout::kRows;
579 memcpy(packed_ptr + Layout::kCols * non_trailing_rows, trailing_buf,
580 Layout::kCols * trailing_rows * sizeof(std::int8_t));
Dpack.h113 RUY_DCHECK_EQ((end_col - start_col) % FixedKernelLayout::kCols, 0); in Run()
Dpack_avx.cc222 RUY_DCHECK_EQ(Layout::kCols, 8);
694 RUY_DCHECK_EQ(Layout::kCols, 8);
704 kNumRowChunks * Layout::kCols * Layout::kRows;
721 memcpy(packed_ptr + Layout::kCols * non_trailing_rows, trailing_buf,
722 Layout::kCols * trailing_rows * sizeof(std::int8_t));
Dtrace.h566 LhsKernelLayout::kRows, LhsKernelLayout::kCols, \
569 RhsKernelLayout::kRows, RhsKernelLayout::kCols, \
/external/gemmlowp/internal/
Dsimd_wrappers.h65 static constexpr int kCols = tCols; member
66 static constexpr int kScalarCount = kRows * kCols;
138 static constexpr int kCols =
139 Lhs::kCols > Rhs::kCols ? Lhs::kCols : Rhs::kCols;
146 using Type = RegisterBlock<ScalarType, Shape::kRows, Shape::kCols>;
156 static constexpr int Cols = ResultBlockType::kCols;
158 static constexpr int LhsCols = Lhs::kCols;
160 static constexpr int RhsCols = Rhs::kCols;
205 static constexpr int Cols = ResultBlockType::kCols;
207 static constexpr int LhsCols = Lhs::kCols;
[all …]
Dblock_params.h80 RoundUp<KernelFormat::kCols>(CeilQuotient(cols, min_l2_cols_blocks)); in FindL2BlockSizes()
113 assert(cols % KernelFormat::kCols == 0); in FindL1BlockSizes()
122 1, (l1_bytes_to_use - 4 * KernelFormat::kRows * KernelFormat::kCols) / in FindL1BlockSizes()
123 (KernelFormat::kRows + KernelFormat::kCols)); in FindL1BlockSizes()
Dkernel_reference.h52 std::int32_t accumulator[Format::kRows * Format::kCols]; in Run()
98 for (int c = 0; c < Format::kCols; c++) { in Run()
107 for (int c = 0; c < Format::kCols; c++) { in Run()
Dcompute.h84 start_row, start_col, Format::kRows, Format::kCols); in ComputeRun()
94 assert(cols % Format::kCols == 0); in ComputeL1()
97 for (int c = 0; c < cols; c += Format::kCols) { in ComputeL1()
Dkernel.h178 static constexpr int kCols = Rhs::Cell::kWidth * Rhs::kCells; member
Doutput.h46 static constexpr int kCols = InputType::kCols; member
52 using OutputType = RegisterBlock<OutputScalarType, kRows, kCols>;
/external/skia/gm/
Dlabyrinth.cpp39 constexpr static bool kCols[13][10] = { in draw_labyrinth() local
64 for (size_t x = 0; x < SK_ARRAY_COUNT(kCols); ++x) { in draw_labyrinth()
65 for (size_t y = 0; y < SK_ARRAY_COUNT(kCols[0]); ++y) { in draw_labyrinth()
66 if (kCols[x][y]) { in draw_labyrinth()
Dcomplexclip2.cpp45 fTotalWidth = kCols * fWidth + SK_Scalar1 * (kCols + 1) * kPadX; in ComplexClip2GM()
100 for (int j = 0; j < kCols; ++j) { in onOnceBeforeDraw()
109 static constexpr int kCols = 5; member in skiagm::ComplexClip2GM
152 for (int j = 0; j < kCols; ++j) { in onDraw()
206 SkClipOp fOps[kRows * kCols][5];
/external/skqp/gm/
Dcomplexclip2.cpp38 fTotalWidth = kCols * fWidth + SK_Scalar1 * (kCols + 1) * kPadX; in ComplexClip2GM()
97 for (int j = 0; j < kCols; ++j) { in onOnceBeforeDraw()
106 static constexpr int kCols = 5; member in skiagm::ComplexClip2GM
149 for (int j = 0; j < kCols; ++j) { in onDraw()
203 SkClipOp fOps[kRows * kCols][5];
/external/gemmlowp/standalone/
Dneon-gemm-kernel-benchmark.cc240 static const int kCols = Rhs::Cell::kWidth * Rhs::kCells; member