Home
last modified time | relevance | path

Searched refs:num_coeffs (Results 1 – 4 of 4) sorted by relevance

/external/eigen/unsupported/Eigen/CXX11/src/Tensor/
DTensorReductionCuda.h125 __global__ void FullReductionKernel(Reducer reducer, const Self input, Index num_coeffs, in FullReductionKernel() argument
161 Index max_iter = numext::mini<Index>(num_coeffs - first_index, NumPerThread*BlockSize); in FullReductionKernel()
164 eigen_assert(index < num_coeffs); in FullReductionKernel()
191 …nInitFullReduxKernelHalfFloat(Reducer reducer, const Self input, Index num_coeffs, half2* scratch)… in ReductionInitFullReduxKernelHalfFloat() argument
194 if (num_coeffs % 2 != 0) { in ReductionInitFullReduxKernelHalfFloat()
195 half last = input.m_impl.coeff(num_coeffs-1); in ReductionInitFullReduxKernelHalfFloat()
204 __global__ void ReductionInitKernelHalfFloat(Reducer reducer, const Self input, Index num_coeffs, h… in ReductionInitKernelHalfFloat() argument
207 const Index num_packets = num_coeffs / 2; in ReductionInitKernelHalfFloat()
212 if (thread_id == 0 && num_coeffs % 2 != 0) { in ReductionInitKernelHalfFloat()
213 output[num_coeffs-1] = reducer.initialize(); in ReductionInitKernelHalfFloat()
[all …]
DTensorReduction.h223 const typename Self::Index num_coeffs = array_prod(self.m_impl.dimensions());
224 *output = InnerMostDimReducer<Self, Op, Vectorizable>::reduce(self, 0, num_coeffs, reducer);
253 const Index num_coeffs = array_prod(self.m_impl.dimensions());
254 if (num_coeffs == 0) {
263 num_coeffs, cost, device.numThreads());
266 InnerMostDimReducer<Self, Op, Vectorizable>::reduce(self, 0, num_coeffs, reducer);
270 std::floor<Index>(static_cast<float>(num_coeffs) / num_threads);
271 const Index numblocks = blocksize > 0 ? num_coeffs / blocksize : 0;
272 eigen_assert(num_coeffs >= numblocks * blocksize);
282 if (numblocks * blocksize < num_coeffs) {
[all …]
/external/mesa3d/src/gallium/auxiliary/gallivm/
Dlp_bld_arit.h311 unsigned num_coeffs);
Dlp_bld_arit.c3197 unsigned num_coeffs) in lp_build_polynomial() argument
3221 for (i = num_coeffs; i--; ) { in lp_build_polynomial()