Searched refs:num_coeffs (Results 1 – 4 of 4) sorted by relevance
/external/eigen/unsupported/Eigen/CXX11/src/Tensor/ |
D | TensorReductionCuda.h | 125 __global__ void FullReductionKernel(Reducer reducer, const Self input, Index num_coeffs, in FullReductionKernel() argument 161 Index max_iter = numext::mini<Index>(num_coeffs - first_index, NumPerThread*BlockSize); in FullReductionKernel() 164 eigen_assert(index < num_coeffs); in FullReductionKernel() 191 …nInitFullReduxKernelHalfFloat(Reducer reducer, const Self input, Index num_coeffs, half2* scratch)… in ReductionInitFullReduxKernelHalfFloat() argument 194 if (num_coeffs % 2 != 0) { in ReductionInitFullReduxKernelHalfFloat() 195 half last = input.m_impl.coeff(num_coeffs-1); in ReductionInitFullReduxKernelHalfFloat() 204 __global__ void ReductionInitKernelHalfFloat(Reducer reducer, const Self input, Index num_coeffs, h… in ReductionInitKernelHalfFloat() argument 207 const Index num_packets = num_coeffs / 2; in ReductionInitKernelHalfFloat() 212 if (thread_id == 0 && num_coeffs % 2 != 0) { in ReductionInitKernelHalfFloat() 213 output[num_coeffs-1] = reducer.initialize(); in ReductionInitKernelHalfFloat() [all …]
|
D | TensorReduction.h | 223 const typename Self::Index num_coeffs = array_prod(self.m_impl.dimensions()); 224 *output = InnerMostDimReducer<Self, Op, Vectorizable>::reduce(self, 0, num_coeffs, reducer); 253 const Index num_coeffs = array_prod(self.m_impl.dimensions()); 254 if (num_coeffs == 0) { 263 num_coeffs, cost, device.numThreads()); 266 InnerMostDimReducer<Self, Op, Vectorizable>::reduce(self, 0, num_coeffs, reducer); 270 std::floor<Index>(static_cast<float>(num_coeffs) / num_threads); 271 const Index numblocks = blocksize > 0 ? num_coeffs / blocksize : 0; 272 eigen_assert(num_coeffs >= numblocks * blocksize); 282 if (numblocks * blocksize < num_coeffs) { [all …]
|
/external/mesa3d/src/gallium/auxiliary/gallivm/ |
D | lp_bld_arit.h | 311 unsigned num_coeffs);
|
D | lp_bld_arit.c | 3197 unsigned num_coeffs) in lp_build_polynomial() argument 3221 for (i = num_coeffs; i--; ) { in lp_build_polynomial()
|