Home
last modified time | relevance | path

Searched refs:CudaAtomicAdd (Results 1 – 15 of 15) sorted by relevance

/external/tensorflow/tensorflow/core/util/
Dcuda_device_functions.h486 __device__ detail::ToTypeIfConvertible<U, T> CudaAtomicAdd(T* ptr, U value) { in CudaAtomicAdd() function
490 __device__ inline Eigen::half CudaAtomicAdd(Eigen::half* ptr, in CudaAtomicAdd() function
498 __device__ inline double CudaAtomicAdd(double* ptr, double value) { in CudaAtomicAdd() function
505 __device__ inline double CudaAtomicAdd(double* ptr, double value) { in CudaAtomicAdd() function
520 __device__ inline std::complex<float> CudaAtomicAdd(std::complex<float>* ptr, in CudaAtomicAdd() function
523 return std::complex<float>(CudaAtomicAdd(ptr_scalar, value.real()), in CudaAtomicAdd()
524 CudaAtomicAdd(ptr_scalar + 1, value.imag())); in CudaAtomicAdd()
527 __device__ inline std::complex<double> CudaAtomicAdd( in CudaAtomicAdd() function
530 return std::complex<double>(CudaAtomicAdd(ptr_scalar, value.real()), in CudaAtomicAdd()
531 CudaAtomicAdd(ptr_scalar + 1, value.imag())); in CudaAtomicAdd()
[all …]
Dcuda_kernel_helper_test.cu.cc100 CudaAtomicAdd(failure_count, 1); in CudaShuffleGetSrcLaneTest()
/external/tensorflow/tensorflow/core/kernels/
Dresize_bilinear_op_gpu.cu.cc120 CudaAtomicAdd(output_grad + in ResizeBilinearGradKernel()
126 CudaAtomicAdd(output_grad + in ResizeBilinearGradKernel()
134 CudaAtomicAdd(output_grad + in ResizeBilinearGradKernel()
140 CudaAtomicAdd(output_grad + in ResizeBilinearGradKernel()
231 CudaAtomicAdd(output_grad + in LegacyResizeBilinearGradKernel()
237 CudaAtomicAdd(output_grad + in LegacyResizeBilinearGradKernel()
245 CudaAtomicAdd(output_grad + in LegacyResizeBilinearGradKernel()
251 CudaAtomicAdd(output_grad + in LegacyResizeBilinearGradKernel()
Dcrop_and_resize_op_gpu.cu.cc188 CudaAtomicAdd(grads_image_ptr + in CropAndResizeBackpropImageKernel()
194 CudaAtomicAdd(grads_image_ptr + in CropAndResizeBackpropImageKernel()
202 CudaAtomicAdd(grads_image_ptr + in CropAndResizeBackpropImageKernel()
208 CudaAtomicAdd(grads_image_ptr + in CropAndResizeBackpropImageKernel()
217 CudaAtomicAdd(grads_image_ptr + in CropAndResizeBackpropImageKernel()
336 CudaAtomicAdd(grads_boxes_ptr + b * 4 + 0, dy1); in CropAndResizeBackpropBoxesKernel()
337 CudaAtomicAdd(grads_boxes_ptr + b * 4 + 1, dx1); in CropAndResizeBackpropBoxesKernel()
338 CudaAtomicAdd(grads_boxes_ptr + b * 4 + 2, dy2); in CropAndResizeBackpropBoxesKernel()
339 CudaAtomicAdd(grads_boxes_ptr + b * 4 + 3, dx2); in CropAndResizeBackpropBoxesKernel()
Dbias_op_gpu.cu.cc106 CudaAtomicAdd(bias_backprop + bias_offset, ldg(output_backprop + index)); in BiasGradNHWC_Naive()
118 CudaAtomicAdd(bias_backprop + bias_offset, ldg(output_backprop + index)); in BiasGradNCHW_Naive()
138 CudaAtomicAdd(s_data + bias_offset, AccT(ldg(output_backprop + index))); in BiasGradNHWC_SharedAtomics()
143 CudaAtomicAdd(bias_backprop + index, T(s_data[index])); in BiasGradNHWC_SharedAtomics()
179 CudaAtomicAdd(s_data + bias_offset, sum); in BiasGradNCHW_SharedAtomics()
191 CudaAtomicAdd(bias_backprop + bias_index, T(data)); in BiasGradNCHW_SharedAtomics()
Dscatter_nd_op_gpu.cu.cc47 CudaAtomicAdd(out, val); in operator ()()
66 CudaAtomicAdd(ptr, val.real()); in operator ()()
67 CudaAtomicAdd(ptr, val.imag()); in operator ()()
Dsparse_tensor_dense_matmul_op_gpu.cu.cc50 CudaAtomicAdd(out_location, std::numeric_limits<T>::quiet_NaN()); in SparseTensorDenseMatMulKernel()
59 CudaAtomicAdd(out_location, a_value * b_value); in SparseTensorDenseMatMulKernel()
Dsegment_reduction_ops_gpu.cu.cc85 CudaAtomicAdd(output + output_index, sum); in SortedSegmentSumCustomKernel()
100 CudaAtomicAdd(output + output_index, sum); in SortedSegmentSumCustomKernel()
Dresize_nearest_neighbor_op_gpu.cu.cc122 CudaAtomicAdd(bottom_diff_n + idx, ldg(top_diff + index)); in ResizeNearestNeighborBackwardNHWC()
151 CudaAtomicAdd(bottom_diff_n + idx, ldg(top_diff + index)); in LegacyResizeNearestNeighborBackwardNHWC()
Dsegment_reduction_ops.h89 CudaAtomicAdd(dest, value); in operator()
Ddilation_ops_gpu.cu.cc120 CudaAtomicAdd( in DilationBackpropInputKernel()
169 CudaAtomicAdd( in DilationBackpropFilterKernel()
Dscatter_functor_gpu.cu.h44 __device__ void operator()(T* dest, T src) const { CudaAtomicAdd(dest, src); }
Dmaxpooling_op_gpu.cu.cc214 CudaAtomicAdd(bottom_diff + n * height * width * channels + maxidx, in MaxPoolBackwardNoMaskNHWC()
247 CudaAtomicAdd(bottom_diff + offset + mask[index], top_diff[index]); in MaxPoolBackward()
Ddepthwise_conv_op_gpu.h1096 CudaAtomicAdd(addr, partial_sum);
1127 CudaAtomicAdd(addr, partial_sum);
1308 CudaAtomicAdd(filter_offset + filter, static_cast<T>(val));
1384 CudaAtomicAdd(addr, partial_sum);
1416 CudaAtomicAdd(addr, partial_sum);
1576 CudaAtomicAdd(filter_offset + filter, static_cast<T>(val));
Dsvd_op_gpu.cu.cc69 CudaAtomicAdd(V + batch, v); in ComputeValueOfVKernel()