Home
last modified time | relevance | path

Searched refs:grid_dim (Results 1 – 5 of 5) sorted by relevance

/external/tensorflow/tensorflow/core/kernels/
Dreduction_gpu_kernels.cu.h773 dim3 grid_dim(1,
778 grid_dim.y = std::min((int)grid_dim.y, TF_RED_WARPSIZE);
780 if (grid_dim.y > 2 && grid_dim.y < TF_RED_WARPSIZE) {
781 int log2 = Log2Floor(grid_dim.y);
782 grid_dim.y = 1 << log2;
785 if (grid_dim.y == 1) {
787 grid_dim, block_dim, 0, cu_stream, in, out,
794 sizeof(T) * extent_y * grid_dim.y)}),
797 grid_dim, block_dim, 0, cu_stream, in,
802 (grid_dim.y * extent_y + (TF_RED_WARPSIZE - 1)) / TF_RED_WARPSIZE, 1,
[all …]
/external/tensorflow/tensorflow/core/util/
Dgpu_kernel_helper.h100 Status GpuLaunchKernel(void (*function)(Ts...), dim3 grid_dim, dim3 block_dim, in GpuLaunchKernel() argument
110 auto result = cudaLaunchKernel(func_ptr, grid_dim, block_dim, arg_ptrs.data(), in GpuLaunchKernel()
116 hipLaunchKernelGGL(function, grid_dim, block_dim, shared_memory_size_bytes, in GpuLaunchKernel()
/external/mesa3d/src/gallium/drivers/llvmpipe/
Dlp_screen.c479 uint32_t *grid_dim = ret; in llvmpipe_get_compute_param() local
480 *grid_dim = 3; in llvmpipe_get_compute_param()
/external/tensorflow/tensorflow/compiler/xla/g3doc/
Dcustom_call.md78 const int64 grid_dim = 2048 / block_dim;
79 custom_call_kernel<<<grid_dim, block_dim,
/external/tensorflow/tensorflow/core/kernels/rnn/
Dlstm_ops_gpu.cu.cc248 const int grid_dim = in LSTMBlockCellFpropWithCUDA() local
250 TF_CHECK_OK(GpuLaunchKernel(concat_xh<T>, grid_dim, block_dim, 0, cu_stream, in LSTMBlockCellFpropWithCUDA()