Home
last modified time | relevance | path

Searched refs:kThreadsPerBlock (Results 1 – 3 of 3) sorted by relevance

/external/tensorflow/tensorflow/core/kernels/
Dmaxpooling_op_gpu.cu.cc360 const int kThreadsPerBlock = 1024; in operator ()() local
365 (output_size + kThreadsPerBlock - 1) / kThreadsPerBlock, kThreadsPerBlock, in operator ()()
381 const int kThreadsPerBlock = 1024; in operator ()() local
387 (output_size + kThreadsPerBlock - 1) / kThreadsPerBlock, in operator ()()
388 kThreadsPerBlock, 0, d.stream(), output_size, in operator ()()
395 (output_size + kThreadsPerBlock - 1) / kThreadsPerBlock, in operator ()()
396 kThreadsPerBlock, 0, d.stream(), output_size, in operator ()()
410 const int kThreadsPerBlock = 1024; in operator ()() local
413 SetZero<T>, (input_size + kThreadsPerBlock - 1) / kThreadsPerBlock, in operator ()()
414 kThreadsPerBlock, 0, d.stream(), input_size, bottom_diff)); in operator ()()
[all …]
/external/tensorflow/tensorflow/core/util/
Dgpu_launch_config.h234 const int kThreadsPerBlock = 256; in GetGpu2DLaunchConfig() local
235 int block_cols = std::min(xdim, kThreadsPerBlock); in GetGpu2DLaunchConfig()
237 int block_rows = std::max(kThreadsPerBlock / block_cols, 1); in GetGpu2DLaunchConfig()
242 const int max_blocks = std::max(physical_thread_count / kThreadsPerBlock, 1); in GetGpu2DLaunchConfig()
/external/tensorflow/tensorflow/compiler/xla/service/gpu/
Dir_emitter_unnested.cc2950 const uint64 kThreadsPerBlock = kTileSize / 2; in EmitSortFromMlir() local
2963 kThreadsPerBlock > in EmitSortFromMlir()
2972 context.name, (no_tiling ? "won't" : "will"), kTileSize, kThreadsPerBlock, in EmitSortFromMlir()
2977 uint64 num_blocks = CeilOfRatio(num_iterations, kThreadsPerBlock); in EmitSortFromMlir()
2978 LaunchDimensions tiled_launch_dimensions(num_blocks, kThreadsPerBlock); in EmitSortFromMlir()
2980 context.name, num_blocks, kThreadsPerBlock); in EmitSortFromMlir()